{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 53003, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 3.1426775612822127e-09, "loss": 2.3284, "step": 1 }, { "epoch": 0.0, "learning_rate": 6.285355122564425e-09, "loss": 1.9229, "step": 2 }, { "epoch": 0.0, "learning_rate": 9.428032683846639e-09, "loss": 1.9701, "step": 3 }, { "epoch": 0.0, "learning_rate": 1.257071024512885e-08, "loss": 1.5306, "step": 4 }, { "epoch": 0.0, "learning_rate": 1.5713387806411064e-08, "loss": 2.2599, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.8856065367693278e-08, "loss": 3.0715, "step": 6 }, { "epoch": 0.0, "learning_rate": 2.1998742928975488e-08, "loss": 1.9998, "step": 7 }, { "epoch": 0.0, "learning_rate": 2.51414204902577e-08, "loss": 1.7711, "step": 8 }, { "epoch": 0.0, "learning_rate": 2.8284098051539915e-08, "loss": 1.8987, "step": 9 }, { "epoch": 0.0, "learning_rate": 3.142677561282213e-08, "loss": 1.8848, "step": 10 }, { "epoch": 0.0, "learning_rate": 3.456945317410434e-08, "loss": 2.1677, "step": 11 }, { "epoch": 0.0, "learning_rate": 3.7712130735386556e-08, "loss": 3.1555, "step": 12 }, { "epoch": 0.0, "learning_rate": 4.085480829666876e-08, "loss": 2.199, "step": 13 }, { "epoch": 0.0, "learning_rate": 4.3997485857950976e-08, "loss": 2.1254, "step": 14 }, { "epoch": 0.0, "learning_rate": 4.7140163419233186e-08, "loss": 2.262, "step": 15 }, { "epoch": 0.0, "learning_rate": 5.02828409805154e-08, "loss": 2.0558, "step": 16 }, { "epoch": 0.0, "learning_rate": 5.3425518541797613e-08, "loss": 1.7191, "step": 17 }, { "epoch": 0.0, "learning_rate": 5.656819610307983e-08, "loss": 2.1042, "step": 18 }, { "epoch": 0.0, "learning_rate": 5.971087366436203e-08, "loss": 2.7185, "step": 19 }, { "epoch": 0.0, "learning_rate": 6.285355122564426e-08, "loss": 2.1084, "step": 20 }, { "epoch": 0.0, "learning_rate": 6.599622878692647e-08, "loss": 1.7351, "step": 21 }, { "epoch": 0.0, "learning_rate": 6.913890634820868e-08, "loss": 2.0829, "step": 22 }, { "epoch": 0.0, "learning_rate": 7.228158390949089e-08, "loss": 1.5532, "step": 23 }, { "epoch": 0.0, "learning_rate": 7.542426147077311e-08, "loss": 2.1121, "step": 24 }, { "epoch": 0.0, "learning_rate": 7.856693903205531e-08, "loss": 3.2354, "step": 25 }, { "epoch": 0.0, "learning_rate": 8.170961659333752e-08, "loss": 2.0542, "step": 26 }, { "epoch": 0.0, "learning_rate": 8.485229415461976e-08, "loss": 2.2134, "step": 27 }, { "epoch": 0.0, "learning_rate": 8.799497171590195e-08, "loss": 2.084, "step": 28 }, { "epoch": 0.0, "learning_rate": 9.113764927718416e-08, "loss": 1.7523, "step": 29 }, { "epoch": 0.0, "learning_rate": 9.428032683846637e-08, "loss": 1.8601, "step": 30 }, { "epoch": 0.0, "learning_rate": 9.74230043997486e-08, "loss": 2.5544, "step": 31 }, { "epoch": 0.0, "learning_rate": 1.005656819610308e-07, "loss": 2.2145, "step": 32 }, { "epoch": 0.0, "learning_rate": 1.0370835952231302e-07, "loss": 1.7723, "step": 33 }, { "epoch": 0.0, "learning_rate": 1.0685103708359523e-07, "loss": 1.8213, "step": 34 }, { "epoch": 0.0, "learning_rate": 1.0999371464487745e-07, "loss": 1.67, "step": 35 }, { "epoch": 0.0, "learning_rate": 1.1313639220615966e-07, "loss": 1.8082, "step": 36 }, { "epoch": 0.0, "learning_rate": 1.1627906976744187e-07, "loss": 2.3624, "step": 37 }, { "epoch": 0.0, "learning_rate": 1.1942174732872407e-07, "loss": 2.3142, "step": 38 }, { "epoch": 0.0, "learning_rate": 1.225644248900063e-07, "loss": 1.9458, "step": 39 }, { "epoch": 0.0, "learning_rate": 1.2570710245128851e-07, "loss": 1.7742, "step": 40 }, { "epoch": 0.0, "learning_rate": 1.2884978001257073e-07, "loss": 1.6548, "step": 41 }, { "epoch": 0.0, "learning_rate": 1.3199245757385294e-07, "loss": 1.5028, "step": 42 }, { "epoch": 0.0, "learning_rate": 1.3513513513513515e-07, "loss": 1.8174, "step": 43 }, { "epoch": 0.0, "learning_rate": 1.3827781269641736e-07, "loss": 2.4834, "step": 44 }, { "epoch": 0.0, "learning_rate": 1.4142049025769957e-07, "loss": 1.9055, "step": 45 }, { "epoch": 0.0, "learning_rate": 1.4456316781898178e-07, "loss": 1.8129, "step": 46 }, { "epoch": 0.0, "learning_rate": 1.47705845380264e-07, "loss": 1.5329, "step": 47 }, { "epoch": 0.0, "learning_rate": 1.5084852294154622e-07, "loss": 1.7294, "step": 48 }, { "epoch": 0.0, "learning_rate": 1.5399120050282843e-07, "loss": 1.4347, "step": 49 }, { "epoch": 0.0, "learning_rate": 1.5713387806411062e-07, "loss": 2.0177, "step": 50 }, { "epoch": 0.0, "learning_rate": 1.6027655562539285e-07, "loss": 1.6119, "step": 51 }, { "epoch": 0.0, "learning_rate": 1.6341923318667504e-07, "loss": 1.5515, "step": 52 }, { "epoch": 0.0, "learning_rate": 1.6656191074795727e-07, "loss": 1.3372, "step": 53 }, { "epoch": 0.0, "learning_rate": 1.697045883092395e-07, "loss": 1.4161, "step": 54 }, { "epoch": 0.0, "learning_rate": 1.728472658705217e-07, "loss": 1.6285, "step": 55 }, { "epoch": 0.0, "learning_rate": 1.759899434318039e-07, "loss": 2.2935, "step": 56 }, { "epoch": 0.0, "learning_rate": 1.7913262099308614e-07, "loss": 1.7076, "step": 57 }, { "epoch": 0.0, "learning_rate": 1.8227529855436833e-07, "loss": 1.1895, "step": 58 }, { "epoch": 0.0, "learning_rate": 1.8541797611565056e-07, "loss": 1.4247, "step": 59 }, { "epoch": 0.0, "learning_rate": 1.8856065367693275e-07, "loss": 1.2524, "step": 60 }, { "epoch": 0.0, "learning_rate": 1.9170333123821498e-07, "loss": 1.4194, "step": 61 }, { "epoch": 0.0, "learning_rate": 1.948460087994972e-07, "loss": 1.7637, "step": 62 }, { "epoch": 0.0, "learning_rate": 1.979886863607794e-07, "loss": 1.7362, "step": 63 }, { "epoch": 0.0, "learning_rate": 2.011313639220616e-07, "loss": 1.5607, "step": 64 }, { "epoch": 0.0, "learning_rate": 2.042740414833438e-07, "loss": 1.1157, "step": 65 }, { "epoch": 0.0, "learning_rate": 2.0741671904462603e-07, "loss": 1.3258, "step": 66 }, { "epoch": 0.0, "learning_rate": 2.1055939660590827e-07, "loss": 1.5315, "step": 67 }, { "epoch": 0.0, "learning_rate": 2.1370207416719045e-07, "loss": 1.5536, "step": 68 }, { "epoch": 0.0, "learning_rate": 2.1684475172847266e-07, "loss": 1.6401, "step": 69 }, { "epoch": 0.0, "learning_rate": 2.199874292897549e-07, "loss": 1.3096, "step": 70 }, { "epoch": 0.0, "learning_rate": 2.2313010685103708e-07, "loss": 1.26, "step": 71 }, { "epoch": 0.0, "learning_rate": 2.2627278441231932e-07, "loss": 1.1534, "step": 72 }, { "epoch": 0.0, "learning_rate": 2.294154619736015e-07, "loss": 1.1215, "step": 73 }, { "epoch": 0.0, "learning_rate": 2.3255813953488374e-07, "loss": 1.3006, "step": 74 }, { "epoch": 0.0, "learning_rate": 2.3570081709616595e-07, "loss": 2.0072, "step": 75 }, { "epoch": 0.0, "learning_rate": 2.3884349465744814e-07, "loss": 1.2823, "step": 76 }, { "epoch": 0.0, "learning_rate": 2.4198617221873037e-07, "loss": 1.3381, "step": 77 }, { "epoch": 0.0, "learning_rate": 2.451288497800126e-07, "loss": 1.2105, "step": 78 }, { "epoch": 0.0, "learning_rate": 2.482715273412948e-07, "loss": 1.1254, "step": 79 }, { "epoch": 0.0, "learning_rate": 2.5141420490257703e-07, "loss": 1.6947, "step": 80 }, { "epoch": 0.0, "learning_rate": 2.545568824638592e-07, "loss": 1.9039, "step": 81 }, { "epoch": 0.0, "learning_rate": 2.5769956002514145e-07, "loss": 1.3438, "step": 82 }, { "epoch": 0.0, "learning_rate": 2.608422375864237e-07, "loss": 1.17, "step": 83 }, { "epoch": 0.0, "learning_rate": 2.6398491514770587e-07, "loss": 1.1388, "step": 84 }, { "epoch": 0.0, "learning_rate": 2.671275927089881e-07, "loss": 1.0967, "step": 85 }, { "epoch": 0.0, "learning_rate": 2.702702702702703e-07, "loss": 1.2397, "step": 86 }, { "epoch": 0.0, "learning_rate": 2.734129478315525e-07, "loss": 1.529, "step": 87 }, { "epoch": 0.0, "learning_rate": 2.765556253928347e-07, "loss": 1.1624, "step": 88 }, { "epoch": 0.0, "learning_rate": 2.796983029541169e-07, "loss": 1.4232, "step": 89 }, { "epoch": 0.0, "learning_rate": 2.8284098051539913e-07, "loss": 0.9879, "step": 90 }, { "epoch": 0.0, "learning_rate": 2.8598365807668137e-07, "loss": 1.261, "step": 91 }, { "epoch": 0.0, "learning_rate": 2.8912633563796355e-07, "loss": 1.2229, "step": 92 }, { "epoch": 0.0, "learning_rate": 2.922690131992458e-07, "loss": 1.6223, "step": 93 }, { "epoch": 0.0, "learning_rate": 2.95411690760528e-07, "loss": 1.6289, "step": 94 }, { "epoch": 0.0, "learning_rate": 2.985543683218102e-07, "loss": 1.3357, "step": 95 }, { "epoch": 0.0, "learning_rate": 3.0169704588309245e-07, "loss": 1.0081, "step": 96 }, { "epoch": 0.0, "learning_rate": 3.0483972344437463e-07, "loss": 1.2473, "step": 97 }, { "epoch": 0.0, "learning_rate": 3.0798240100565687e-07, "loss": 1.3545, "step": 98 }, { "epoch": 0.0, "learning_rate": 3.1112507856693905e-07, "loss": 1.271, "step": 99 }, { "epoch": 0.0, "learning_rate": 3.1426775612822123e-07, "loss": 1.9968, "step": 100 }, { "epoch": 0.0, "learning_rate": 3.1741043368950347e-07, "loss": 1.2684, "step": 101 }, { "epoch": 0.0, "learning_rate": 3.205531112507857e-07, "loss": 1.0969, "step": 102 }, { "epoch": 0.0, "learning_rate": 3.2369578881206794e-07, "loss": 1.2051, "step": 103 }, { "epoch": 0.0, "learning_rate": 3.268384663733501e-07, "loss": 1.1518, "step": 104 }, { "epoch": 0.0, "learning_rate": 3.299811439346323e-07, "loss": 1.3201, "step": 105 }, { "epoch": 0.0, "learning_rate": 3.3312382149591455e-07, "loss": 1.7745, "step": 106 }, { "epoch": 0.0, "learning_rate": 3.362664990571968e-07, "loss": 1.2182, "step": 107 }, { "epoch": 0.0, "learning_rate": 3.39409176618479e-07, "loss": 1.3018, "step": 108 }, { "epoch": 0.0, "learning_rate": 3.4255185417976115e-07, "loss": 1.1751, "step": 109 }, { "epoch": 0.0, "learning_rate": 3.456945317410434e-07, "loss": 1.2613, "step": 110 }, { "epoch": 0.0, "learning_rate": 3.488372093023256e-07, "loss": 1.1025, "step": 111 }, { "epoch": 0.0, "learning_rate": 3.519798868636078e-07, "loss": 1.2858, "step": 112 }, { "epoch": 0.0, "learning_rate": 3.5512256442489005e-07, "loss": 1.3763, "step": 113 }, { "epoch": 0.0, "learning_rate": 3.582652419861723e-07, "loss": 1.0487, "step": 114 }, { "epoch": 0.0, "learning_rate": 3.614079195474544e-07, "loss": 0.9884, "step": 115 }, { "epoch": 0.0, "learning_rate": 3.6455059710873665e-07, "loss": 1.2909, "step": 116 }, { "epoch": 0.0, "learning_rate": 3.676932746700189e-07, "loss": 1.1835, "step": 117 }, { "epoch": 0.0, "learning_rate": 3.708359522313011e-07, "loss": 1.3356, "step": 118 }, { "epoch": 0.0, "learning_rate": 3.7397862979258336e-07, "loss": 1.629, "step": 119 }, { "epoch": 0.0, "learning_rate": 3.771213073538655e-07, "loss": 1.1683, "step": 120 }, { "epoch": 0.0, "learning_rate": 3.8026398491514773e-07, "loss": 1.0308, "step": 121 }, { "epoch": 0.0, "learning_rate": 3.8340666247642996e-07, "loss": 1.0338, "step": 122 }, { "epoch": 0.0, "learning_rate": 3.865493400377122e-07, "loss": 1.0219, "step": 123 }, { "epoch": 0.0, "learning_rate": 3.896920175989944e-07, "loss": 1.2122, "step": 124 }, { "epoch": 0.0, "learning_rate": 3.9283469516027657e-07, "loss": 1.5852, "step": 125 }, { "epoch": 0.0, "learning_rate": 3.959773727215588e-07, "loss": 1.0768, "step": 126 }, { "epoch": 0.0, "learning_rate": 3.99120050282841e-07, "loss": 1.3674, "step": 127 }, { "epoch": 0.0, "learning_rate": 4.022627278441232e-07, "loss": 1.3527, "step": 128 }, { "epoch": 0.0, "learning_rate": 4.0540540540540546e-07, "loss": 0.9195, "step": 129 }, { "epoch": 0.0, "learning_rate": 4.085480829666876e-07, "loss": 1.2995, "step": 130 }, { "epoch": 0.0, "learning_rate": 4.1169076052796983e-07, "loss": 1.63, "step": 131 }, { "epoch": 0.0, "learning_rate": 4.1483343808925207e-07, "loss": 1.0869, "step": 132 }, { "epoch": 0.0, "learning_rate": 4.179761156505343e-07, "loss": 0.8753, "step": 133 }, { "epoch": 0.0, "learning_rate": 4.2111879321181654e-07, "loss": 1.1115, "step": 134 }, { "epoch": 0.0, "learning_rate": 4.242614707730987e-07, "loss": 0.9833, "step": 135 }, { "epoch": 0.0, "learning_rate": 4.274041483343809e-07, "loss": 1.2812, "step": 136 }, { "epoch": 0.0, "learning_rate": 4.3054682589566314e-07, "loss": 1.2772, "step": 137 }, { "epoch": 0.0, "learning_rate": 4.3368950345694533e-07, "loss": 1.1592, "step": 138 }, { "epoch": 0.0, "learning_rate": 4.3683218101822757e-07, "loss": 1.0361, "step": 139 }, { "epoch": 0.0, "learning_rate": 4.399748585795098e-07, "loss": 0.9494, "step": 140 }, { "epoch": 0.0, "learning_rate": 4.43117536140792e-07, "loss": 1.0978, "step": 141 }, { "epoch": 0.0, "learning_rate": 4.4626021370207417e-07, "loss": 1.0672, "step": 142 }, { "epoch": 0.0, "learning_rate": 4.494028912633564e-07, "loss": 1.5312, "step": 143 }, { "epoch": 0.0, "learning_rate": 4.5254556882463864e-07, "loss": 1.3782, "step": 144 }, { "epoch": 0.0, "learning_rate": 4.556882463859209e-07, "loss": 0.7325, "step": 145 }, { "epoch": 0.0, "learning_rate": 4.58830923947203e-07, "loss": 1.036, "step": 146 }, { "epoch": 0.0, "learning_rate": 4.6197360150848525e-07, "loss": 0.952, "step": 147 }, { "epoch": 0.0, "learning_rate": 4.651162790697675e-07, "loss": 0.983, "step": 148 }, { "epoch": 0.0, "learning_rate": 4.682589566310497e-07, "loss": 1.2439, "step": 149 }, { "epoch": 0.0, "learning_rate": 4.714016341923319e-07, "loss": 1.287, "step": 150 }, { "epoch": 0.0, "learning_rate": 4.7454431175361414e-07, "loss": 1.4391, "step": 151 }, { "epoch": 0.0, "learning_rate": 4.776869893148963e-07, "loss": 0.9108, "step": 152 }, { "epoch": 0.0, "learning_rate": 4.808296668761786e-07, "loss": 0.9745, "step": 153 }, { "epoch": 0.0, "learning_rate": 4.839723444374607e-07, "loss": 1.1494, "step": 154 }, { "epoch": 0.0, "learning_rate": 4.87115021998743e-07, "loss": 0.9468, "step": 155 }, { "epoch": 0.0, "learning_rate": 4.902576995600252e-07, "loss": 1.4968, "step": 156 }, { "epoch": 0.0, "learning_rate": 4.934003771213074e-07, "loss": 1.036, "step": 157 }, { "epoch": 0.0, "learning_rate": 4.965430546825896e-07, "loss": 0.8283, "step": 158 }, { "epoch": 0.0, "learning_rate": 4.996857322438718e-07, "loss": 0.9498, "step": 159 }, { "epoch": 0.0, "learning_rate": 5.028284098051541e-07, "loss": 1.0489, "step": 160 }, { "epoch": 0.0, "learning_rate": 5.059710873664362e-07, "loss": 1.0328, "step": 161 }, { "epoch": 0.0, "learning_rate": 5.091137649277184e-07, "loss": 1.3146, "step": 162 }, { "epoch": 0.0, "learning_rate": 5.122564424890006e-07, "loss": 0.9943, "step": 163 }, { "epoch": 0.0, "learning_rate": 5.153991200502829e-07, "loss": 1.1758, "step": 164 }, { "epoch": 0.0, "learning_rate": 5.185417976115651e-07, "loss": 1.0002, "step": 165 }, { "epoch": 0.0, "learning_rate": 5.216844751728474e-07, "loss": 0.973, "step": 166 }, { "epoch": 0.0, "learning_rate": 5.248271527341296e-07, "loss": 1.242, "step": 167 }, { "epoch": 0.0, "learning_rate": 5.279698302954117e-07, "loss": 1.2678, "step": 168 }, { "epoch": 0.0, "learning_rate": 5.311125078566939e-07, "loss": 1.1594, "step": 169 }, { "epoch": 0.0, "learning_rate": 5.342551854179762e-07, "loss": 0.8403, "step": 170 }, { "epoch": 0.0, "learning_rate": 5.373978629792584e-07, "loss": 1.0835, "step": 171 }, { "epoch": 0.0, "learning_rate": 5.405405405405406e-07, "loss": 1.0526, "step": 172 }, { "epoch": 0.0, "learning_rate": 5.436832181018228e-07, "loss": 1.1791, "step": 173 }, { "epoch": 0.0, "learning_rate": 5.46825895663105e-07, "loss": 1.2537, "step": 174 }, { "epoch": 0.0, "learning_rate": 5.499685732243872e-07, "loss": 1.4349, "step": 175 }, { "epoch": 0.0, "learning_rate": 5.531112507856694e-07, "loss": 1.2142, "step": 176 }, { "epoch": 0.0, "learning_rate": 5.562539283469517e-07, "loss": 1.193, "step": 177 }, { "epoch": 0.0, "learning_rate": 5.593966059082338e-07, "loss": 1.0875, "step": 178 }, { "epoch": 0.0, "learning_rate": 5.625392834695161e-07, "loss": 1.1252, "step": 179 }, { "epoch": 0.0, "learning_rate": 5.656819610307983e-07, "loss": 1.145, "step": 180 }, { "epoch": 0.0, "learning_rate": 5.688246385920806e-07, "loss": 1.5691, "step": 181 }, { "epoch": 0.0, "learning_rate": 5.719673161533627e-07, "loss": 1.1388, "step": 182 }, { "epoch": 0.0, "learning_rate": 5.751099937146449e-07, "loss": 0.9514, "step": 183 }, { "epoch": 0.0, "learning_rate": 5.782526712759271e-07, "loss": 1.2727, "step": 184 }, { "epoch": 0.0, "learning_rate": 5.813953488372094e-07, "loss": 1.0483, "step": 185 }, { "epoch": 0.0, "learning_rate": 5.845380263984916e-07, "loss": 1.0743, "step": 186 }, { "epoch": 0.0, "learning_rate": 5.876807039597738e-07, "loss": 1.2606, "step": 187 }, { "epoch": 0.0, "learning_rate": 5.90823381521056e-07, "loss": 1.2793, "step": 188 }, { "epoch": 0.0, "learning_rate": 5.939660590823381e-07, "loss": 0.8307, "step": 189 }, { "epoch": 0.0, "learning_rate": 5.971087366436204e-07, "loss": 1.142, "step": 190 }, { "epoch": 0.0, "learning_rate": 6.002514142049026e-07, "loss": 1.0215, "step": 191 }, { "epoch": 0.0, "learning_rate": 6.033940917661849e-07, "loss": 0.9888, "step": 192 }, { "epoch": 0.0, "learning_rate": 6.065367693274671e-07, "loss": 0.9916, "step": 193 }, { "epoch": 0.0, "learning_rate": 6.096794468887493e-07, "loss": 1.3304, "step": 194 }, { "epoch": 0.0, "learning_rate": 6.128221244500314e-07, "loss": 0.8751, "step": 195 }, { "epoch": 0.0, "learning_rate": 6.159648020113137e-07, "loss": 1.1221, "step": 196 }, { "epoch": 0.0, "learning_rate": 6.191074795725959e-07, "loss": 0.899, "step": 197 }, { "epoch": 0.0, "learning_rate": 6.222501571338781e-07, "loss": 1.1347, "step": 198 }, { "epoch": 0.0, "learning_rate": 6.253928346951603e-07, "loss": 1.2391, "step": 199 }, { "epoch": 0.0, "learning_rate": 6.285355122564425e-07, "loss": 1.3823, "step": 200 }, { "epoch": 0.0, "learning_rate": 6.316781898177248e-07, "loss": 1.186, "step": 201 }, { "epoch": 0.0, "learning_rate": 6.348208673790069e-07, "loss": 0.7866, "step": 202 }, { "epoch": 0.0, "learning_rate": 6.379635449402892e-07, "loss": 1.1498, "step": 203 }, { "epoch": 0.0, "learning_rate": 6.411062225015714e-07, "loss": 1.1234, "step": 204 }, { "epoch": 0.0, "learning_rate": 6.442489000628536e-07, "loss": 1.1131, "step": 205 }, { "epoch": 0.0, "learning_rate": 6.473915776241359e-07, "loss": 1.3056, "step": 206 }, { "epoch": 0.0, "learning_rate": 6.50534255185418e-07, "loss": 0.8256, "step": 207 }, { "epoch": 0.0, "learning_rate": 6.536769327467001e-07, "loss": 1.1061, "step": 208 }, { "epoch": 0.0, "learning_rate": 6.568196103079824e-07, "loss": 0.9729, "step": 209 }, { "epoch": 0.0, "learning_rate": 6.599622878692646e-07, "loss": 1.1805, "step": 210 }, { "epoch": 0.0, "learning_rate": 6.631049654305469e-07, "loss": 1.0167, "step": 211 }, { "epoch": 0.0, "learning_rate": 6.662476429918291e-07, "loss": 1.2101, "step": 212 }, { "epoch": 0.0, "learning_rate": 6.693903205531113e-07, "loss": 1.1053, "step": 213 }, { "epoch": 0.0, "learning_rate": 6.725329981143936e-07, "loss": 1.0325, "step": 214 }, { "epoch": 0.0, "learning_rate": 6.756756756756758e-07, "loss": 1.1042, "step": 215 }, { "epoch": 0.0, "learning_rate": 6.78818353236958e-07, "loss": 1.0911, "step": 216 }, { "epoch": 0.0, "learning_rate": 6.819610307982402e-07, "loss": 1.0399, "step": 217 }, { "epoch": 0.0, "learning_rate": 6.851037083595223e-07, "loss": 1.2097, "step": 218 }, { "epoch": 0.0, "learning_rate": 6.882463859208045e-07, "loss": 1.2649, "step": 219 }, { "epoch": 0.0, "learning_rate": 6.913890634820868e-07, "loss": 1.0072, "step": 220 }, { "epoch": 0.0, "learning_rate": 6.94531741043369e-07, "loss": 1.1851, "step": 221 }, { "epoch": 0.0, "learning_rate": 6.976744186046513e-07, "loss": 0.8771, "step": 222 }, { "epoch": 0.0, "learning_rate": 7.008170961659334e-07, "loss": 0.957, "step": 223 }, { "epoch": 0.0, "learning_rate": 7.039597737272156e-07, "loss": 1.1519, "step": 224 }, { "epoch": 0.0, "learning_rate": 7.071024512884979e-07, "loss": 1.3264, "step": 225 }, { "epoch": 0.0, "learning_rate": 7.102451288497801e-07, "loss": 1.0406, "step": 226 }, { "epoch": 0.0, "learning_rate": 7.133878064110624e-07, "loss": 0.9446, "step": 227 }, { "epoch": 0.0, "learning_rate": 7.165304839723446e-07, "loss": 0.9987, "step": 228 }, { "epoch": 0.0, "learning_rate": 7.196731615336266e-07, "loss": 1.0275, "step": 229 }, { "epoch": 0.0, "learning_rate": 7.228158390949088e-07, "loss": 1.3141, "step": 230 }, { "epoch": 0.0, "learning_rate": 7.259585166561911e-07, "loss": 1.5143, "step": 231 }, { "epoch": 0.0, "learning_rate": 7.291011942174733e-07, "loss": 0.8321, "step": 232 }, { "epoch": 0.0, "learning_rate": 7.322438717787556e-07, "loss": 0.953, "step": 233 }, { "epoch": 0.0, "learning_rate": 7.353865493400378e-07, "loss": 1.075, "step": 234 }, { "epoch": 0.0, "learning_rate": 7.3852922690132e-07, "loss": 1.199, "step": 235 }, { "epoch": 0.0, "learning_rate": 7.416719044626022e-07, "loss": 1.0882, "step": 236 }, { "epoch": 0.0, "learning_rate": 7.448145820238844e-07, "loss": 1.2022, "step": 237 }, { "epoch": 0.0, "learning_rate": 7.479572595851667e-07, "loss": 1.2401, "step": 238 }, { "epoch": 0.0, "learning_rate": 7.510999371464488e-07, "loss": 0.8079, "step": 239 }, { "epoch": 0.0, "learning_rate": 7.54242614707731e-07, "loss": 1.0872, "step": 240 }, { "epoch": 0.0, "learning_rate": 7.573852922690133e-07, "loss": 0.9564, "step": 241 }, { "epoch": 0.0, "learning_rate": 7.605279698302955e-07, "loss": 1.1395, "step": 242 }, { "epoch": 0.0, "learning_rate": 7.636706473915776e-07, "loss": 1.1041, "step": 243 }, { "epoch": 0.0, "learning_rate": 7.668133249528599e-07, "loss": 1.0516, "step": 244 }, { "epoch": 0.0, "learning_rate": 7.699560025141421e-07, "loss": 1.0565, "step": 245 }, { "epoch": 0.0, "learning_rate": 7.730986800754244e-07, "loss": 1.0716, "step": 246 }, { "epoch": 0.0, "learning_rate": 7.762413576367066e-07, "loss": 0.8914, "step": 247 }, { "epoch": 0.0, "learning_rate": 7.793840351979888e-07, "loss": 1.0396, "step": 248 }, { "epoch": 0.0, "learning_rate": 7.825267127592711e-07, "loss": 1.2782, "step": 249 }, { "epoch": 0.0, "learning_rate": 7.856693903205531e-07, "loss": 1.4081, "step": 250 }, { "epoch": 0.0, "learning_rate": 7.888120678818353e-07, "loss": 1.0736, "step": 251 }, { "epoch": 0.0, "learning_rate": 7.919547454431176e-07, "loss": 0.8242, "step": 252 }, { "epoch": 0.0, "learning_rate": 7.950974230043998e-07, "loss": 0.9595, "step": 253 }, { "epoch": 0.0, "learning_rate": 7.98240100565682e-07, "loss": 0.9561, "step": 254 }, { "epoch": 0.0, "learning_rate": 8.013827781269643e-07, "loss": 1.1061, "step": 255 }, { "epoch": 0.0, "learning_rate": 8.045254556882465e-07, "loss": 1.5353, "step": 256 }, { "epoch": 0.0, "learning_rate": 8.076681332495287e-07, "loss": 1.1865, "step": 257 }, { "epoch": 0.0, "learning_rate": 8.108108108108109e-07, "loss": 1.1501, "step": 258 }, { "epoch": 0.0, "learning_rate": 8.139534883720931e-07, "loss": 0.9708, "step": 259 }, { "epoch": 0.0, "learning_rate": 8.170961659333752e-07, "loss": 0.9094, "step": 260 }, { "epoch": 0.0, "learning_rate": 8.202388434946575e-07, "loss": 1.1132, "step": 261 }, { "epoch": 0.0, "learning_rate": 8.233815210559397e-07, "loss": 1.0897, "step": 262 }, { "epoch": 0.0, "learning_rate": 8.26524198617222e-07, "loss": 1.1045, "step": 263 }, { "epoch": 0.0, "learning_rate": 8.296668761785041e-07, "loss": 1.0447, "step": 264 }, { "epoch": 0.0, "learning_rate": 8.328095537397863e-07, "loss": 0.9625, "step": 265 }, { "epoch": 0.01, "learning_rate": 8.359522313010686e-07, "loss": 1.1235, "step": 266 }, { "epoch": 0.01, "learning_rate": 8.390949088623508e-07, "loss": 1.0155, "step": 267 }, { "epoch": 0.01, "learning_rate": 8.422375864236331e-07, "loss": 1.376, "step": 268 }, { "epoch": 0.01, "learning_rate": 8.453802639849153e-07, "loss": 1.3188, "step": 269 }, { "epoch": 0.01, "learning_rate": 8.485229415461974e-07, "loss": 0.9403, "step": 270 }, { "epoch": 0.01, "learning_rate": 8.516656191074796e-07, "loss": 1.0941, "step": 271 }, { "epoch": 0.01, "learning_rate": 8.548082966687618e-07, "loss": 0.9063, "step": 272 }, { "epoch": 0.01, "learning_rate": 8.57950974230044e-07, "loss": 1.0757, "step": 273 }, { "epoch": 0.01, "learning_rate": 8.610936517913263e-07, "loss": 1.1615, "step": 274 }, { "epoch": 0.01, "learning_rate": 8.642363293526085e-07, "loss": 1.2682, "step": 275 }, { "epoch": 0.01, "learning_rate": 8.673790069138907e-07, "loss": 0.9115, "step": 276 }, { "epoch": 0.01, "learning_rate": 8.705216844751729e-07, "loss": 0.8856, "step": 277 }, { "epoch": 0.01, "learning_rate": 8.736643620364551e-07, "loss": 0.9466, "step": 278 }, { "epoch": 0.01, "learning_rate": 8.768070395977374e-07, "loss": 1.1325, "step": 279 }, { "epoch": 0.01, "learning_rate": 8.799497171590196e-07, "loss": 1.1678, "step": 280 }, { "epoch": 0.01, "learning_rate": 8.830923947203018e-07, "loss": 1.2165, "step": 281 }, { "epoch": 0.01, "learning_rate": 8.86235072281584e-07, "loss": 0.8744, "step": 282 }, { "epoch": 0.01, "learning_rate": 8.893777498428662e-07, "loss": 1.0094, "step": 283 }, { "epoch": 0.01, "learning_rate": 8.925204274041483e-07, "loss": 1.106, "step": 284 }, { "epoch": 0.01, "learning_rate": 8.956631049654306e-07, "loss": 1.107, "step": 285 }, { "epoch": 0.01, "learning_rate": 8.988057825267128e-07, "loss": 1.1844, "step": 286 }, { "epoch": 0.01, "learning_rate": 9.019484600879951e-07, "loss": 1.1776, "step": 287 }, { "epoch": 0.01, "learning_rate": 9.050911376492773e-07, "loss": 1.3655, "step": 288 }, { "epoch": 0.01, "learning_rate": 9.082338152105595e-07, "loss": 0.847, "step": 289 }, { "epoch": 0.01, "learning_rate": 9.113764927718418e-07, "loss": 1.1498, "step": 290 }, { "epoch": 0.01, "learning_rate": 9.145191703331239e-07, "loss": 1.0636, "step": 291 }, { "epoch": 0.01, "learning_rate": 9.17661847894406e-07, "loss": 0.9299, "step": 292 }, { "epoch": 0.01, "learning_rate": 9.208045254556883e-07, "loss": 1.1753, "step": 293 }, { "epoch": 0.01, "learning_rate": 9.239472030169705e-07, "loss": 1.2192, "step": 294 }, { "epoch": 0.01, "learning_rate": 9.270898805782527e-07, "loss": 1.0001, "step": 295 }, { "epoch": 0.01, "learning_rate": 9.30232558139535e-07, "loss": 1.0437, "step": 296 }, { "epoch": 0.01, "learning_rate": 9.333752357008172e-07, "loss": 1.1469, "step": 297 }, { "epoch": 0.01, "learning_rate": 9.365179132620994e-07, "loss": 1.0261, "step": 298 }, { "epoch": 0.01, "learning_rate": 9.396605908233816e-07, "loss": 1.0095, "step": 299 }, { "epoch": 0.01, "learning_rate": 9.428032683846638e-07, "loss": 1.26, "step": 300 }, { "epoch": 0.01, "learning_rate": 9.459459459459461e-07, "loss": 0.8144, "step": 301 }, { "epoch": 0.01, "learning_rate": 9.490886235072283e-07, "loss": 0.8932, "step": 302 }, { "epoch": 0.01, "learning_rate": 9.522313010685104e-07, "loss": 0.9535, "step": 303 }, { "epoch": 0.01, "learning_rate": 9.553739786297925e-07, "loss": 1.0673, "step": 304 }, { "epoch": 0.01, "learning_rate": 9.585166561910748e-07, "loss": 1.2014, "step": 305 }, { "epoch": 0.01, "learning_rate": 9.616593337523571e-07, "loss": 1.4066, "step": 306 }, { "epoch": 0.01, "learning_rate": 9.648020113136392e-07, "loss": 0.9187, "step": 307 }, { "epoch": 0.01, "learning_rate": 9.679446888749215e-07, "loss": 0.9512, "step": 308 }, { "epoch": 0.01, "learning_rate": 9.710873664362038e-07, "loss": 0.7672, "step": 309 }, { "epoch": 0.01, "learning_rate": 9.74230043997486e-07, "loss": 1.1479, "step": 310 }, { "epoch": 0.01, "learning_rate": 9.773727215587681e-07, "loss": 1.1672, "step": 311 }, { "epoch": 0.01, "learning_rate": 9.805153991200504e-07, "loss": 1.2704, "step": 312 }, { "epoch": 0.01, "learning_rate": 9.836580766813325e-07, "loss": 1.3102, "step": 313 }, { "epoch": 0.01, "learning_rate": 9.868007542426148e-07, "loss": 0.7455, "step": 314 }, { "epoch": 0.01, "learning_rate": 9.899434318038969e-07, "loss": 0.9101, "step": 315 }, { "epoch": 0.01, "learning_rate": 9.930861093651792e-07, "loss": 1.1035, "step": 316 }, { "epoch": 0.01, "learning_rate": 9.962287869264615e-07, "loss": 1.1301, "step": 317 }, { "epoch": 0.01, "learning_rate": 9.993714644877435e-07, "loss": 1.3669, "step": 318 }, { "epoch": 0.01, "learning_rate": 1.0025141420490258e-06, "loss": 1.1868, "step": 319 }, { "epoch": 0.01, "learning_rate": 1.0056568196103081e-06, "loss": 1.1357, "step": 320 }, { "epoch": 0.01, "learning_rate": 1.0087994971715904e-06, "loss": 0.9201, "step": 321 }, { "epoch": 0.01, "learning_rate": 1.0119421747328725e-06, "loss": 1.097, "step": 322 }, { "epoch": 0.01, "learning_rate": 1.0150848522941548e-06, "loss": 0.8192, "step": 323 }, { "epoch": 0.01, "learning_rate": 1.0182275298554369e-06, "loss": 1.1199, "step": 324 }, { "epoch": 0.01, "learning_rate": 1.0213702074167191e-06, "loss": 1.3755, "step": 325 }, { "epoch": 0.01, "learning_rate": 1.0245128849780012e-06, "loss": 1.1584, "step": 326 }, { "epoch": 0.01, "learning_rate": 1.0276555625392835e-06, "loss": 0.8633, "step": 327 }, { "epoch": 0.01, "learning_rate": 1.0307982401005658e-06, "loss": 1.0121, "step": 328 }, { "epoch": 0.01, "learning_rate": 1.0339409176618479e-06, "loss": 1.0696, "step": 329 }, { "epoch": 0.01, "learning_rate": 1.0370835952231302e-06, "loss": 0.9875, "step": 330 }, { "epoch": 0.01, "learning_rate": 1.0402262727844125e-06, "loss": 1.2487, "step": 331 }, { "epoch": 0.01, "learning_rate": 1.0433689503456947e-06, "loss": 1.1157, "step": 332 }, { "epoch": 0.01, "learning_rate": 1.0465116279069768e-06, "loss": 0.8723, "step": 333 }, { "epoch": 0.01, "learning_rate": 1.0496543054682591e-06, "loss": 1.0724, "step": 334 }, { "epoch": 0.01, "learning_rate": 1.0527969830295412e-06, "loss": 0.8437, "step": 335 }, { "epoch": 0.01, "learning_rate": 1.0559396605908235e-06, "loss": 0.9606, "step": 336 }, { "epoch": 0.01, "learning_rate": 1.0590823381521056e-06, "loss": 1.0601, "step": 337 }, { "epoch": 0.01, "learning_rate": 1.0622250157133878e-06, "loss": 1.1794, "step": 338 }, { "epoch": 0.01, "learning_rate": 1.0653676932746701e-06, "loss": 1.1051, "step": 339 }, { "epoch": 0.01, "learning_rate": 1.0685103708359524e-06, "loss": 0.7155, "step": 340 }, { "epoch": 0.01, "learning_rate": 1.0716530483972345e-06, "loss": 0.9702, "step": 341 }, { "epoch": 0.01, "learning_rate": 1.0747957259585168e-06, "loss": 1.0217, "step": 342 }, { "epoch": 0.01, "learning_rate": 1.077938403519799e-06, "loss": 1.2588, "step": 343 }, { "epoch": 0.01, "learning_rate": 1.0810810810810812e-06, "loss": 1.435, "step": 344 }, { "epoch": 0.01, "learning_rate": 1.0842237586423632e-06, "loss": 0.991, "step": 345 }, { "epoch": 0.01, "learning_rate": 1.0873664362036455e-06, "loss": 0.9688, "step": 346 }, { "epoch": 0.01, "learning_rate": 1.0905091137649278e-06, "loss": 0.8723, "step": 347 }, { "epoch": 0.01, "learning_rate": 1.09365179132621e-06, "loss": 1.0305, "step": 348 }, { "epoch": 0.01, "learning_rate": 1.0967944688874922e-06, "loss": 1.2754, "step": 349 }, { "epoch": 0.01, "learning_rate": 1.0999371464487745e-06, "loss": 1.3209, "step": 350 }, { "epoch": 0.01, "learning_rate": 1.1030798240100568e-06, "loss": 0.9902, "step": 351 }, { "epoch": 0.01, "learning_rate": 1.1062225015713388e-06, "loss": 0.9008, "step": 352 }, { "epoch": 0.01, "learning_rate": 1.1093651791326211e-06, "loss": 1.0521, "step": 353 }, { "epoch": 0.01, "learning_rate": 1.1125078566939034e-06, "loss": 0.9803, "step": 354 }, { "epoch": 0.01, "learning_rate": 1.1156505342551855e-06, "loss": 1.0416, "step": 355 }, { "epoch": 0.01, "learning_rate": 1.1187932118164676e-06, "loss": 1.1812, "step": 356 }, { "epoch": 0.01, "learning_rate": 1.1219358893777499e-06, "loss": 1.053, "step": 357 }, { "epoch": 0.01, "learning_rate": 1.1250785669390322e-06, "loss": 1.1126, "step": 358 }, { "epoch": 0.01, "learning_rate": 1.1282212445003142e-06, "loss": 0.8972, "step": 359 }, { "epoch": 0.01, "learning_rate": 1.1313639220615965e-06, "loss": 1.0707, "step": 360 }, { "epoch": 0.01, "learning_rate": 1.1345065996228788e-06, "loss": 1.1063, "step": 361 }, { "epoch": 0.01, "learning_rate": 1.1376492771841611e-06, "loss": 1.2633, "step": 362 }, { "epoch": 0.01, "learning_rate": 1.1407919547454432e-06, "loss": 1.2527, "step": 363 }, { "epoch": 0.01, "learning_rate": 1.1439346323067255e-06, "loss": 1.0457, "step": 364 }, { "epoch": 0.01, "learning_rate": 1.1470773098680078e-06, "loss": 0.8333, "step": 365 }, { "epoch": 0.01, "learning_rate": 1.1502199874292898e-06, "loss": 1.0469, "step": 366 }, { "epoch": 0.01, "learning_rate": 1.153362664990572e-06, "loss": 1.037, "step": 367 }, { "epoch": 0.01, "learning_rate": 1.1565053425518542e-06, "loss": 1.2899, "step": 368 }, { "epoch": 0.01, "learning_rate": 1.1596480201131365e-06, "loss": 1.1546, "step": 369 }, { "epoch": 0.01, "learning_rate": 1.1627906976744188e-06, "loss": 0.9126, "step": 370 }, { "epoch": 0.01, "learning_rate": 1.1659333752357009e-06, "loss": 1.1072, "step": 371 }, { "epoch": 0.01, "learning_rate": 1.1690760527969832e-06, "loss": 1.0463, "step": 372 }, { "epoch": 0.01, "learning_rate": 1.1722187303582654e-06, "loss": 1.0348, "step": 373 }, { "epoch": 0.01, "learning_rate": 1.1753614079195475e-06, "loss": 1.1201, "step": 374 }, { "epoch": 0.01, "learning_rate": 1.1785040854808298e-06, "loss": 1.3018, "step": 375 }, { "epoch": 0.01, "learning_rate": 1.181646763042112e-06, "loss": 0.728, "step": 376 }, { "epoch": 0.01, "learning_rate": 1.1847894406033942e-06, "loss": 1.0641, "step": 377 }, { "epoch": 0.01, "learning_rate": 1.1879321181646763e-06, "loss": 1.0741, "step": 378 }, { "epoch": 0.01, "learning_rate": 1.1910747957259585e-06, "loss": 1.1164, "step": 379 }, { "epoch": 0.01, "learning_rate": 1.1942174732872408e-06, "loss": 1.0132, "step": 380 }, { "epoch": 0.01, "learning_rate": 1.1973601508485231e-06, "loss": 1.0197, "step": 381 }, { "epoch": 0.01, "learning_rate": 1.2005028284098052e-06, "loss": 1.0652, "step": 382 }, { "epoch": 0.01, "learning_rate": 1.2036455059710875e-06, "loss": 0.8959, "step": 383 }, { "epoch": 0.01, "learning_rate": 1.2067881835323698e-06, "loss": 0.9656, "step": 384 }, { "epoch": 0.01, "learning_rate": 1.2099308610936519e-06, "loss": 0.8596, "step": 385 }, { "epoch": 0.01, "learning_rate": 1.2130735386549342e-06, "loss": 1.0183, "step": 386 }, { "epoch": 0.01, "learning_rate": 1.2162162162162164e-06, "loss": 1.2219, "step": 387 }, { "epoch": 0.01, "learning_rate": 1.2193588937774985e-06, "loss": 1.1544, "step": 388 }, { "epoch": 0.01, "learning_rate": 1.2225015713387806e-06, "loss": 0.9466, "step": 389 }, { "epoch": 0.01, "learning_rate": 1.2256442489000629e-06, "loss": 1.0965, "step": 390 }, { "epoch": 0.01, "learning_rate": 1.2287869264613452e-06, "loss": 0.9296, "step": 391 }, { "epoch": 0.01, "learning_rate": 1.2319296040226275e-06, "loss": 0.9231, "step": 392 }, { "epoch": 0.01, "learning_rate": 1.2350722815839095e-06, "loss": 1.2695, "step": 393 }, { "epoch": 0.01, "learning_rate": 1.2382149591451918e-06, "loss": 1.2365, "step": 394 }, { "epoch": 0.01, "learning_rate": 1.2413576367064741e-06, "loss": 0.9838, "step": 395 }, { "epoch": 0.01, "learning_rate": 1.2445003142677562e-06, "loss": 0.9519, "step": 396 }, { "epoch": 0.01, "learning_rate": 1.2476429918290385e-06, "loss": 1.1915, "step": 397 }, { "epoch": 0.01, "learning_rate": 1.2507856693903206e-06, "loss": 0.985, "step": 398 }, { "epoch": 0.01, "learning_rate": 1.2539283469516029e-06, "loss": 1.1884, "step": 399 }, { "epoch": 0.01, "learning_rate": 1.257071024512885e-06, "loss": 1.0864, "step": 400 }, { "epoch": 0.01, "learning_rate": 1.2602137020741672e-06, "loss": 1.0644, "step": 401 }, { "epoch": 0.01, "learning_rate": 1.2633563796354495e-06, "loss": 1.0206, "step": 402 }, { "epoch": 0.01, "learning_rate": 1.2664990571967318e-06, "loss": 0.8168, "step": 403 }, { "epoch": 0.01, "learning_rate": 1.2696417347580139e-06, "loss": 0.9284, "step": 404 }, { "epoch": 0.01, "learning_rate": 1.2727844123192962e-06, "loss": 1.0291, "step": 405 }, { "epoch": 0.01, "learning_rate": 1.2759270898805785e-06, "loss": 1.2677, "step": 406 }, { "epoch": 0.01, "learning_rate": 1.2790697674418605e-06, "loss": 0.9496, "step": 407 }, { "epoch": 0.01, "learning_rate": 1.2822124450031428e-06, "loss": 1.1033, "step": 408 }, { "epoch": 0.01, "learning_rate": 1.2853551225644251e-06, "loss": 1.0405, "step": 409 }, { "epoch": 0.01, "learning_rate": 1.2884978001257072e-06, "loss": 1.0938, "step": 410 }, { "epoch": 0.01, "learning_rate": 1.2916404776869895e-06, "loss": 0.9844, "step": 411 }, { "epoch": 0.01, "learning_rate": 1.2947831552482718e-06, "loss": 1.1768, "step": 412 }, { "epoch": 0.01, "learning_rate": 1.297925832809554e-06, "loss": 1.3477, "step": 413 }, { "epoch": 0.01, "learning_rate": 1.301068510370836e-06, "loss": 0.8732, "step": 414 }, { "epoch": 0.01, "learning_rate": 1.3042111879321182e-06, "loss": 1.0511, "step": 415 }, { "epoch": 0.01, "learning_rate": 1.3073538654934003e-06, "loss": 1.0289, "step": 416 }, { "epoch": 0.01, "learning_rate": 1.3104965430546826e-06, "loss": 1.0926, "step": 417 }, { "epoch": 0.01, "learning_rate": 1.3136392206159649e-06, "loss": 1.2729, "step": 418 }, { "epoch": 0.01, "learning_rate": 1.316781898177247e-06, "loss": 1.2509, "step": 419 }, { "epoch": 0.01, "learning_rate": 1.3199245757385292e-06, "loss": 0.9243, "step": 420 }, { "epoch": 0.01, "learning_rate": 1.3230672532998115e-06, "loss": 0.9653, "step": 421 }, { "epoch": 0.01, "learning_rate": 1.3262099308610938e-06, "loss": 0.9189, "step": 422 }, { "epoch": 0.01, "learning_rate": 1.329352608422376e-06, "loss": 0.9479, "step": 423 }, { "epoch": 0.01, "learning_rate": 1.3324952859836582e-06, "loss": 1.2134, "step": 424 }, { "epoch": 0.01, "learning_rate": 1.3356379635449405e-06, "loss": 1.3234, "step": 425 }, { "epoch": 0.01, "learning_rate": 1.3387806411062226e-06, "loss": 1.0065, "step": 426 }, { "epoch": 0.01, "learning_rate": 1.3419233186675049e-06, "loss": 1.0598, "step": 427 }, { "epoch": 0.01, "learning_rate": 1.3450659962287871e-06, "loss": 1.0137, "step": 428 }, { "epoch": 0.01, "learning_rate": 1.3482086737900692e-06, "loss": 1.1537, "step": 429 }, { "epoch": 0.01, "learning_rate": 1.3513513513513515e-06, "loss": 1.0417, "step": 430 }, { "epoch": 0.01, "learning_rate": 1.3544940289126338e-06, "loss": 1.3404, "step": 431 }, { "epoch": 0.01, "learning_rate": 1.357636706473916e-06, "loss": 1.0185, "step": 432 }, { "epoch": 0.01, "learning_rate": 1.3607793840351982e-06, "loss": 0.9529, "step": 433 }, { "epoch": 0.01, "learning_rate": 1.3639220615964805e-06, "loss": 1.2417, "step": 434 }, { "epoch": 0.01, "learning_rate": 1.3670647391577623e-06, "loss": 1.0063, "step": 435 }, { "epoch": 0.01, "learning_rate": 1.3702074167190446e-06, "loss": 1.2356, "step": 436 }, { "epoch": 0.01, "learning_rate": 1.373350094280327e-06, "loss": 1.2774, "step": 437 }, { "epoch": 0.01, "learning_rate": 1.376492771841609e-06, "loss": 0.9954, "step": 438 }, { "epoch": 0.01, "learning_rate": 1.3796354494028913e-06, "loss": 0.9868, "step": 439 }, { "epoch": 0.01, "learning_rate": 1.3827781269641736e-06, "loss": 0.8532, "step": 440 }, { "epoch": 0.01, "learning_rate": 1.3859208045254558e-06, "loss": 1.1603, "step": 441 }, { "epoch": 0.01, "learning_rate": 1.389063482086738e-06, "loss": 1.0952, "step": 442 }, { "epoch": 0.01, "learning_rate": 1.3922061596480202e-06, "loss": 1.2966, "step": 443 }, { "epoch": 0.01, "learning_rate": 1.3953488372093025e-06, "loss": 1.0761, "step": 444 }, { "epoch": 0.01, "learning_rate": 1.3984915147705846e-06, "loss": 0.9885, "step": 445 }, { "epoch": 0.01, "learning_rate": 1.4016341923318669e-06, "loss": 1.0132, "step": 446 }, { "epoch": 0.01, "learning_rate": 1.4047768698931492e-06, "loss": 0.9469, "step": 447 }, { "epoch": 0.01, "learning_rate": 1.4079195474544312e-06, "loss": 0.8172, "step": 448 }, { "epoch": 0.01, "learning_rate": 1.4110622250157135e-06, "loss": 1.1594, "step": 449 }, { "epoch": 0.01, "learning_rate": 1.4142049025769958e-06, "loss": 1.2166, "step": 450 }, { "epoch": 0.01, "learning_rate": 1.417347580138278e-06, "loss": 0.7927, "step": 451 }, { "epoch": 0.01, "learning_rate": 1.4204902576995602e-06, "loss": 0.9977, "step": 452 }, { "epoch": 0.01, "learning_rate": 1.4236329352608425e-06, "loss": 0.7762, "step": 453 }, { "epoch": 0.01, "learning_rate": 1.4267756128221248e-06, "loss": 1.1874, "step": 454 }, { "epoch": 0.01, "learning_rate": 1.4299182903834068e-06, "loss": 1.1651, "step": 455 }, { "epoch": 0.01, "learning_rate": 1.4330609679446891e-06, "loss": 1.1315, "step": 456 }, { "epoch": 0.01, "learning_rate": 1.436203645505971e-06, "loss": 1.0989, "step": 457 }, { "epoch": 0.01, "learning_rate": 1.4393463230672533e-06, "loss": 0.9451, "step": 458 }, { "epoch": 0.01, "learning_rate": 1.4424890006285356e-06, "loss": 0.7952, "step": 459 }, { "epoch": 0.01, "learning_rate": 1.4456316781898177e-06, "loss": 1.1453, "step": 460 }, { "epoch": 0.01, "learning_rate": 1.4487743557511e-06, "loss": 1.1293, "step": 461 }, { "epoch": 0.01, "learning_rate": 1.4519170333123822e-06, "loss": 1.3759, "step": 462 }, { "epoch": 0.01, "learning_rate": 1.4550597108736645e-06, "loss": 1.1156, "step": 463 }, { "epoch": 0.01, "learning_rate": 1.4582023884349466e-06, "loss": 0.9363, "step": 464 }, { "epoch": 0.01, "learning_rate": 1.4613450659962289e-06, "loss": 0.8957, "step": 465 }, { "epoch": 0.01, "learning_rate": 1.4644877435575112e-06, "loss": 1.0707, "step": 466 }, { "epoch": 0.01, "learning_rate": 1.4676304211187933e-06, "loss": 0.9711, "step": 467 }, { "epoch": 0.01, "learning_rate": 1.4707730986800755e-06, "loss": 1.0406, "step": 468 }, { "epoch": 0.01, "learning_rate": 1.4739157762413578e-06, "loss": 1.2401, "step": 469 }, { "epoch": 0.01, "learning_rate": 1.47705845380264e-06, "loss": 0.9653, "step": 470 }, { "epoch": 0.01, "learning_rate": 1.4802011313639222e-06, "loss": 1.117, "step": 471 }, { "epoch": 0.01, "learning_rate": 1.4833438089252045e-06, "loss": 0.9932, "step": 472 }, { "epoch": 0.01, "learning_rate": 1.4864864864864868e-06, "loss": 1.0819, "step": 473 }, { "epoch": 0.01, "learning_rate": 1.4896291640477689e-06, "loss": 1.2016, "step": 474 }, { "epoch": 0.01, "learning_rate": 1.4927718416090512e-06, "loss": 1.5007, "step": 475 }, { "epoch": 0.01, "learning_rate": 1.4959145191703334e-06, "loss": 1.2375, "step": 476 }, { "epoch": 0.01, "learning_rate": 1.4990571967316155e-06, "loss": 0.8979, "step": 477 }, { "epoch": 0.01, "learning_rate": 1.5021998742928976e-06, "loss": 0.9486, "step": 478 }, { "epoch": 0.01, "learning_rate": 1.5053425518541797e-06, "loss": 1.0073, "step": 479 }, { "epoch": 0.01, "learning_rate": 1.508485229415462e-06, "loss": 1.0963, "step": 480 }, { "epoch": 0.01, "learning_rate": 1.5116279069767443e-06, "loss": 1.0458, "step": 481 }, { "epoch": 0.01, "learning_rate": 1.5147705845380265e-06, "loss": 0.9541, "step": 482 }, { "epoch": 0.01, "learning_rate": 1.5179132620993086e-06, "loss": 0.9683, "step": 483 }, { "epoch": 0.01, "learning_rate": 1.521055939660591e-06, "loss": 1.0309, "step": 484 }, { "epoch": 0.01, "learning_rate": 1.5241986172218732e-06, "loss": 0.8259, "step": 485 }, { "epoch": 0.01, "learning_rate": 1.5273412947831553e-06, "loss": 1.1042, "step": 486 }, { "epoch": 0.01, "learning_rate": 1.5304839723444376e-06, "loss": 1.325, "step": 487 }, { "epoch": 0.01, "learning_rate": 1.5336266499057199e-06, "loss": 1.2197, "step": 488 }, { "epoch": 0.01, "learning_rate": 1.536769327467002e-06, "loss": 0.9478, "step": 489 }, { "epoch": 0.01, "learning_rate": 1.5399120050282842e-06, "loss": 1.0669, "step": 490 }, { "epoch": 0.01, "learning_rate": 1.5430546825895665e-06, "loss": 0.9948, "step": 491 }, { "epoch": 0.01, "learning_rate": 1.5461973601508488e-06, "loss": 0.9949, "step": 492 }, { "epoch": 0.01, "learning_rate": 1.5493400377121309e-06, "loss": 1.0998, "step": 493 }, { "epoch": 0.01, "learning_rate": 1.5524827152734132e-06, "loss": 1.0535, "step": 494 }, { "epoch": 0.01, "learning_rate": 1.5556253928346955e-06, "loss": 0.9534, "step": 495 }, { "epoch": 0.01, "learning_rate": 1.5587680703959775e-06, "loss": 0.933, "step": 496 }, { "epoch": 0.01, "learning_rate": 1.5619107479572598e-06, "loss": 0.963, "step": 497 }, { "epoch": 0.01, "learning_rate": 1.5650534255185421e-06, "loss": 0.9208, "step": 498 }, { "epoch": 0.01, "learning_rate": 1.568196103079824e-06, "loss": 1.0191, "step": 499 }, { "epoch": 0.01, "learning_rate": 1.5713387806411063e-06, "loss": 1.2053, "step": 500 }, { "epoch": 0.01, "learning_rate": 1.5744814582023884e-06, "loss": 0.9736, "step": 501 }, { "epoch": 0.01, "learning_rate": 1.5776241357636706e-06, "loss": 0.8608, "step": 502 }, { "epoch": 0.01, "learning_rate": 1.580766813324953e-06, "loss": 1.0027, "step": 503 }, { "epoch": 0.01, "learning_rate": 1.5839094908862352e-06, "loss": 0.8684, "step": 504 }, { "epoch": 0.01, "learning_rate": 1.5870521684475173e-06, "loss": 1.2028, "step": 505 }, { "epoch": 0.01, "learning_rate": 1.5901948460087996e-06, "loss": 1.3237, "step": 506 }, { "epoch": 0.01, "learning_rate": 1.5933375235700819e-06, "loss": 0.8967, "step": 507 }, { "epoch": 0.01, "learning_rate": 1.596480201131364e-06, "loss": 0.7855, "step": 508 }, { "epoch": 0.01, "learning_rate": 1.5996228786926462e-06, "loss": 1.0588, "step": 509 }, { "epoch": 0.01, "learning_rate": 1.6027655562539285e-06, "loss": 1.0243, "step": 510 }, { "epoch": 0.01, "learning_rate": 1.6059082338152106e-06, "loss": 1.0345, "step": 511 }, { "epoch": 0.01, "learning_rate": 1.609050911376493e-06, "loss": 1.3508, "step": 512 }, { "epoch": 0.01, "learning_rate": 1.6121935889377752e-06, "loss": 1.2945, "step": 513 }, { "epoch": 0.01, "learning_rate": 1.6153362664990575e-06, "loss": 1.0946, "step": 514 }, { "epoch": 0.01, "learning_rate": 1.6184789440603396e-06, "loss": 0.9987, "step": 515 }, { "epoch": 0.01, "learning_rate": 1.6216216216216219e-06, "loss": 1.0754, "step": 516 }, { "epoch": 0.01, "learning_rate": 1.6247642991829041e-06, "loss": 1.0294, "step": 517 }, { "epoch": 0.01, "learning_rate": 1.6279069767441862e-06, "loss": 1.3311, "step": 518 }, { "epoch": 0.01, "learning_rate": 1.6310496543054685e-06, "loss": 1.2388, "step": 519 }, { "epoch": 0.01, "learning_rate": 1.6341923318667504e-06, "loss": 1.1025, "step": 520 }, { "epoch": 0.01, "learning_rate": 1.6373350094280327e-06, "loss": 1.0242, "step": 521 }, { "epoch": 0.01, "learning_rate": 1.640477686989315e-06, "loss": 0.9291, "step": 522 }, { "epoch": 0.01, "learning_rate": 1.6436203645505972e-06, "loss": 0.9297, "step": 523 }, { "epoch": 0.01, "learning_rate": 1.6467630421118793e-06, "loss": 1.0704, "step": 524 }, { "epoch": 0.01, "learning_rate": 1.6499057196731616e-06, "loss": 1.5038, "step": 525 }, { "epoch": 0.01, "learning_rate": 1.653048397234444e-06, "loss": 0.9429, "step": 526 }, { "epoch": 0.01, "learning_rate": 1.656191074795726e-06, "loss": 0.8918, "step": 527 }, { "epoch": 0.01, "learning_rate": 1.6593337523570083e-06, "loss": 1.1876, "step": 528 }, { "epoch": 0.01, "learning_rate": 1.6624764299182906e-06, "loss": 0.929, "step": 529 }, { "epoch": 0.01, "learning_rate": 1.6656191074795726e-06, "loss": 0.8876, "step": 530 }, { "epoch": 0.01, "learning_rate": 1.668761785040855e-06, "loss": 1.1609, "step": 531 }, { "epoch": 0.01, "learning_rate": 1.6719044626021372e-06, "loss": 0.9939, "step": 532 }, { "epoch": 0.01, "learning_rate": 1.6750471401634195e-06, "loss": 0.9372, "step": 533 }, { "epoch": 0.01, "learning_rate": 1.6781898177247016e-06, "loss": 0.8968, "step": 534 }, { "epoch": 0.01, "learning_rate": 1.6813324952859839e-06, "loss": 0.8243, "step": 535 }, { "epoch": 0.01, "learning_rate": 1.6844751728472662e-06, "loss": 0.9378, "step": 536 }, { "epoch": 0.01, "learning_rate": 1.6876178504085482e-06, "loss": 1.074, "step": 537 }, { "epoch": 0.01, "learning_rate": 1.6907605279698305e-06, "loss": 1.0753, "step": 538 }, { "epoch": 0.01, "learning_rate": 1.6939032055311128e-06, "loss": 0.7446, "step": 539 }, { "epoch": 0.01, "learning_rate": 1.697045883092395e-06, "loss": 0.9745, "step": 540 }, { "epoch": 0.01, "learning_rate": 1.700188560653677e-06, "loss": 0.8242, "step": 541 }, { "epoch": 0.01, "learning_rate": 1.7033312382149593e-06, "loss": 0.9622, "step": 542 }, { "epoch": 0.01, "learning_rate": 1.7064739157762413e-06, "loss": 1.1268, "step": 543 }, { "epoch": 0.01, "learning_rate": 1.7096165933375236e-06, "loss": 1.1138, "step": 544 }, { "epoch": 0.01, "learning_rate": 1.712759270898806e-06, "loss": 1.0964, "step": 545 }, { "epoch": 0.01, "learning_rate": 1.715901948460088e-06, "loss": 0.8863, "step": 546 }, { "epoch": 0.01, "learning_rate": 1.7190446260213703e-06, "loss": 1.1301, "step": 547 }, { "epoch": 0.01, "learning_rate": 1.7221873035826526e-06, "loss": 1.0844, "step": 548 }, { "epoch": 0.01, "learning_rate": 1.7253299811439347e-06, "loss": 1.064, "step": 549 }, { "epoch": 0.01, "learning_rate": 1.728472658705217e-06, "loss": 1.1023, "step": 550 }, { "epoch": 0.01, "learning_rate": 1.7316153362664992e-06, "loss": 1.0302, "step": 551 }, { "epoch": 0.01, "learning_rate": 1.7347580138277813e-06, "loss": 0.7752, "step": 552 }, { "epoch": 0.01, "learning_rate": 1.7379006913890636e-06, "loss": 1.1998, "step": 553 }, { "epoch": 0.01, "learning_rate": 1.7410433689503459e-06, "loss": 1.079, "step": 554 }, { "epoch": 0.01, "learning_rate": 1.7441860465116282e-06, "loss": 1.19, "step": 555 }, { "epoch": 0.01, "learning_rate": 1.7473287240729103e-06, "loss": 1.259, "step": 556 }, { "epoch": 0.01, "learning_rate": 1.7504714016341926e-06, "loss": 1.1775, "step": 557 }, { "epoch": 0.01, "learning_rate": 1.7536140791954748e-06, "loss": 1.0046, "step": 558 }, { "epoch": 0.01, "learning_rate": 1.756756756756757e-06, "loss": 1.0026, "step": 559 }, { "epoch": 0.01, "learning_rate": 1.7598994343180392e-06, "loss": 0.896, "step": 560 }, { "epoch": 0.01, "learning_rate": 1.7630421118793215e-06, "loss": 0.9752, "step": 561 }, { "epoch": 0.01, "learning_rate": 1.7661847894406036e-06, "loss": 1.14, "step": 562 }, { "epoch": 0.01, "learning_rate": 1.7693274670018857e-06, "loss": 1.1033, "step": 563 }, { "epoch": 0.01, "learning_rate": 1.772470144563168e-06, "loss": 0.9205, "step": 564 }, { "epoch": 0.01, "learning_rate": 1.77561282212445e-06, "loss": 0.8172, "step": 565 }, { "epoch": 0.01, "learning_rate": 1.7787554996857323e-06, "loss": 1.0778, "step": 566 }, { "epoch": 0.01, "learning_rate": 1.7818981772470146e-06, "loss": 1.0334, "step": 567 }, { "epoch": 0.01, "learning_rate": 1.7850408548082967e-06, "loss": 1.2527, "step": 568 }, { "epoch": 0.01, "learning_rate": 1.788183532369579e-06, "loss": 1.1786, "step": 569 }, { "epoch": 0.01, "learning_rate": 1.7913262099308613e-06, "loss": 1.149, "step": 570 }, { "epoch": 0.01, "learning_rate": 1.7944688874921433e-06, "loss": 0.9038, "step": 571 }, { "epoch": 0.01, "learning_rate": 1.7976115650534256e-06, "loss": 0.9056, "step": 572 }, { "epoch": 0.01, "learning_rate": 1.800754242614708e-06, "loss": 0.921, "step": 573 }, { "epoch": 0.01, "learning_rate": 1.8038969201759902e-06, "loss": 1.1624, "step": 574 }, { "epoch": 0.01, "learning_rate": 1.8070395977372723e-06, "loss": 1.2685, "step": 575 }, { "epoch": 0.01, "learning_rate": 1.8101822752985546e-06, "loss": 1.0114, "step": 576 }, { "epoch": 0.01, "learning_rate": 1.8133249528598369e-06, "loss": 1.0046, "step": 577 }, { "epoch": 0.01, "learning_rate": 1.816467630421119e-06, "loss": 0.7366, "step": 578 }, { "epoch": 0.01, "learning_rate": 1.8196103079824012e-06, "loss": 0.9054, "step": 579 }, { "epoch": 0.01, "learning_rate": 1.8227529855436835e-06, "loss": 1.1718, "step": 580 }, { "epoch": 0.01, "learning_rate": 1.8258956631049656e-06, "loss": 1.2065, "step": 581 }, { "epoch": 0.01, "learning_rate": 1.8290383406662479e-06, "loss": 1.0789, "step": 582 }, { "epoch": 0.01, "learning_rate": 1.8321810182275302e-06, "loss": 1.0063, "step": 583 }, { "epoch": 0.01, "learning_rate": 1.835323695788812e-06, "loss": 0.9418, "step": 584 }, { "epoch": 0.01, "learning_rate": 1.8384663733500943e-06, "loss": 0.9979, "step": 585 }, { "epoch": 0.01, "learning_rate": 1.8416090509113766e-06, "loss": 0.958, "step": 586 }, { "epoch": 0.01, "learning_rate": 1.8447517284726587e-06, "loss": 1.1824, "step": 587 }, { "epoch": 0.01, "learning_rate": 1.847894406033941e-06, "loss": 1.2413, "step": 588 }, { "epoch": 0.01, "learning_rate": 1.8510370835952233e-06, "loss": 0.9204, "step": 589 }, { "epoch": 0.01, "learning_rate": 1.8541797611565054e-06, "loss": 1.1371, "step": 590 }, { "epoch": 0.01, "learning_rate": 1.8573224387177876e-06, "loss": 1.1457, "step": 591 }, { "epoch": 0.01, "learning_rate": 1.86046511627907e-06, "loss": 0.9207, "step": 592 }, { "epoch": 0.01, "learning_rate": 1.8636077938403522e-06, "loss": 1.4471, "step": 593 }, { "epoch": 0.01, "learning_rate": 1.8667504714016343e-06, "loss": 1.1357, "step": 594 }, { "epoch": 0.01, "learning_rate": 1.8698931489629166e-06, "loss": 1.0489, "step": 595 }, { "epoch": 0.01, "learning_rate": 1.8730358265241989e-06, "loss": 0.8907, "step": 596 }, { "epoch": 0.01, "learning_rate": 1.876178504085481e-06, "loss": 0.9274, "step": 597 }, { "epoch": 0.01, "learning_rate": 1.8793211816467632e-06, "loss": 1.0289, "step": 598 }, { "epoch": 0.01, "learning_rate": 1.8824638592080455e-06, "loss": 1.0284, "step": 599 }, { "epoch": 0.01, "learning_rate": 1.8856065367693276e-06, "loss": 1.1866, "step": 600 }, { "epoch": 0.01, "learning_rate": 1.88874921433061e-06, "loss": 1.0093, "step": 601 }, { "epoch": 0.01, "learning_rate": 1.8918918918918922e-06, "loss": 1.0898, "step": 602 }, { "epoch": 0.01, "learning_rate": 1.8950345694531743e-06, "loss": 0.9124, "step": 603 }, { "epoch": 0.01, "learning_rate": 1.8981772470144566e-06, "loss": 0.9324, "step": 604 }, { "epoch": 0.01, "learning_rate": 1.9013199245757386e-06, "loss": 1.0074, "step": 605 }, { "epoch": 0.01, "learning_rate": 1.9044626021370207e-06, "loss": 1.1467, "step": 606 }, { "epoch": 0.01, "learning_rate": 1.907605279698303e-06, "loss": 0.9837, "step": 607 }, { "epoch": 0.01, "learning_rate": 1.910747957259585e-06, "loss": 0.7087, "step": 608 }, { "epoch": 0.01, "learning_rate": 1.9138906348208674e-06, "loss": 0.9966, "step": 609 }, { "epoch": 0.01, "learning_rate": 1.9170333123821497e-06, "loss": 1.0435, "step": 610 }, { "epoch": 0.01, "learning_rate": 1.920175989943432e-06, "loss": 1.2396, "step": 611 }, { "epoch": 0.01, "learning_rate": 1.9233186675047142e-06, "loss": 1.0334, "step": 612 }, { "epoch": 0.01, "learning_rate": 1.9264613450659965e-06, "loss": 1.1567, "step": 613 }, { "epoch": 0.01, "learning_rate": 1.9296040226272784e-06, "loss": 0.9635, "step": 614 }, { "epoch": 0.01, "learning_rate": 1.9327467001885607e-06, "loss": 0.7967, "step": 615 }, { "epoch": 0.01, "learning_rate": 1.935889377749843e-06, "loss": 0.936, "step": 616 }, { "epoch": 0.01, "learning_rate": 1.9390320553111253e-06, "loss": 1.093, "step": 617 }, { "epoch": 0.01, "learning_rate": 1.9421747328724076e-06, "loss": 0.957, "step": 618 }, { "epoch": 0.01, "learning_rate": 1.94531741043369e-06, "loss": 1.2581, "step": 619 }, { "epoch": 0.01, "learning_rate": 1.948460087994972e-06, "loss": 0.8446, "step": 620 }, { "epoch": 0.01, "learning_rate": 1.951602765556254e-06, "loss": 0.9203, "step": 621 }, { "epoch": 0.01, "learning_rate": 1.9547454431175363e-06, "loss": 0.8326, "step": 622 }, { "epoch": 0.01, "learning_rate": 1.9578881206788186e-06, "loss": 0.9999, "step": 623 }, { "epoch": 0.01, "learning_rate": 1.961030798240101e-06, "loss": 1.2236, "step": 624 }, { "epoch": 0.01, "learning_rate": 1.964173475801383e-06, "loss": 1.4354, "step": 625 }, { "epoch": 0.01, "learning_rate": 1.967316153362665e-06, "loss": 0.9966, "step": 626 }, { "epoch": 0.01, "learning_rate": 1.9704588309239473e-06, "loss": 0.9358, "step": 627 }, { "epoch": 0.01, "learning_rate": 1.9736015084852296e-06, "loss": 1.0838, "step": 628 }, { "epoch": 0.01, "learning_rate": 1.976744186046512e-06, "loss": 1.0632, "step": 629 }, { "epoch": 0.01, "learning_rate": 1.9798868636077938e-06, "loss": 1.1232, "step": 630 }, { "epoch": 0.01, "learning_rate": 1.983029541169076e-06, "loss": 1.289, "step": 631 }, { "epoch": 0.01, "learning_rate": 1.9861722187303583e-06, "loss": 0.9955, "step": 632 }, { "epoch": 0.01, "learning_rate": 1.9893148962916406e-06, "loss": 0.9867, "step": 633 }, { "epoch": 0.01, "learning_rate": 1.992457573852923e-06, "loss": 1.1163, "step": 634 }, { "epoch": 0.01, "learning_rate": 1.9956002514142052e-06, "loss": 0.9731, "step": 635 }, { "epoch": 0.01, "learning_rate": 1.998742928975487e-06, "loss": 0.991, "step": 636 }, { "epoch": 0.01, "learning_rate": 2.0018856065367694e-06, "loss": 1.1715, "step": 637 }, { "epoch": 0.01, "learning_rate": 2.0050282840980517e-06, "loss": 1.0359, "step": 638 }, { "epoch": 0.01, "learning_rate": 2.008170961659334e-06, "loss": 1.0824, "step": 639 }, { "epoch": 0.01, "learning_rate": 2.0113136392206162e-06, "loss": 0.9707, "step": 640 }, { "epoch": 0.01, "learning_rate": 2.0144563167818985e-06, "loss": 0.8824, "step": 641 }, { "epoch": 0.01, "learning_rate": 2.017598994343181e-06, "loss": 0.9326, "step": 642 }, { "epoch": 0.01, "learning_rate": 2.0207416719044627e-06, "loss": 1.1407, "step": 643 }, { "epoch": 0.01, "learning_rate": 2.023884349465745e-06, "loss": 1.247, "step": 644 }, { "epoch": 0.01, "learning_rate": 2.0270270270270273e-06, "loss": 0.8764, "step": 645 }, { "epoch": 0.01, "learning_rate": 2.0301697045883096e-06, "loss": 0.869, "step": 646 }, { "epoch": 0.01, "learning_rate": 2.033312382149592e-06, "loss": 0.9085, "step": 647 }, { "epoch": 0.01, "learning_rate": 2.0364550597108737e-06, "loss": 1.0403, "step": 648 }, { "epoch": 0.01, "learning_rate": 2.039597737272156e-06, "loss": 1.2476, "step": 649 }, { "epoch": 0.01, "learning_rate": 2.0427404148334383e-06, "loss": 1.2651, "step": 650 }, { "epoch": 0.01, "learning_rate": 2.0458830923947206e-06, "loss": 1.0493, "step": 651 }, { "epoch": 0.01, "learning_rate": 2.0490257699560024e-06, "loss": 1.1178, "step": 652 }, { "epoch": 0.01, "learning_rate": 2.0521684475172847e-06, "loss": 1.0388, "step": 653 }, { "epoch": 0.01, "learning_rate": 2.055311125078567e-06, "loss": 1.0047, "step": 654 }, { "epoch": 0.01, "learning_rate": 2.0584538026398493e-06, "loss": 1.0867, "step": 655 }, { "epoch": 0.01, "learning_rate": 2.0615964802011316e-06, "loss": 1.1398, "step": 656 }, { "epoch": 0.01, "learning_rate": 2.064739157762414e-06, "loss": 1.0502, "step": 657 }, { "epoch": 0.01, "learning_rate": 2.0678818353236958e-06, "loss": 1.0228, "step": 658 }, { "epoch": 0.01, "learning_rate": 2.071024512884978e-06, "loss": 1.0677, "step": 659 }, { "epoch": 0.01, "learning_rate": 2.0741671904462603e-06, "loss": 0.9655, "step": 660 }, { "epoch": 0.01, "learning_rate": 2.0773098680075426e-06, "loss": 0.9964, "step": 661 }, { "epoch": 0.01, "learning_rate": 2.080452545568825e-06, "loss": 1.216, "step": 662 }, { "epoch": 0.01, "learning_rate": 2.083595223130107e-06, "loss": 1.0211, "step": 663 }, { "epoch": 0.01, "learning_rate": 2.0867379006913895e-06, "loss": 0.8331, "step": 664 }, { "epoch": 0.01, "learning_rate": 2.0898805782526714e-06, "loss": 0.9446, "step": 665 }, { "epoch": 0.01, "learning_rate": 2.0930232558139536e-06, "loss": 0.9496, "step": 666 }, { "epoch": 0.01, "learning_rate": 2.096165933375236e-06, "loss": 0.9926, "step": 667 }, { "epoch": 0.01, "learning_rate": 2.0993086109365182e-06, "loss": 1.2181, "step": 668 }, { "epoch": 0.01, "learning_rate": 2.1024512884978e-06, "loss": 1.313, "step": 669 }, { "epoch": 0.01, "learning_rate": 2.1055939660590824e-06, "loss": 0.6884, "step": 670 }, { "epoch": 0.01, "learning_rate": 2.1087366436203647e-06, "loss": 0.9498, "step": 671 }, { "epoch": 0.01, "learning_rate": 2.111879321181647e-06, "loss": 1.0973, "step": 672 }, { "epoch": 0.01, "learning_rate": 2.1150219987429293e-06, "loss": 0.8952, "step": 673 }, { "epoch": 0.01, "learning_rate": 2.118164676304211e-06, "loss": 1.0161, "step": 674 }, { "epoch": 0.01, "learning_rate": 2.1213073538654934e-06, "loss": 1.1936, "step": 675 }, { "epoch": 0.01, "learning_rate": 2.1244500314267757e-06, "loss": 0.835, "step": 676 }, { "epoch": 0.01, "learning_rate": 2.127592708988058e-06, "loss": 0.9088, "step": 677 }, { "epoch": 0.01, "learning_rate": 2.1307353865493403e-06, "loss": 0.9003, "step": 678 }, { "epoch": 0.01, "learning_rate": 2.1338780641106226e-06, "loss": 1.0047, "step": 679 }, { "epoch": 0.01, "learning_rate": 2.137020741671905e-06, "loss": 1.0449, "step": 680 }, { "epoch": 0.01, "learning_rate": 2.1401634192331867e-06, "loss": 1.1895, "step": 681 }, { "epoch": 0.01, "learning_rate": 2.143306096794469e-06, "loss": 1.0779, "step": 682 }, { "epoch": 0.01, "learning_rate": 2.1464487743557513e-06, "loss": 0.96, "step": 683 }, { "epoch": 0.01, "learning_rate": 2.1495914519170336e-06, "loss": 1.1668, "step": 684 }, { "epoch": 0.01, "learning_rate": 2.152734129478316e-06, "loss": 0.9483, "step": 685 }, { "epoch": 0.01, "learning_rate": 2.155876807039598e-06, "loss": 1.1977, "step": 686 }, { "epoch": 0.01, "learning_rate": 2.15901948460088e-06, "loss": 1.4156, "step": 687 }, { "epoch": 0.01, "learning_rate": 2.1621621621621623e-06, "loss": 1.0399, "step": 688 }, { "epoch": 0.01, "learning_rate": 2.1653048397234446e-06, "loss": 1.0643, "step": 689 }, { "epoch": 0.01, "learning_rate": 2.1684475172847265e-06, "loss": 0.8692, "step": 690 }, { "epoch": 0.01, "learning_rate": 2.1715901948460088e-06, "loss": 0.8911, "step": 691 }, { "epoch": 0.01, "learning_rate": 2.174732872407291e-06, "loss": 0.994, "step": 692 }, { "epoch": 0.01, "learning_rate": 2.1778755499685734e-06, "loss": 1.21, "step": 693 }, { "epoch": 0.01, "learning_rate": 2.1810182275298556e-06, "loss": 1.0601, "step": 694 }, { "epoch": 0.01, "learning_rate": 2.184160905091138e-06, "loss": 0.8463, "step": 695 }, { "epoch": 0.01, "learning_rate": 2.18730358265242e-06, "loss": 1.0657, "step": 696 }, { "epoch": 0.01, "learning_rate": 2.190446260213702e-06, "loss": 0.9656, "step": 697 }, { "epoch": 0.01, "learning_rate": 2.1935889377749844e-06, "loss": 0.8587, "step": 698 }, { "epoch": 0.01, "learning_rate": 2.1967316153362667e-06, "loss": 1.254, "step": 699 }, { "epoch": 0.01, "learning_rate": 2.199874292897549e-06, "loss": 1.3116, "step": 700 }, { "epoch": 0.01, "learning_rate": 2.2030169704588312e-06, "loss": 1.2532, "step": 701 }, { "epoch": 0.01, "learning_rate": 2.2061596480201135e-06, "loss": 1.1039, "step": 702 }, { "epoch": 0.01, "learning_rate": 2.2093023255813954e-06, "loss": 1.1286, "step": 703 }, { "epoch": 0.01, "learning_rate": 2.2124450031426777e-06, "loss": 1.1205, "step": 704 }, { "epoch": 0.01, "learning_rate": 2.21558768070396e-06, "loss": 1.1432, "step": 705 }, { "epoch": 0.01, "learning_rate": 2.2187303582652423e-06, "loss": 1.1394, "step": 706 }, { "epoch": 0.01, "learning_rate": 2.2218730358265246e-06, "loss": 0.908, "step": 707 }, { "epoch": 0.01, "learning_rate": 2.225015713387807e-06, "loss": 1.1681, "step": 708 }, { "epoch": 0.01, "learning_rate": 2.2281583909490887e-06, "loss": 1.0925, "step": 709 }, { "epoch": 0.01, "learning_rate": 2.231301068510371e-06, "loss": 0.9037, "step": 710 }, { "epoch": 0.01, "learning_rate": 2.2344437460716533e-06, "loss": 1.0988, "step": 711 }, { "epoch": 0.01, "learning_rate": 2.237586423632935e-06, "loss": 1.1982, "step": 712 }, { "epoch": 0.01, "learning_rate": 2.2407291011942175e-06, "loss": 0.9006, "step": 713 }, { "epoch": 0.01, "learning_rate": 2.2438717787554997e-06, "loss": 1.0156, "step": 714 }, { "epoch": 0.01, "learning_rate": 2.247014456316782e-06, "loss": 0.9499, "step": 715 }, { "epoch": 0.01, "learning_rate": 2.2501571338780643e-06, "loss": 1.0309, "step": 716 }, { "epoch": 0.01, "learning_rate": 2.2532998114393466e-06, "loss": 0.9856, "step": 717 }, { "epoch": 0.01, "learning_rate": 2.2564424890006285e-06, "loss": 1.2354, "step": 718 }, { "epoch": 0.01, "learning_rate": 2.2595851665619108e-06, "loss": 1.1265, "step": 719 }, { "epoch": 0.01, "learning_rate": 2.262727844123193e-06, "loss": 0.8848, "step": 720 }, { "epoch": 0.01, "learning_rate": 2.2658705216844753e-06, "loss": 0.8805, "step": 721 }, { "epoch": 0.01, "learning_rate": 2.2690131992457576e-06, "loss": 0.9933, "step": 722 }, { "epoch": 0.01, "learning_rate": 2.27215587680704e-06, "loss": 1.0408, "step": 723 }, { "epoch": 0.01, "learning_rate": 2.2752985543683222e-06, "loss": 1.0853, "step": 724 }, { "epoch": 0.01, "learning_rate": 2.278441231929604e-06, "loss": 1.0931, "step": 725 }, { "epoch": 0.01, "learning_rate": 2.2815839094908864e-06, "loss": 0.9269, "step": 726 }, { "epoch": 0.01, "learning_rate": 2.2847265870521687e-06, "loss": 1.0077, "step": 727 }, { "epoch": 0.01, "learning_rate": 2.287869264613451e-06, "loss": 1.0358, "step": 728 }, { "epoch": 0.01, "learning_rate": 2.2910119421747332e-06, "loss": 0.9062, "step": 729 }, { "epoch": 0.01, "learning_rate": 2.2941546197360155e-06, "loss": 0.8732, "step": 730 }, { "epoch": 0.01, "learning_rate": 2.297297297297298e-06, "loss": 1.1666, "step": 731 }, { "epoch": 0.01, "learning_rate": 2.3004399748585797e-06, "loss": 1.0382, "step": 732 }, { "epoch": 0.01, "learning_rate": 2.303582652419862e-06, "loss": 0.7801, "step": 733 }, { "epoch": 0.01, "learning_rate": 2.306725329981144e-06, "loss": 0.9271, "step": 734 }, { "epoch": 0.01, "learning_rate": 2.309868007542426e-06, "loss": 0.8748, "step": 735 }, { "epoch": 0.01, "learning_rate": 2.3130106851037084e-06, "loss": 1.0203, "step": 736 }, { "epoch": 0.01, "learning_rate": 2.3161533626649907e-06, "loss": 1.3457, "step": 737 }, { "epoch": 0.01, "learning_rate": 2.319296040226273e-06, "loss": 0.9685, "step": 738 }, { "epoch": 0.01, "learning_rate": 2.3224387177875553e-06, "loss": 0.8699, "step": 739 }, { "epoch": 0.01, "learning_rate": 2.3255813953488376e-06, "loss": 1.0173, "step": 740 }, { "epoch": 0.01, "learning_rate": 2.3287240729101194e-06, "loss": 0.9474, "step": 741 }, { "epoch": 0.01, "learning_rate": 2.3318667504714017e-06, "loss": 1.256, "step": 742 }, { "epoch": 0.01, "learning_rate": 2.335009428032684e-06, "loss": 1.2559, "step": 743 }, { "epoch": 0.01, "learning_rate": 2.3381521055939663e-06, "loss": 1.2969, "step": 744 }, { "epoch": 0.01, "learning_rate": 2.3412947831552486e-06, "loss": 0.924, "step": 745 }, { "epoch": 0.01, "learning_rate": 2.344437460716531e-06, "loss": 0.9013, "step": 746 }, { "epoch": 0.01, "learning_rate": 2.3475801382778128e-06, "loss": 0.8594, "step": 747 }, { "epoch": 0.01, "learning_rate": 2.350722815839095e-06, "loss": 1.0766, "step": 748 }, { "epoch": 0.01, "learning_rate": 2.3538654934003773e-06, "loss": 1.0533, "step": 749 }, { "epoch": 0.01, "learning_rate": 2.3570081709616596e-06, "loss": 1.2358, "step": 750 }, { "epoch": 0.01, "learning_rate": 2.360150848522942e-06, "loss": 1.0996, "step": 751 }, { "epoch": 0.01, "learning_rate": 2.363293526084224e-06, "loss": 0.8868, "step": 752 }, { "epoch": 0.01, "learning_rate": 2.3664362036455065e-06, "loss": 0.8864, "step": 753 }, { "epoch": 0.01, "learning_rate": 2.3695788812067884e-06, "loss": 0.9641, "step": 754 }, { "epoch": 0.01, "learning_rate": 2.3727215587680707e-06, "loss": 1.009, "step": 755 }, { "epoch": 0.01, "learning_rate": 2.3758642363293525e-06, "loss": 1.0283, "step": 756 }, { "epoch": 0.01, "learning_rate": 2.379006913890635e-06, "loss": 1.0465, "step": 757 }, { "epoch": 0.01, "learning_rate": 2.382149591451917e-06, "loss": 1.1812, "step": 758 }, { "epoch": 0.01, "learning_rate": 2.3852922690131994e-06, "loss": 1.1621, "step": 759 }, { "epoch": 0.01, "learning_rate": 2.3884349465744817e-06, "loss": 0.9888, "step": 760 }, { "epoch": 0.01, "learning_rate": 2.391577624135764e-06, "loss": 0.949, "step": 761 }, { "epoch": 0.01, "learning_rate": 2.3947203016970463e-06, "loss": 1.0973, "step": 762 }, { "epoch": 0.01, "learning_rate": 2.397862979258328e-06, "loss": 1.1883, "step": 763 }, { "epoch": 0.01, "learning_rate": 2.4010056568196104e-06, "loss": 0.8453, "step": 764 }, { "epoch": 0.01, "learning_rate": 2.4041483343808927e-06, "loss": 1.0283, "step": 765 }, { "epoch": 0.01, "learning_rate": 2.407291011942175e-06, "loss": 1.147, "step": 766 }, { "epoch": 0.01, "learning_rate": 2.4104336895034573e-06, "loss": 0.887, "step": 767 }, { "epoch": 0.01, "learning_rate": 2.4135763670647396e-06, "loss": 1.1642, "step": 768 }, { "epoch": 0.01, "learning_rate": 2.4167190446260214e-06, "loss": 1.2001, "step": 769 }, { "epoch": 0.01, "learning_rate": 2.4198617221873037e-06, "loss": 0.9344, "step": 770 }, { "epoch": 0.01, "learning_rate": 2.423004399748586e-06, "loss": 1.0417, "step": 771 }, { "epoch": 0.01, "learning_rate": 2.4261470773098683e-06, "loss": 0.8909, "step": 772 }, { "epoch": 0.01, "learning_rate": 2.4292897548711506e-06, "loss": 0.9262, "step": 773 }, { "epoch": 0.01, "learning_rate": 2.432432432432433e-06, "loss": 1.2005, "step": 774 }, { "epoch": 0.01, "learning_rate": 2.4355751099937147e-06, "loss": 1.0798, "step": 775 }, { "epoch": 0.01, "learning_rate": 2.438717787554997e-06, "loss": 1.0691, "step": 776 }, { "epoch": 0.01, "learning_rate": 2.4418604651162793e-06, "loss": 0.8071, "step": 777 }, { "epoch": 0.01, "learning_rate": 2.445003142677561e-06, "loss": 1.09, "step": 778 }, { "epoch": 0.01, "learning_rate": 2.4481458202388435e-06, "loss": 0.9611, "step": 779 }, { "epoch": 0.01, "learning_rate": 2.4512884978001258e-06, "loss": 1.0331, "step": 780 }, { "epoch": 0.01, "learning_rate": 2.454431175361408e-06, "loss": 1.1932, "step": 781 }, { "epoch": 0.01, "learning_rate": 2.4575738529226904e-06, "loss": 1.2327, "step": 782 }, { "epoch": 0.01, "learning_rate": 2.4607165304839726e-06, "loss": 0.8836, "step": 783 }, { "epoch": 0.01, "learning_rate": 2.463859208045255e-06, "loss": 0.8478, "step": 784 }, { "epoch": 0.01, "learning_rate": 2.467001885606537e-06, "loss": 0.9333, "step": 785 }, { "epoch": 0.01, "learning_rate": 2.470144563167819e-06, "loss": 1.06, "step": 786 }, { "epoch": 0.01, "learning_rate": 2.4732872407291014e-06, "loss": 1.2497, "step": 787 }, { "epoch": 0.01, "learning_rate": 2.4764299182903837e-06, "loss": 1.0444, "step": 788 }, { "epoch": 0.01, "learning_rate": 2.479572595851666e-06, "loss": 0.8818, "step": 789 }, { "epoch": 0.01, "learning_rate": 2.4827152734129482e-06, "loss": 0.9475, "step": 790 }, { "epoch": 0.01, "learning_rate": 2.4858579509742305e-06, "loss": 0.7916, "step": 791 }, { "epoch": 0.01, "learning_rate": 2.4890006285355124e-06, "loss": 0.9679, "step": 792 }, { "epoch": 0.01, "learning_rate": 2.4921433060967947e-06, "loss": 1.1028, "step": 793 }, { "epoch": 0.01, "learning_rate": 2.495285983658077e-06, "loss": 1.2806, "step": 794 }, { "epoch": 0.01, "learning_rate": 2.4984286612193593e-06, "loss": 0.8723, "step": 795 }, { "epoch": 0.02, "learning_rate": 2.501571338780641e-06, "loss": 1.0811, "step": 796 }, { "epoch": 0.02, "learning_rate": 2.504714016341924e-06, "loss": 0.9317, "step": 797 }, { "epoch": 0.02, "learning_rate": 2.5078566939032057e-06, "loss": 0.8674, "step": 798 }, { "epoch": 0.02, "learning_rate": 2.510999371464488e-06, "loss": 1.1, "step": 799 }, { "epoch": 0.02, "learning_rate": 2.51414204902577e-06, "loss": 1.2341, "step": 800 }, { "epoch": 0.02, "learning_rate": 2.5172847265870526e-06, "loss": 1.0424, "step": 801 }, { "epoch": 0.02, "learning_rate": 2.5204274041483345e-06, "loss": 0.9154, "step": 802 }, { "epoch": 0.02, "learning_rate": 2.523570081709617e-06, "loss": 0.8837, "step": 803 }, { "epoch": 0.02, "learning_rate": 2.526712759270899e-06, "loss": 0.8907, "step": 804 }, { "epoch": 0.02, "learning_rate": 2.5298554368321813e-06, "loss": 1.0236, "step": 805 }, { "epoch": 0.02, "learning_rate": 2.5329981143934636e-06, "loss": 1.2532, "step": 806 }, { "epoch": 0.02, "learning_rate": 2.5361407919547455e-06, "loss": 1.218, "step": 807 }, { "epoch": 0.02, "learning_rate": 2.5392834695160278e-06, "loss": 0.8202, "step": 808 }, { "epoch": 0.02, "learning_rate": 2.5424261470773096e-06, "loss": 1.0819, "step": 809 }, { "epoch": 0.02, "learning_rate": 2.5455688246385923e-06, "loss": 0.9884, "step": 810 }, { "epoch": 0.02, "learning_rate": 2.548711502199874e-06, "loss": 1.0594, "step": 811 }, { "epoch": 0.02, "learning_rate": 2.551854179761157e-06, "loss": 1.212, "step": 812 }, { "epoch": 0.02, "learning_rate": 2.554996857322439e-06, "loss": 0.8916, "step": 813 }, { "epoch": 0.02, "learning_rate": 2.558139534883721e-06, "loss": 0.9848, "step": 814 }, { "epoch": 0.02, "learning_rate": 2.5612822124450034e-06, "loss": 1.0342, "step": 815 }, { "epoch": 0.02, "learning_rate": 2.5644248900062857e-06, "loss": 0.9627, "step": 816 }, { "epoch": 0.02, "learning_rate": 2.5675675675675675e-06, "loss": 1.1063, "step": 817 }, { "epoch": 0.02, "learning_rate": 2.5707102451288502e-06, "loss": 1.1656, "step": 818 }, { "epoch": 0.02, "learning_rate": 2.573852922690132e-06, "loss": 1.1276, "step": 819 }, { "epoch": 0.02, "learning_rate": 2.5769956002514144e-06, "loss": 0.8709, "step": 820 }, { "epoch": 0.02, "learning_rate": 2.5801382778126967e-06, "loss": 1.0956, "step": 821 }, { "epoch": 0.02, "learning_rate": 2.583280955373979e-06, "loss": 0.9073, "step": 822 }, { "epoch": 0.02, "learning_rate": 2.586423632935261e-06, "loss": 1.0731, "step": 823 }, { "epoch": 0.02, "learning_rate": 2.5895663104965436e-06, "loss": 1.3572, "step": 824 }, { "epoch": 0.02, "learning_rate": 2.5927089880578254e-06, "loss": 1.2798, "step": 825 }, { "epoch": 0.02, "learning_rate": 2.595851665619108e-06, "loss": 0.8093, "step": 826 }, { "epoch": 0.02, "learning_rate": 2.59899434318039e-06, "loss": 0.8341, "step": 827 }, { "epoch": 0.02, "learning_rate": 2.602137020741672e-06, "loss": 0.978, "step": 828 }, { "epoch": 0.02, "learning_rate": 2.605279698302954e-06, "loss": 1.1428, "step": 829 }, { "epoch": 0.02, "learning_rate": 2.6084223758642364e-06, "loss": 1.1036, "step": 830 }, { "epoch": 0.02, "learning_rate": 2.6115650534255187e-06, "loss": 1.3416, "step": 831 }, { "epoch": 0.02, "learning_rate": 2.6147077309868006e-06, "loss": 1.1758, "step": 832 }, { "epoch": 0.02, "learning_rate": 2.6178504085480833e-06, "loss": 0.857, "step": 833 }, { "epoch": 0.02, "learning_rate": 2.620993086109365e-06, "loss": 0.9289, "step": 834 }, { "epoch": 0.02, "learning_rate": 2.624135763670648e-06, "loss": 0.936, "step": 835 }, { "epoch": 0.02, "learning_rate": 2.6272784412319298e-06, "loss": 0.9518, "step": 836 }, { "epoch": 0.02, "learning_rate": 2.630421118793212e-06, "loss": 1.2516, "step": 837 }, { "epoch": 0.02, "learning_rate": 2.633563796354494e-06, "loss": 1.1115, "step": 838 }, { "epoch": 0.02, "learning_rate": 2.6367064739157766e-06, "loss": 0.8926, "step": 839 }, { "epoch": 0.02, "learning_rate": 2.6398491514770585e-06, "loss": 0.9309, "step": 840 }, { "epoch": 0.02, "learning_rate": 2.642991829038341e-06, "loss": 0.9225, "step": 841 }, { "epoch": 0.02, "learning_rate": 2.646134506599623e-06, "loss": 0.8925, "step": 842 }, { "epoch": 0.02, "learning_rate": 2.6492771841609054e-06, "loss": 1.0657, "step": 843 }, { "epoch": 0.02, "learning_rate": 2.6524198617221877e-06, "loss": 1.0818, "step": 844 }, { "epoch": 0.02, "learning_rate": 2.65556253928347e-06, "loss": 1.1723, "step": 845 }, { "epoch": 0.02, "learning_rate": 2.658705216844752e-06, "loss": 0.9691, "step": 846 }, { "epoch": 0.02, "learning_rate": 2.6618478944060345e-06, "loss": 0.8809, "step": 847 }, { "epoch": 0.02, "learning_rate": 2.6649905719673164e-06, "loss": 0.9694, "step": 848 }, { "epoch": 0.02, "learning_rate": 2.6681332495285983e-06, "loss": 1.1359, "step": 849 }, { "epoch": 0.02, "learning_rate": 2.671275927089881e-06, "loss": 1.1825, "step": 850 }, { "epoch": 0.02, "learning_rate": 2.674418604651163e-06, "loss": 1.1697, "step": 851 }, { "epoch": 0.02, "learning_rate": 2.677561282212445e-06, "loss": 0.8776, "step": 852 }, { "epoch": 0.02, "learning_rate": 2.6807039597737274e-06, "loss": 1.2199, "step": 853 }, { "epoch": 0.02, "learning_rate": 2.6838466373350097e-06, "loss": 0.9484, "step": 854 }, { "epoch": 0.02, "learning_rate": 2.6869893148962916e-06, "loss": 1.0577, "step": 855 }, { "epoch": 0.02, "learning_rate": 2.6901319924575743e-06, "loss": 1.1591, "step": 856 }, { "epoch": 0.02, "learning_rate": 2.693274670018856e-06, "loss": 0.9813, "step": 857 }, { "epoch": 0.02, "learning_rate": 2.6964173475801384e-06, "loss": 0.9403, "step": 858 }, { "epoch": 0.02, "learning_rate": 2.6995600251414207e-06, "loss": 1.1224, "step": 859 }, { "epoch": 0.02, "learning_rate": 2.702702702702703e-06, "loss": 1.0536, "step": 860 }, { "epoch": 0.02, "learning_rate": 2.705845380263985e-06, "loss": 1.1592, "step": 861 }, { "epoch": 0.02, "learning_rate": 2.7089880578252676e-06, "loss": 1.0449, "step": 862 }, { "epoch": 0.02, "learning_rate": 2.7121307353865495e-06, "loss": 1.2037, "step": 863 }, { "epoch": 0.02, "learning_rate": 2.715273412947832e-06, "loss": 0.9644, "step": 864 }, { "epoch": 0.02, "learning_rate": 2.718416090509114e-06, "loss": 0.9076, "step": 865 }, { "epoch": 0.02, "learning_rate": 2.7215587680703963e-06, "loss": 0.8649, "step": 866 }, { "epoch": 0.02, "learning_rate": 2.724701445631678e-06, "loss": 1.0364, "step": 867 }, { "epoch": 0.02, "learning_rate": 2.727844123192961e-06, "loss": 1.3395, "step": 868 }, { "epoch": 0.02, "learning_rate": 2.7309868007542428e-06, "loss": 0.9641, "step": 869 }, { "epoch": 0.02, "learning_rate": 2.7341294783155246e-06, "loss": 0.8997, "step": 870 }, { "epoch": 0.02, "learning_rate": 2.7372721558768074e-06, "loss": 1.1442, "step": 871 }, { "epoch": 0.02, "learning_rate": 2.7404148334380892e-06, "loss": 0.9365, "step": 872 }, { "epoch": 0.02, "learning_rate": 2.743557510999372e-06, "loss": 0.8458, "step": 873 }, { "epoch": 0.02, "learning_rate": 2.746700188560654e-06, "loss": 1.1603, "step": 874 }, { "epoch": 0.02, "learning_rate": 2.749842866121936e-06, "loss": 1.1363, "step": 875 }, { "epoch": 0.02, "learning_rate": 2.752985543683218e-06, "loss": 1.0364, "step": 876 }, { "epoch": 0.02, "learning_rate": 2.7561282212445007e-06, "loss": 1.1583, "step": 877 }, { "epoch": 0.02, "learning_rate": 2.7592708988057825e-06, "loss": 1.0526, "step": 878 }, { "epoch": 0.02, "learning_rate": 2.7624135763670652e-06, "loss": 0.9356, "step": 879 }, { "epoch": 0.02, "learning_rate": 2.765556253928347e-06, "loss": 1.0049, "step": 880 }, { "epoch": 0.02, "learning_rate": 2.7686989314896294e-06, "loss": 1.1777, "step": 881 }, { "epoch": 0.02, "learning_rate": 2.7718416090509117e-06, "loss": 1.1417, "step": 882 }, { "epoch": 0.02, "learning_rate": 2.774984286612194e-06, "loss": 1.0406, "step": 883 }, { "epoch": 0.02, "learning_rate": 2.778126964173476e-06, "loss": 1.0361, "step": 884 }, { "epoch": 0.02, "learning_rate": 2.7812696417347586e-06, "loss": 1.0089, "step": 885 }, { "epoch": 0.02, "learning_rate": 2.7844123192960404e-06, "loss": 1.0115, "step": 886 }, { "epoch": 0.02, "learning_rate": 2.7875549968573227e-06, "loss": 1.29, "step": 887 }, { "epoch": 0.02, "learning_rate": 2.790697674418605e-06, "loss": 1.1297, "step": 888 }, { "epoch": 0.02, "learning_rate": 2.7938403519798873e-06, "loss": 1.0812, "step": 889 }, { "epoch": 0.02, "learning_rate": 2.796983029541169e-06, "loss": 0.8094, "step": 890 }, { "epoch": 0.02, "learning_rate": 2.800125707102451e-06, "loss": 1.0508, "step": 891 }, { "epoch": 0.02, "learning_rate": 2.8032683846637337e-06, "loss": 0.9949, "step": 892 }, { "epoch": 0.02, "learning_rate": 2.8064110622250156e-06, "loss": 1.1078, "step": 893 }, { "epoch": 0.02, "learning_rate": 2.8095537397862983e-06, "loss": 1.0552, "step": 894 }, { "epoch": 0.02, "learning_rate": 2.81269641734758e-06, "loss": 0.9161, "step": 895 }, { "epoch": 0.02, "learning_rate": 2.8158390949088625e-06, "loss": 1.0353, "step": 896 }, { "epoch": 0.02, "learning_rate": 2.8189817724701448e-06, "loss": 0.8799, "step": 897 }, { "epoch": 0.02, "learning_rate": 2.822124450031427e-06, "loss": 0.9891, "step": 898 }, { "epoch": 0.02, "learning_rate": 2.825267127592709e-06, "loss": 1.0847, "step": 899 }, { "epoch": 0.02, "learning_rate": 2.8284098051539916e-06, "loss": 1.3286, "step": 900 }, { "epoch": 0.02, "learning_rate": 2.8315524827152735e-06, "loss": 1.0063, "step": 901 }, { "epoch": 0.02, "learning_rate": 2.834695160276556e-06, "loss": 0.975, "step": 902 }, { "epoch": 0.02, "learning_rate": 2.837837837837838e-06, "loss": 1.0016, "step": 903 }, { "epoch": 0.02, "learning_rate": 2.8409805153991204e-06, "loss": 1.067, "step": 904 }, { "epoch": 0.02, "learning_rate": 2.8441231929604022e-06, "loss": 1.0671, "step": 905 }, { "epoch": 0.02, "learning_rate": 2.847265870521685e-06, "loss": 1.0859, "step": 906 }, { "epoch": 0.02, "learning_rate": 2.850408548082967e-06, "loss": 0.9872, "step": 907 }, { "epoch": 0.02, "learning_rate": 2.8535512256442495e-06, "loss": 0.8174, "step": 908 }, { "epoch": 0.02, "learning_rate": 2.8566939032055314e-06, "loss": 1.0305, "step": 909 }, { "epoch": 0.02, "learning_rate": 2.8598365807668137e-06, "loss": 0.802, "step": 910 }, { "epoch": 0.02, "learning_rate": 2.8629792583280956e-06, "loss": 1.2307, "step": 911 }, { "epoch": 0.02, "learning_rate": 2.8661219358893783e-06, "loss": 1.0781, "step": 912 }, { "epoch": 0.02, "learning_rate": 2.86926461345066e-06, "loss": 1.1213, "step": 913 }, { "epoch": 0.02, "learning_rate": 2.872407291011942e-06, "loss": 1.052, "step": 914 }, { "epoch": 0.02, "learning_rate": 2.8755499685732247e-06, "loss": 0.8787, "step": 915 }, { "epoch": 0.02, "learning_rate": 2.8786926461345066e-06, "loss": 0.9095, "step": 916 }, { "epoch": 0.02, "learning_rate": 2.8818353236957893e-06, "loss": 0.9505, "step": 917 }, { "epoch": 0.02, "learning_rate": 2.884978001257071e-06, "loss": 1.1734, "step": 918 }, { "epoch": 0.02, "learning_rate": 2.8881206788183534e-06, "loss": 1.2079, "step": 919 }, { "epoch": 0.02, "learning_rate": 2.8912633563796353e-06, "loss": 1.0208, "step": 920 }, { "epoch": 0.02, "learning_rate": 2.894406033940918e-06, "loss": 0.9277, "step": 921 }, { "epoch": 0.02, "learning_rate": 2.8975487115022e-06, "loss": 1.017, "step": 922 }, { "epoch": 0.02, "learning_rate": 2.9006913890634826e-06, "loss": 1.0867, "step": 923 }, { "epoch": 0.02, "learning_rate": 2.9038340666247645e-06, "loss": 1.0199, "step": 924 }, { "epoch": 0.02, "learning_rate": 2.9069767441860468e-06, "loss": 1.1379, "step": 925 }, { "epoch": 0.02, "learning_rate": 2.910119421747329e-06, "loss": 0.8824, "step": 926 }, { "epoch": 0.02, "learning_rate": 2.9132620993086113e-06, "loss": 0.7237, "step": 927 }, { "epoch": 0.02, "learning_rate": 2.916404776869893e-06, "loss": 1.0483, "step": 928 }, { "epoch": 0.02, "learning_rate": 2.919547454431176e-06, "loss": 1.131, "step": 929 }, { "epoch": 0.02, "learning_rate": 2.9226901319924578e-06, "loss": 1.1434, "step": 930 }, { "epoch": 0.02, "learning_rate": 2.92583280955374e-06, "loss": 1.0029, "step": 931 }, { "epoch": 0.02, "learning_rate": 2.9289754871150224e-06, "loss": 1.0782, "step": 932 }, { "epoch": 0.02, "learning_rate": 2.9321181646763047e-06, "loss": 0.8432, "step": 933 }, { "epoch": 0.02, "learning_rate": 2.9352608422375865e-06, "loss": 0.9908, "step": 934 }, { "epoch": 0.02, "learning_rate": 2.938403519798869e-06, "loss": 0.957, "step": 935 }, { "epoch": 0.02, "learning_rate": 2.941546197360151e-06, "loss": 1.1172, "step": 936 }, { "epoch": 0.02, "learning_rate": 2.944688874921433e-06, "loss": 1.2643, "step": 937 }, { "epoch": 0.02, "learning_rate": 2.9478315524827157e-06, "loss": 0.9677, "step": 938 }, { "epoch": 0.02, "learning_rate": 2.9509742300439975e-06, "loss": 1.0351, "step": 939 }, { "epoch": 0.02, "learning_rate": 2.95411690760528e-06, "loss": 0.9095, "step": 940 }, { "epoch": 0.02, "learning_rate": 2.957259585166562e-06, "loss": 1.0782, "step": 941 }, { "epoch": 0.02, "learning_rate": 2.9604022627278444e-06, "loss": 0.8858, "step": 942 }, { "epoch": 0.02, "learning_rate": 2.9635449402891263e-06, "loss": 1.2407, "step": 943 }, { "epoch": 0.02, "learning_rate": 2.966687617850409e-06, "loss": 1.0329, "step": 944 }, { "epoch": 0.02, "learning_rate": 2.969830295411691e-06, "loss": 1.0076, "step": 945 }, { "epoch": 0.02, "learning_rate": 2.9729729729729736e-06, "loss": 0.9868, "step": 946 }, { "epoch": 0.02, "learning_rate": 2.9761156505342554e-06, "loss": 0.804, "step": 947 }, { "epoch": 0.02, "learning_rate": 2.9792583280955377e-06, "loss": 0.9808, "step": 948 }, { "epoch": 0.02, "learning_rate": 2.9824010056568196e-06, "loss": 1.0109, "step": 949 }, { "epoch": 0.02, "learning_rate": 2.9855436832181023e-06, "loss": 1.2473, "step": 950 }, { "epoch": 0.02, "learning_rate": 2.988686360779384e-06, "loss": 0.8988, "step": 951 }, { "epoch": 0.02, "learning_rate": 2.991829038340667e-06, "loss": 0.9189, "step": 952 }, { "epoch": 0.02, "learning_rate": 2.9949717159019488e-06, "loss": 0.9398, "step": 953 }, { "epoch": 0.02, "learning_rate": 2.998114393463231e-06, "loss": 0.9727, "step": 954 }, { "epoch": 0.02, "learning_rate": 3.0012570710245133e-06, "loss": 1.1053, "step": 955 }, { "epoch": 0.02, "learning_rate": 3.004399748585795e-06, "loss": 1.2202, "step": 956 }, { "epoch": 0.02, "learning_rate": 3.0075424261470775e-06, "loss": 1.0087, "step": 957 }, { "epoch": 0.02, "learning_rate": 3.0106851037083594e-06, "loss": 0.9052, "step": 958 }, { "epoch": 0.02, "learning_rate": 3.013827781269642e-06, "loss": 0.9055, "step": 959 }, { "epoch": 0.02, "learning_rate": 3.016970458830924e-06, "loss": 0.908, "step": 960 }, { "epoch": 0.02, "learning_rate": 3.0201131363922066e-06, "loss": 0.9102, "step": 961 }, { "epoch": 0.02, "learning_rate": 3.0232558139534885e-06, "loss": 1.1342, "step": 962 }, { "epoch": 0.02, "learning_rate": 3.026398491514771e-06, "loss": 0.9927, "step": 963 }, { "epoch": 0.02, "learning_rate": 3.029541169076053e-06, "loss": 0.9817, "step": 964 }, { "epoch": 0.02, "learning_rate": 3.0326838466373354e-06, "loss": 1.0452, "step": 965 }, { "epoch": 0.02, "learning_rate": 3.0358265241986172e-06, "loss": 1.0167, "step": 966 }, { "epoch": 0.02, "learning_rate": 3.0389692017599e-06, "loss": 1.0092, "step": 967 }, { "epoch": 0.02, "learning_rate": 3.042111879321182e-06, "loss": 1.0921, "step": 968 }, { "epoch": 0.02, "learning_rate": 3.045254556882464e-06, "loss": 1.0771, "step": 969 }, { "epoch": 0.02, "learning_rate": 3.0483972344437464e-06, "loss": 0.937, "step": 970 }, { "epoch": 0.02, "learning_rate": 3.0515399120050287e-06, "loss": 0.9701, "step": 971 }, { "epoch": 0.02, "learning_rate": 3.0546825895663106e-06, "loss": 1.1437, "step": 972 }, { "epoch": 0.02, "learning_rate": 3.0578252671275933e-06, "loss": 0.9909, "step": 973 }, { "epoch": 0.02, "learning_rate": 3.060967944688875e-06, "loss": 1.0067, "step": 974 }, { "epoch": 0.02, "learning_rate": 3.064110622250158e-06, "loss": 1.1728, "step": 975 }, { "epoch": 0.02, "learning_rate": 3.0672532998114397e-06, "loss": 1.0471, "step": 976 }, { "epoch": 0.02, "learning_rate": 3.0703959773727216e-06, "loss": 0.8488, "step": 977 }, { "epoch": 0.02, "learning_rate": 3.073538654934004e-06, "loss": 0.8837, "step": 978 }, { "epoch": 0.02, "learning_rate": 3.076681332495286e-06, "loss": 0.8815, "step": 979 }, { "epoch": 0.02, "learning_rate": 3.0798240100565685e-06, "loss": 1.0202, "step": 980 }, { "epoch": 0.02, "learning_rate": 3.0829666876178503e-06, "loss": 1.1451, "step": 981 }, { "epoch": 0.02, "learning_rate": 3.086109365179133e-06, "loss": 1.0955, "step": 982 }, { "epoch": 0.02, "learning_rate": 3.089252042740415e-06, "loss": 0.9394, "step": 983 }, { "epoch": 0.02, "learning_rate": 3.0923947203016976e-06, "loss": 1.0117, "step": 984 }, { "epoch": 0.02, "learning_rate": 3.0955373978629795e-06, "loss": 0.9195, "step": 985 }, { "epoch": 0.02, "learning_rate": 3.0986800754242618e-06, "loss": 1.153, "step": 986 }, { "epoch": 0.02, "learning_rate": 3.1018227529855436e-06, "loss": 1.0935, "step": 987 }, { "epoch": 0.02, "learning_rate": 3.1049654305468263e-06, "loss": 1.088, "step": 988 }, { "epoch": 0.02, "learning_rate": 3.1081081081081082e-06, "loss": 0.8734, "step": 989 }, { "epoch": 0.02, "learning_rate": 3.111250785669391e-06, "loss": 0.7541, "step": 990 }, { "epoch": 0.02, "learning_rate": 3.114393463230673e-06, "loss": 0.8047, "step": 991 }, { "epoch": 0.02, "learning_rate": 3.117536140791955e-06, "loss": 1.1377, "step": 992 }, { "epoch": 0.02, "learning_rate": 3.1206788183532374e-06, "loss": 0.9863, "step": 993 }, { "epoch": 0.02, "learning_rate": 3.1238214959145197e-06, "loss": 1.0604, "step": 994 }, { "epoch": 0.02, "learning_rate": 3.1269641734758015e-06, "loss": 1.0815, "step": 995 }, { "epoch": 0.02, "learning_rate": 3.1301068510370842e-06, "loss": 0.889, "step": 996 }, { "epoch": 0.02, "learning_rate": 3.133249528598366e-06, "loss": 0.9771, "step": 997 }, { "epoch": 0.02, "learning_rate": 3.136392206159648e-06, "loss": 0.9336, "step": 998 }, { "epoch": 0.02, "learning_rate": 3.1395348837209307e-06, "loss": 1.0153, "step": 999 }, { "epoch": 0.02, "learning_rate": 3.1426775612822126e-06, "loss": 1.222, "step": 1000 }, { "epoch": 0.02, "learning_rate": 3.145820238843495e-06, "loss": 0.9613, "step": 1001 }, { "epoch": 0.02, "learning_rate": 3.1489629164047767e-06, "loss": 0.9155, "step": 1002 }, { "epoch": 0.02, "learning_rate": 3.1521055939660594e-06, "loss": 1.1163, "step": 1003 }, { "epoch": 0.02, "learning_rate": 3.1552482715273413e-06, "loss": 0.9037, "step": 1004 }, { "epoch": 0.02, "learning_rate": 3.158390949088624e-06, "loss": 1.0527, "step": 1005 }, { "epoch": 0.02, "learning_rate": 3.161533626649906e-06, "loss": 1.2068, "step": 1006 }, { "epoch": 0.02, "learning_rate": 3.164676304211188e-06, "loss": 1.2119, "step": 1007 }, { "epoch": 0.02, "learning_rate": 3.1678189817724704e-06, "loss": 1.0372, "step": 1008 }, { "epoch": 0.02, "learning_rate": 3.1709616593337527e-06, "loss": 0.8193, "step": 1009 }, { "epoch": 0.02, "learning_rate": 3.1741043368950346e-06, "loss": 0.9501, "step": 1010 }, { "epoch": 0.02, "learning_rate": 3.1772470144563173e-06, "loss": 1.06, "step": 1011 }, { "epoch": 0.02, "learning_rate": 3.180389692017599e-06, "loss": 1.2315, "step": 1012 }, { "epoch": 0.02, "learning_rate": 3.1835323695788815e-06, "loss": 1.0805, "step": 1013 }, { "epoch": 0.02, "learning_rate": 3.1866750471401638e-06, "loss": 0.9149, "step": 1014 }, { "epoch": 0.02, "learning_rate": 3.189817724701446e-06, "loss": 1.0646, "step": 1015 }, { "epoch": 0.02, "learning_rate": 3.192960402262728e-06, "loss": 1.0909, "step": 1016 }, { "epoch": 0.02, "learning_rate": 3.1961030798240106e-06, "loss": 0.9163, "step": 1017 }, { "epoch": 0.02, "learning_rate": 3.1992457573852925e-06, "loss": 1.3501, "step": 1018 }, { "epoch": 0.02, "learning_rate": 3.2023884349465744e-06, "loss": 1.2141, "step": 1019 }, { "epoch": 0.02, "learning_rate": 3.205531112507857e-06, "loss": 1.1411, "step": 1020 }, { "epoch": 0.02, "learning_rate": 3.208673790069139e-06, "loss": 1.0412, "step": 1021 }, { "epoch": 0.02, "learning_rate": 3.2118164676304212e-06, "loss": 0.9416, "step": 1022 }, { "epoch": 0.02, "learning_rate": 3.2149591451917035e-06, "loss": 0.8586, "step": 1023 }, { "epoch": 0.02, "learning_rate": 3.218101822752986e-06, "loss": 0.9543, "step": 1024 }, { "epoch": 0.02, "learning_rate": 3.2212445003142677e-06, "loss": 1.1611, "step": 1025 }, { "epoch": 0.02, "learning_rate": 3.2243871778755504e-06, "loss": 0.9926, "step": 1026 }, { "epoch": 0.02, "learning_rate": 3.2275298554368323e-06, "loss": 0.7382, "step": 1027 }, { "epoch": 0.02, "learning_rate": 3.230672532998115e-06, "loss": 1.0066, "step": 1028 }, { "epoch": 0.02, "learning_rate": 3.233815210559397e-06, "loss": 1.0172, "step": 1029 }, { "epoch": 0.02, "learning_rate": 3.236957888120679e-06, "loss": 0.8896, "step": 1030 }, { "epoch": 0.02, "learning_rate": 3.240100565681961e-06, "loss": 1.1627, "step": 1031 }, { "epoch": 0.02, "learning_rate": 3.2432432432432437e-06, "loss": 0.9462, "step": 1032 }, { "epoch": 0.02, "learning_rate": 3.2463859208045256e-06, "loss": 0.81, "step": 1033 }, { "epoch": 0.02, "learning_rate": 3.2495285983658083e-06, "loss": 1.0386, "step": 1034 }, { "epoch": 0.02, "learning_rate": 3.25267127592709e-06, "loss": 1.0246, "step": 1035 }, { "epoch": 0.02, "learning_rate": 3.2558139534883724e-06, "loss": 1.0244, "step": 1036 }, { "epoch": 0.02, "learning_rate": 3.2589566310496547e-06, "loss": 1.1047, "step": 1037 }, { "epoch": 0.02, "learning_rate": 3.262099308610937e-06, "loss": 1.2079, "step": 1038 }, { "epoch": 0.02, "learning_rate": 3.265241986172219e-06, "loss": 1.1296, "step": 1039 }, { "epoch": 0.02, "learning_rate": 3.2683846637335007e-06, "loss": 0.9743, "step": 1040 }, { "epoch": 0.02, "learning_rate": 3.2715273412947835e-06, "loss": 0.9989, "step": 1041 }, { "epoch": 0.02, "learning_rate": 3.2746700188560653e-06, "loss": 0.8908, "step": 1042 }, { "epoch": 0.02, "learning_rate": 3.277812696417348e-06, "loss": 1.0411, "step": 1043 }, { "epoch": 0.02, "learning_rate": 3.28095537397863e-06, "loss": 1.1105, "step": 1044 }, { "epoch": 0.02, "learning_rate": 3.284098051539912e-06, "loss": 0.9971, "step": 1045 }, { "epoch": 0.02, "learning_rate": 3.2872407291011945e-06, "loss": 0.8949, "step": 1046 }, { "epoch": 0.02, "learning_rate": 3.2903834066624768e-06, "loss": 1.01, "step": 1047 }, { "epoch": 0.02, "learning_rate": 3.2935260842237586e-06, "loss": 0.9362, "step": 1048 }, { "epoch": 0.02, "learning_rate": 3.2966687617850414e-06, "loss": 1.152, "step": 1049 }, { "epoch": 0.02, "learning_rate": 3.2998114393463232e-06, "loss": 1.1504, "step": 1050 }, { "epoch": 0.02, "learning_rate": 3.3029541169076055e-06, "loss": 1.0567, "step": 1051 }, { "epoch": 0.02, "learning_rate": 3.306096794468888e-06, "loss": 0.9813, "step": 1052 }, { "epoch": 0.02, "learning_rate": 3.30923947203017e-06, "loss": 1.0502, "step": 1053 }, { "epoch": 0.02, "learning_rate": 3.312382149591452e-06, "loss": 0.9595, "step": 1054 }, { "epoch": 0.02, "learning_rate": 3.3155248271527347e-06, "loss": 1.1968, "step": 1055 }, { "epoch": 0.02, "learning_rate": 3.3186675047140165e-06, "loss": 1.2513, "step": 1056 }, { "epoch": 0.02, "learning_rate": 3.3218101822752992e-06, "loss": 1.2229, "step": 1057 }, { "epoch": 0.02, "learning_rate": 3.324952859836581e-06, "loss": 0.884, "step": 1058 }, { "epoch": 0.02, "learning_rate": 3.3280955373978634e-06, "loss": 1.0178, "step": 1059 }, { "epoch": 0.02, "learning_rate": 3.3312382149591453e-06, "loss": 0.8914, "step": 1060 }, { "epoch": 0.02, "learning_rate": 3.3343808925204276e-06, "loss": 0.947, "step": 1061 }, { "epoch": 0.02, "learning_rate": 3.33752357008171e-06, "loss": 1.185, "step": 1062 }, { "epoch": 0.02, "learning_rate": 3.3406662476429917e-06, "loss": 1.2219, "step": 1063 }, { "epoch": 0.02, "learning_rate": 3.3438089252042744e-06, "loss": 1.0967, "step": 1064 }, { "epoch": 0.02, "learning_rate": 3.3469516027655563e-06, "loss": 1.0479, "step": 1065 }, { "epoch": 0.02, "learning_rate": 3.350094280326839e-06, "loss": 0.8333, "step": 1066 }, { "epoch": 0.02, "learning_rate": 3.353236957888121e-06, "loss": 1.0963, "step": 1067 }, { "epoch": 0.02, "learning_rate": 3.356379635449403e-06, "loss": 0.9581, "step": 1068 }, { "epoch": 0.02, "learning_rate": 3.359522313010685e-06, "loss": 1.0731, "step": 1069 }, { "epoch": 0.02, "learning_rate": 3.3626649905719677e-06, "loss": 0.9464, "step": 1070 }, { "epoch": 0.02, "learning_rate": 3.3658076681332496e-06, "loss": 0.8357, "step": 1071 }, { "epoch": 0.02, "learning_rate": 3.3689503456945323e-06, "loss": 1.1074, "step": 1072 }, { "epoch": 0.02, "learning_rate": 3.372093023255814e-06, "loss": 0.9188, "step": 1073 }, { "epoch": 0.02, "learning_rate": 3.3752357008170965e-06, "loss": 1.0979, "step": 1074 }, { "epoch": 0.02, "learning_rate": 3.3783783783783788e-06, "loss": 1.2519, "step": 1075 }, { "epoch": 0.02, "learning_rate": 3.381521055939661e-06, "loss": 0.9275, "step": 1076 }, { "epoch": 0.02, "learning_rate": 3.384663733500943e-06, "loss": 1.0352, "step": 1077 }, { "epoch": 0.02, "learning_rate": 3.3878064110622256e-06, "loss": 0.8505, "step": 1078 }, { "epoch": 0.02, "learning_rate": 3.3909490886235075e-06, "loss": 0.8768, "step": 1079 }, { "epoch": 0.02, "learning_rate": 3.39409176618479e-06, "loss": 1.1115, "step": 1080 }, { "epoch": 0.02, "learning_rate": 3.397234443746072e-06, "loss": 1.2176, "step": 1081 }, { "epoch": 0.02, "learning_rate": 3.400377121307354e-06, "loss": 1.0479, "step": 1082 }, { "epoch": 0.02, "learning_rate": 3.4035197988686362e-06, "loss": 1.1724, "step": 1083 }, { "epoch": 0.02, "learning_rate": 3.4066624764299185e-06, "loss": 1.06, "step": 1084 }, { "epoch": 0.02, "learning_rate": 3.409805153991201e-06, "loss": 0.9307, "step": 1085 }, { "epoch": 0.02, "learning_rate": 3.4129478315524827e-06, "loss": 0.9587, "step": 1086 }, { "epoch": 0.02, "learning_rate": 3.4160905091137654e-06, "loss": 1.3348, "step": 1087 }, { "epoch": 0.02, "learning_rate": 3.4192331866750473e-06, "loss": 1.1377, "step": 1088 }, { "epoch": 0.02, "learning_rate": 3.4223758642363296e-06, "loss": 1.1139, "step": 1089 }, { "epoch": 0.02, "learning_rate": 3.425518541797612e-06, "loss": 0.9144, "step": 1090 }, { "epoch": 0.02, "learning_rate": 3.428661219358894e-06, "loss": 0.9709, "step": 1091 }, { "epoch": 0.02, "learning_rate": 3.431803896920176e-06, "loss": 0.9905, "step": 1092 }, { "epoch": 0.02, "learning_rate": 3.4349465744814587e-06, "loss": 1.1403, "step": 1093 }, { "epoch": 0.02, "learning_rate": 3.4380892520427406e-06, "loss": 1.1647, "step": 1094 }, { "epoch": 0.02, "learning_rate": 3.4412319296040233e-06, "loss": 0.8234, "step": 1095 }, { "epoch": 0.02, "learning_rate": 3.444374607165305e-06, "loss": 0.8586, "step": 1096 }, { "epoch": 0.02, "learning_rate": 3.4475172847265874e-06, "loss": 0.7595, "step": 1097 }, { "epoch": 0.02, "learning_rate": 3.4506599622878693e-06, "loss": 1.1545, "step": 1098 }, { "epoch": 0.02, "learning_rate": 3.453802639849152e-06, "loss": 1.0396, "step": 1099 }, { "epoch": 0.02, "learning_rate": 3.456945317410434e-06, "loss": 1.0776, "step": 1100 }, { "epoch": 0.02, "learning_rate": 3.4600879949717166e-06, "loss": 1.0026, "step": 1101 }, { "epoch": 0.02, "learning_rate": 3.4632306725329985e-06, "loss": 0.8591, "step": 1102 }, { "epoch": 0.02, "learning_rate": 3.4663733500942808e-06, "loss": 0.8392, "step": 1103 }, { "epoch": 0.02, "learning_rate": 3.4695160276555626e-06, "loss": 1.1372, "step": 1104 }, { "epoch": 0.02, "learning_rate": 3.472658705216845e-06, "loss": 1.0876, "step": 1105 }, { "epoch": 0.02, "learning_rate": 3.475801382778127e-06, "loss": 0.9946, "step": 1106 }, { "epoch": 0.02, "learning_rate": 3.478944060339409e-06, "loss": 0.9143, "step": 1107 }, { "epoch": 0.02, "learning_rate": 3.4820867379006918e-06, "loss": 1.05, "step": 1108 }, { "epoch": 0.02, "learning_rate": 3.4852294154619737e-06, "loss": 0.9235, "step": 1109 }, { "epoch": 0.02, "learning_rate": 3.4883720930232564e-06, "loss": 0.9324, "step": 1110 }, { "epoch": 0.02, "learning_rate": 3.4915147705845382e-06, "loss": 0.9782, "step": 1111 }, { "epoch": 0.02, "learning_rate": 3.4946574481458205e-06, "loss": 1.1019, "step": 1112 }, { "epoch": 0.02, "learning_rate": 3.4978001257071024e-06, "loss": 1.1354, "step": 1113 }, { "epoch": 0.02, "learning_rate": 3.500942803268385e-06, "loss": 0.9912, "step": 1114 }, { "epoch": 0.02, "learning_rate": 3.504085480829667e-06, "loss": 1.0467, "step": 1115 }, { "epoch": 0.02, "learning_rate": 3.5072281583909497e-06, "loss": 0.9937, "step": 1116 }, { "epoch": 0.02, "learning_rate": 3.5103708359522315e-06, "loss": 1.0011, "step": 1117 }, { "epoch": 0.02, "learning_rate": 3.513513513513514e-06, "loss": 1.2918, "step": 1118 }, { "epoch": 0.02, "learning_rate": 3.516656191074796e-06, "loss": 1.0775, "step": 1119 }, { "epoch": 0.02, "learning_rate": 3.5197988686360784e-06, "loss": 1.1271, "step": 1120 }, { "epoch": 0.02, "learning_rate": 3.5229415461973603e-06, "loss": 0.8724, "step": 1121 }, { "epoch": 0.02, "learning_rate": 3.526084223758643e-06, "loss": 1.0306, "step": 1122 }, { "epoch": 0.02, "learning_rate": 3.529226901319925e-06, "loss": 0.8213, "step": 1123 }, { "epoch": 0.02, "learning_rate": 3.532369578881207e-06, "loss": 1.1176, "step": 1124 }, { "epoch": 0.02, "learning_rate": 3.5355122564424894e-06, "loss": 1.2409, "step": 1125 }, { "epoch": 0.02, "learning_rate": 3.5386549340037713e-06, "loss": 1.142, "step": 1126 }, { "epoch": 0.02, "learning_rate": 3.5417976115650536e-06, "loss": 0.9514, "step": 1127 }, { "epoch": 0.02, "learning_rate": 3.544940289126336e-06, "loss": 1.0151, "step": 1128 }, { "epoch": 0.02, "learning_rate": 3.548082966687618e-06, "loss": 1.0107, "step": 1129 }, { "epoch": 0.02, "learning_rate": 3.5512256442489e-06, "loss": 1.2585, "step": 1130 }, { "epoch": 0.02, "learning_rate": 3.5543683218101828e-06, "loss": 1.1306, "step": 1131 }, { "epoch": 0.02, "learning_rate": 3.5575109993714646e-06, "loss": 1.1857, "step": 1132 }, { "epoch": 0.02, "learning_rate": 3.560653676932747e-06, "loss": 0.8688, "step": 1133 }, { "epoch": 0.02, "learning_rate": 3.563796354494029e-06, "loss": 0.9835, "step": 1134 }, { "epoch": 0.02, "learning_rate": 3.5669390320553115e-06, "loss": 0.9783, "step": 1135 }, { "epoch": 0.02, "learning_rate": 3.5700817096165934e-06, "loss": 1.0313, "step": 1136 }, { "epoch": 0.02, "learning_rate": 3.573224387177876e-06, "loss": 1.4424, "step": 1137 }, { "epoch": 0.02, "learning_rate": 3.576367064739158e-06, "loss": 1.0933, "step": 1138 }, { "epoch": 0.02, "learning_rate": 3.5795097423004406e-06, "loss": 0.6948, "step": 1139 }, { "epoch": 0.02, "learning_rate": 3.5826524198617225e-06, "loss": 0.7765, "step": 1140 }, { "epoch": 0.02, "learning_rate": 3.585795097423005e-06, "loss": 0.9289, "step": 1141 }, { "epoch": 0.02, "learning_rate": 3.5889377749842867e-06, "loss": 0.9473, "step": 1142 }, { "epoch": 0.02, "learning_rate": 3.5920804525455694e-06, "loss": 1.1589, "step": 1143 }, { "epoch": 0.02, "learning_rate": 3.5952231301068512e-06, "loss": 1.2322, "step": 1144 }, { "epoch": 0.02, "learning_rate": 3.598365807668134e-06, "loss": 0.9318, "step": 1145 }, { "epoch": 0.02, "learning_rate": 3.601508485229416e-06, "loss": 0.8476, "step": 1146 }, { "epoch": 0.02, "learning_rate": 3.6046511627906977e-06, "loss": 0.7603, "step": 1147 }, { "epoch": 0.02, "learning_rate": 3.6077938403519804e-06, "loss": 0.9872, "step": 1148 }, { "epoch": 0.02, "learning_rate": 3.6109365179132623e-06, "loss": 1.1002, "step": 1149 }, { "epoch": 0.02, "learning_rate": 3.6140791954745446e-06, "loss": 1.2755, "step": 1150 }, { "epoch": 0.02, "learning_rate": 3.6172218730358264e-06, "loss": 0.8575, "step": 1151 }, { "epoch": 0.02, "learning_rate": 3.620364550597109e-06, "loss": 0.9085, "step": 1152 }, { "epoch": 0.02, "learning_rate": 3.623507228158391e-06, "loss": 1.0162, "step": 1153 }, { "epoch": 0.02, "learning_rate": 3.6266499057196737e-06, "loss": 1.0536, "step": 1154 }, { "epoch": 0.02, "learning_rate": 3.6297925832809556e-06, "loss": 1.0197, "step": 1155 }, { "epoch": 0.02, "learning_rate": 3.632935260842238e-06, "loss": 1.2963, "step": 1156 }, { "epoch": 0.02, "learning_rate": 3.63607793840352e-06, "loss": 0.9318, "step": 1157 }, { "epoch": 0.02, "learning_rate": 3.6392206159648025e-06, "loss": 0.9866, "step": 1158 }, { "epoch": 0.02, "learning_rate": 3.6423632935260843e-06, "loss": 1.0841, "step": 1159 }, { "epoch": 0.02, "learning_rate": 3.645505971087367e-06, "loss": 0.9879, "step": 1160 }, { "epoch": 0.02, "learning_rate": 3.648648648648649e-06, "loss": 0.986, "step": 1161 }, { "epoch": 0.02, "learning_rate": 3.651791326209931e-06, "loss": 1.2317, "step": 1162 }, { "epoch": 0.02, "learning_rate": 3.6549340037712135e-06, "loss": 1.1354, "step": 1163 }, { "epoch": 0.02, "learning_rate": 3.6580766813324958e-06, "loss": 0.9642, "step": 1164 }, { "epoch": 0.02, "learning_rate": 3.6612193588937776e-06, "loss": 0.939, "step": 1165 }, { "epoch": 0.02, "learning_rate": 3.6643620364550603e-06, "loss": 0.9194, "step": 1166 }, { "epoch": 0.02, "learning_rate": 3.6675047140163422e-06, "loss": 0.8751, "step": 1167 }, { "epoch": 0.02, "learning_rate": 3.670647391577624e-06, "loss": 1.1298, "step": 1168 }, { "epoch": 0.02, "learning_rate": 3.673790069138907e-06, "loss": 1.3204, "step": 1169 }, { "epoch": 0.02, "learning_rate": 3.6769327467001887e-06, "loss": 0.9332, "step": 1170 }, { "epoch": 0.02, "learning_rate": 3.680075424261471e-06, "loss": 0.9858, "step": 1171 }, { "epoch": 0.02, "learning_rate": 3.6832181018227532e-06, "loss": 1.0721, "step": 1172 }, { "epoch": 0.02, "learning_rate": 3.6863607793840355e-06, "loss": 1.0458, "step": 1173 }, { "epoch": 0.02, "learning_rate": 3.6895034569453174e-06, "loss": 1.075, "step": 1174 }, { "epoch": 0.02, "learning_rate": 3.6926461345066e-06, "loss": 1.2499, "step": 1175 }, { "epoch": 0.02, "learning_rate": 3.695788812067882e-06, "loss": 0.9758, "step": 1176 }, { "epoch": 0.02, "learning_rate": 3.6989314896291647e-06, "loss": 1.0407, "step": 1177 }, { "epoch": 0.02, "learning_rate": 3.7020741671904466e-06, "loss": 0.9331, "step": 1178 }, { "epoch": 0.02, "learning_rate": 3.705216844751729e-06, "loss": 0.889, "step": 1179 }, { "epoch": 0.02, "learning_rate": 3.7083595223130107e-06, "loss": 1.0607, "step": 1180 }, { "epoch": 0.02, "learning_rate": 3.7115021998742934e-06, "loss": 1.1281, "step": 1181 }, { "epoch": 0.02, "learning_rate": 3.7146448774355753e-06, "loss": 1.0884, "step": 1182 }, { "epoch": 0.02, "learning_rate": 3.717787554996858e-06, "loss": 0.9001, "step": 1183 }, { "epoch": 0.02, "learning_rate": 3.72093023255814e-06, "loss": 0.8062, "step": 1184 }, { "epoch": 0.02, "learning_rate": 3.724072910119422e-06, "loss": 0.9205, "step": 1185 }, { "epoch": 0.02, "learning_rate": 3.7272155876807044e-06, "loss": 1.0683, "step": 1186 }, { "epoch": 0.02, "learning_rate": 3.7303582652419867e-06, "loss": 1.2518, "step": 1187 }, { "epoch": 0.02, "learning_rate": 3.7335009428032686e-06, "loss": 1.0663, "step": 1188 }, { "epoch": 0.02, "learning_rate": 3.7366436203645505e-06, "loss": 1.0815, "step": 1189 }, { "epoch": 0.02, "learning_rate": 3.739786297925833e-06, "loss": 0.9232, "step": 1190 }, { "epoch": 0.02, "learning_rate": 3.742928975487115e-06, "loss": 1.0609, "step": 1191 }, { "epoch": 0.02, "learning_rate": 3.7460716530483978e-06, "loss": 0.9397, "step": 1192 }, { "epoch": 0.02, "learning_rate": 3.7492143306096796e-06, "loss": 1.0292, "step": 1193 }, { "epoch": 0.02, "learning_rate": 3.752357008170962e-06, "loss": 1.1144, "step": 1194 }, { "epoch": 0.02, "learning_rate": 3.7554996857322438e-06, "loss": 0.7596, "step": 1195 }, { "epoch": 0.02, "learning_rate": 3.7586423632935265e-06, "loss": 1.0623, "step": 1196 }, { "epoch": 0.02, "learning_rate": 3.7617850408548084e-06, "loss": 1.025, "step": 1197 }, { "epoch": 0.02, "learning_rate": 3.764927718416091e-06, "loss": 0.9139, "step": 1198 }, { "epoch": 0.02, "learning_rate": 3.768070395977373e-06, "loss": 1.1852, "step": 1199 }, { "epoch": 0.02, "learning_rate": 3.7712130735386552e-06, "loss": 1.2761, "step": 1200 }, { "epoch": 0.02, "learning_rate": 3.7743557510999375e-06, "loss": 0.9276, "step": 1201 }, { "epoch": 0.02, "learning_rate": 3.77749842866122e-06, "loss": 1.0629, "step": 1202 }, { "epoch": 0.02, "learning_rate": 3.7806411062225017e-06, "loss": 0.9772, "step": 1203 }, { "epoch": 0.02, "learning_rate": 3.7837837837837844e-06, "loss": 0.8982, "step": 1204 }, { "epoch": 0.02, "learning_rate": 3.7869264613450663e-06, "loss": 1.1729, "step": 1205 }, { "epoch": 0.02, "learning_rate": 3.7900691389063485e-06, "loss": 1.1099, "step": 1206 }, { "epoch": 0.02, "learning_rate": 3.793211816467631e-06, "loss": 1.0301, "step": 1207 }, { "epoch": 0.02, "learning_rate": 3.796354494028913e-06, "loss": 0.8629, "step": 1208 }, { "epoch": 0.02, "learning_rate": 3.799497171590195e-06, "loss": 1.0325, "step": 1209 }, { "epoch": 0.02, "learning_rate": 3.8026398491514773e-06, "loss": 1.0541, "step": 1210 }, { "epoch": 0.02, "learning_rate": 3.8057825267127596e-06, "loss": 0.9384, "step": 1211 }, { "epoch": 0.02, "learning_rate": 3.8089252042740414e-06, "loss": 1.1, "step": 1212 }, { "epoch": 0.02, "learning_rate": 3.812067881835324e-06, "loss": 1.1032, "step": 1213 }, { "epoch": 0.02, "learning_rate": 3.815210559396606e-06, "loss": 0.9888, "step": 1214 }, { "epoch": 0.02, "learning_rate": 3.818353236957888e-06, "loss": 1.0165, "step": 1215 }, { "epoch": 0.02, "learning_rate": 3.82149591451917e-06, "loss": 0.9853, "step": 1216 }, { "epoch": 0.02, "learning_rate": 3.824638592080453e-06, "loss": 1.1058, "step": 1217 }, { "epoch": 0.02, "learning_rate": 3.827781269641735e-06, "loss": 0.9286, "step": 1218 }, { "epoch": 0.02, "learning_rate": 3.8309239472030175e-06, "loss": 1.0659, "step": 1219 }, { "epoch": 0.02, "learning_rate": 3.834066624764299e-06, "loss": 0.8148, "step": 1220 }, { "epoch": 0.02, "learning_rate": 3.837209302325582e-06, "loss": 0.9024, "step": 1221 }, { "epoch": 0.02, "learning_rate": 3.840351979886864e-06, "loss": 0.9862, "step": 1222 }, { "epoch": 0.02, "learning_rate": 3.843494657448147e-06, "loss": 0.8725, "step": 1223 }, { "epoch": 0.02, "learning_rate": 3.8466373350094285e-06, "loss": 0.9724, "step": 1224 }, { "epoch": 0.02, "learning_rate": 3.84978001257071e-06, "loss": 1.1994, "step": 1225 }, { "epoch": 0.02, "learning_rate": 3.852922690131993e-06, "loss": 0.9567, "step": 1226 }, { "epoch": 0.02, "learning_rate": 3.856065367693275e-06, "loss": 0.8817, "step": 1227 }, { "epoch": 0.02, "learning_rate": 3.859208045254557e-06, "loss": 0.83, "step": 1228 }, { "epoch": 0.02, "learning_rate": 3.8623507228158395e-06, "loss": 0.9802, "step": 1229 }, { "epoch": 0.02, "learning_rate": 3.865493400377121e-06, "loss": 1.0024, "step": 1230 }, { "epoch": 0.02, "learning_rate": 3.868636077938403e-06, "loss": 1.1985, "step": 1231 }, { "epoch": 0.02, "learning_rate": 3.871778755499686e-06, "loss": 1.0292, "step": 1232 }, { "epoch": 0.02, "learning_rate": 3.874921433060968e-06, "loss": 0.8531, "step": 1233 }, { "epoch": 0.02, "learning_rate": 3.8780641106222505e-06, "loss": 1.1031, "step": 1234 }, { "epoch": 0.02, "learning_rate": 3.881206788183532e-06, "loss": 0.7761, "step": 1235 }, { "epoch": 0.02, "learning_rate": 3.884349465744815e-06, "loss": 1.0161, "step": 1236 }, { "epoch": 0.02, "learning_rate": 3.887492143306097e-06, "loss": 1.0394, "step": 1237 }, { "epoch": 0.02, "learning_rate": 3.89063482086738e-06, "loss": 1.3003, "step": 1238 }, { "epoch": 0.02, "learning_rate": 3.8937774984286616e-06, "loss": 1.0949, "step": 1239 }, { "epoch": 0.02, "learning_rate": 3.896920175989944e-06, "loss": 1.0266, "step": 1240 }, { "epoch": 0.02, "learning_rate": 3.900062853551226e-06, "loss": 0.94, "step": 1241 }, { "epoch": 0.02, "learning_rate": 3.903205531112508e-06, "loss": 1.0183, "step": 1242 }, { "epoch": 0.02, "learning_rate": 3.90634820867379e-06, "loss": 1.0817, "step": 1243 }, { "epoch": 0.02, "learning_rate": 3.909490886235073e-06, "loss": 1.0258, "step": 1244 }, { "epoch": 0.02, "learning_rate": 3.9126335637963545e-06, "loss": 1.0276, "step": 1245 }, { "epoch": 0.02, "learning_rate": 3.915776241357637e-06, "loss": 0.9888, "step": 1246 }, { "epoch": 0.02, "learning_rate": 3.918918918918919e-06, "loss": 0.9427, "step": 1247 }, { "epoch": 0.02, "learning_rate": 3.922061596480202e-06, "loss": 0.8777, "step": 1248 }, { "epoch": 0.02, "learning_rate": 3.925204274041484e-06, "loss": 1.1135, "step": 1249 }, { "epoch": 0.02, "learning_rate": 3.928346951602766e-06, "loss": 1.3011, "step": 1250 }, { "epoch": 0.02, "learning_rate": 3.931489629164048e-06, "loss": 0.94, "step": 1251 }, { "epoch": 0.02, "learning_rate": 3.93463230672533e-06, "loss": 1.0527, "step": 1252 }, { "epoch": 0.02, "learning_rate": 3.937774984286613e-06, "loss": 0.9912, "step": 1253 }, { "epoch": 0.02, "learning_rate": 3.940917661847895e-06, "loss": 0.9211, "step": 1254 }, { "epoch": 0.02, "learning_rate": 3.944060339409177e-06, "loss": 1.0936, "step": 1255 }, { "epoch": 0.02, "learning_rate": 3.947203016970459e-06, "loss": 0.8951, "step": 1256 }, { "epoch": 0.02, "learning_rate": 3.950345694531741e-06, "loss": 0.9944, "step": 1257 }, { "epoch": 0.02, "learning_rate": 3.953488372093024e-06, "loss": 0.9391, "step": 1258 }, { "epoch": 0.02, "learning_rate": 3.956631049654306e-06, "loss": 1.0585, "step": 1259 }, { "epoch": 0.02, "learning_rate": 3.9597737272155875e-06, "loss": 0.8704, "step": 1260 }, { "epoch": 0.02, "learning_rate": 3.96291640477687e-06, "loss": 1.1075, "step": 1261 }, { "epoch": 0.02, "learning_rate": 3.966059082338152e-06, "loss": 1.2667, "step": 1262 }, { "epoch": 0.02, "learning_rate": 3.969201759899435e-06, "loss": 1.0735, "step": 1263 }, { "epoch": 0.02, "learning_rate": 3.972344437460717e-06, "loss": 0.9244, "step": 1264 }, { "epoch": 0.02, "learning_rate": 3.975487115021999e-06, "loss": 1.0746, "step": 1265 }, { "epoch": 0.02, "learning_rate": 3.978629792583281e-06, "loss": 0.8811, "step": 1266 }, { "epoch": 0.02, "learning_rate": 3.981772470144564e-06, "loss": 0.9545, "step": 1267 }, { "epoch": 0.02, "learning_rate": 3.984915147705846e-06, "loss": 0.9918, "step": 1268 }, { "epoch": 0.02, "learning_rate": 3.9880578252671286e-06, "loss": 1.0527, "step": 1269 }, { "epoch": 0.02, "learning_rate": 3.9912005028284104e-06, "loss": 1.0572, "step": 1270 }, { "epoch": 0.02, "learning_rate": 3.994343180389692e-06, "loss": 0.9083, "step": 1271 }, { "epoch": 0.02, "learning_rate": 3.997485857950974e-06, "loss": 1.0255, "step": 1272 }, { "epoch": 0.02, "learning_rate": 4.000628535512257e-06, "loss": 0.9365, "step": 1273 }, { "epoch": 0.02, "learning_rate": 4.003771213073539e-06, "loss": 1.327, "step": 1274 }, { "epoch": 0.02, "learning_rate": 4.006913890634821e-06, "loss": 1.2933, "step": 1275 }, { "epoch": 0.02, "learning_rate": 4.010056568196103e-06, "loss": 1.0406, "step": 1276 }, { "epoch": 0.02, "learning_rate": 4.013199245757385e-06, "loss": 0.9635, "step": 1277 }, { "epoch": 0.02, "learning_rate": 4.016341923318668e-06, "loss": 1.0059, "step": 1278 }, { "epoch": 0.02, "learning_rate": 4.01948460087995e-06, "loss": 1.0276, "step": 1279 }, { "epoch": 0.02, "learning_rate": 4.0226272784412325e-06, "loss": 0.9859, "step": 1280 }, { "epoch": 0.02, "learning_rate": 4.025769956002514e-06, "loss": 1.1519, "step": 1281 }, { "epoch": 0.02, "learning_rate": 4.028912633563797e-06, "loss": 0.9166, "step": 1282 }, { "epoch": 0.02, "learning_rate": 4.032055311125079e-06, "loss": 0.7724, "step": 1283 }, { "epoch": 0.02, "learning_rate": 4.035197988686362e-06, "loss": 1.0593, "step": 1284 }, { "epoch": 0.02, "learning_rate": 4.0383406662476435e-06, "loss": 1.0483, "step": 1285 }, { "epoch": 0.02, "learning_rate": 4.041483343808925e-06, "loss": 0.9945, "step": 1286 }, { "epoch": 0.02, "learning_rate": 4.044626021370208e-06, "loss": 1.2028, "step": 1287 }, { "epoch": 0.02, "learning_rate": 4.04776869893149e-06, "loss": 0.9684, "step": 1288 }, { "epoch": 0.02, "learning_rate": 4.050911376492772e-06, "loss": 0.8807, "step": 1289 }, { "epoch": 0.02, "learning_rate": 4.0540540540540545e-06, "loss": 0.7938, "step": 1290 }, { "epoch": 0.02, "learning_rate": 4.057196731615336e-06, "loss": 1.0113, "step": 1291 }, { "epoch": 0.02, "learning_rate": 4.060339409176619e-06, "loss": 1.0113, "step": 1292 }, { "epoch": 0.02, "learning_rate": 4.063482086737901e-06, "loss": 1.1227, "step": 1293 }, { "epoch": 0.02, "learning_rate": 4.066624764299184e-06, "loss": 1.1014, "step": 1294 }, { "epoch": 0.02, "learning_rate": 4.0697674418604655e-06, "loss": 0.7982, "step": 1295 }, { "epoch": 0.02, "learning_rate": 4.072910119421747e-06, "loss": 1.1558, "step": 1296 }, { "epoch": 0.02, "learning_rate": 4.07605279698303e-06, "loss": 0.9053, "step": 1297 }, { "epoch": 0.02, "learning_rate": 4.079195474544312e-06, "loss": 0.9432, "step": 1298 }, { "epoch": 0.02, "learning_rate": 4.082338152105595e-06, "loss": 1.1534, "step": 1299 }, { "epoch": 0.02, "learning_rate": 4.0854808296668766e-06, "loss": 1.2768, "step": 1300 }, { "epoch": 0.02, "learning_rate": 4.0886235072281584e-06, "loss": 0.9742, "step": 1301 }, { "epoch": 0.02, "learning_rate": 4.091766184789441e-06, "loss": 0.7272, "step": 1302 }, { "epoch": 0.02, "learning_rate": 4.094908862350723e-06, "loss": 1.0057, "step": 1303 }, { "epoch": 0.02, "learning_rate": 4.098051539912005e-06, "loss": 0.8776, "step": 1304 }, { "epoch": 0.02, "learning_rate": 4.101194217473288e-06, "loss": 1.0333, "step": 1305 }, { "epoch": 0.02, "learning_rate": 4.1043368950345695e-06, "loss": 1.0889, "step": 1306 }, { "epoch": 0.02, "learning_rate": 4.107479572595852e-06, "loss": 1.1345, "step": 1307 }, { "epoch": 0.02, "learning_rate": 4.110622250157134e-06, "loss": 0.8659, "step": 1308 }, { "epoch": 0.02, "learning_rate": 4.113764927718417e-06, "loss": 1.007, "step": 1309 }, { "epoch": 0.02, "learning_rate": 4.116907605279699e-06, "loss": 0.9398, "step": 1310 }, { "epoch": 0.02, "learning_rate": 4.120050282840981e-06, "loss": 1.1082, "step": 1311 }, { "epoch": 0.02, "learning_rate": 4.123192960402263e-06, "loss": 1.0757, "step": 1312 }, { "epoch": 0.02, "learning_rate": 4.126335637963546e-06, "loss": 1.0505, "step": 1313 }, { "epoch": 0.02, "learning_rate": 4.129478315524828e-06, "loss": 0.9461, "step": 1314 }, { "epoch": 0.02, "learning_rate": 4.13262099308611e-06, "loss": 1.0228, "step": 1315 }, { "epoch": 0.02, "learning_rate": 4.1357636706473915e-06, "loss": 0.9148, "step": 1316 }, { "epoch": 0.02, "learning_rate": 4.138906348208674e-06, "loss": 1.1581, "step": 1317 }, { "epoch": 0.02, "learning_rate": 4.142049025769956e-06, "loss": 1.1727, "step": 1318 }, { "epoch": 0.02, "learning_rate": 4.145191703331238e-06, "loss": 1.3271, "step": 1319 }, { "epoch": 0.02, "learning_rate": 4.148334380892521e-06, "loss": 0.7784, "step": 1320 }, { "epoch": 0.02, "learning_rate": 4.1514770584538025e-06, "loss": 1.1455, "step": 1321 }, { "epoch": 0.02, "learning_rate": 4.154619736015085e-06, "loss": 0.9324, "step": 1322 }, { "epoch": 0.02, "learning_rate": 4.157762413576367e-06, "loss": 0.8215, "step": 1323 }, { "epoch": 0.02, "learning_rate": 4.16090509113765e-06, "loss": 1.0871, "step": 1324 }, { "epoch": 0.02, "learning_rate": 4.164047768698932e-06, "loss": 1.2698, "step": 1325 }, { "epoch": 0.03, "learning_rate": 4.167190446260214e-06, "loss": 1.0295, "step": 1326 }, { "epoch": 0.03, "learning_rate": 4.170333123821496e-06, "loss": 0.9087, "step": 1327 }, { "epoch": 0.03, "learning_rate": 4.173475801382779e-06, "loss": 1.002, "step": 1328 }, { "epoch": 0.03, "learning_rate": 4.176618478944061e-06, "loss": 0.7862, "step": 1329 }, { "epoch": 0.03, "learning_rate": 4.179761156505343e-06, "loss": 0.9819, "step": 1330 }, { "epoch": 0.03, "learning_rate": 4.1829038340666254e-06, "loss": 1.2725, "step": 1331 }, { "epoch": 0.03, "learning_rate": 4.186046511627907e-06, "loss": 0.9578, "step": 1332 }, { "epoch": 0.03, "learning_rate": 4.189189189189189e-06, "loss": 1.0571, "step": 1333 }, { "epoch": 0.03, "learning_rate": 4.192331866750472e-06, "loss": 1.0402, "step": 1334 }, { "epoch": 0.03, "learning_rate": 4.195474544311754e-06, "loss": 0.9371, "step": 1335 }, { "epoch": 0.03, "learning_rate": 4.1986172218730365e-06, "loss": 1.0114, "step": 1336 }, { "epoch": 0.03, "learning_rate": 4.201759899434318e-06, "loss": 1.1327, "step": 1337 }, { "epoch": 0.03, "learning_rate": 4.2049025769956e-06, "loss": 1.3134, "step": 1338 }, { "epoch": 0.03, "learning_rate": 4.208045254556883e-06, "loss": 0.8463, "step": 1339 }, { "epoch": 0.03, "learning_rate": 4.211187932118165e-06, "loss": 0.9515, "step": 1340 }, { "epoch": 0.03, "learning_rate": 4.2143306096794475e-06, "loss": 0.9142, "step": 1341 }, { "epoch": 0.03, "learning_rate": 4.217473287240729e-06, "loss": 1.0489, "step": 1342 }, { "epoch": 0.03, "learning_rate": 4.220615964802012e-06, "loss": 1.2374, "step": 1343 }, { "epoch": 0.03, "learning_rate": 4.223758642363294e-06, "loss": 1.2231, "step": 1344 }, { "epoch": 0.03, "learning_rate": 4.226901319924576e-06, "loss": 0.9299, "step": 1345 }, { "epoch": 0.03, "learning_rate": 4.2300439974858585e-06, "loss": 0.9038, "step": 1346 }, { "epoch": 0.03, "learning_rate": 4.23318667504714e-06, "loss": 0.9694, "step": 1347 }, { "epoch": 0.03, "learning_rate": 4.236329352608422e-06, "loss": 0.8934, "step": 1348 }, { "epoch": 0.03, "learning_rate": 4.239472030169705e-06, "loss": 1.2328, "step": 1349 }, { "epoch": 0.03, "learning_rate": 4.242614707730987e-06, "loss": 1.0937, "step": 1350 }, { "epoch": 0.03, "learning_rate": 4.2457573852922695e-06, "loss": 0.8896, "step": 1351 }, { "epoch": 0.03, "learning_rate": 4.248900062853551e-06, "loss": 0.8799, "step": 1352 }, { "epoch": 0.03, "learning_rate": 4.252042740414834e-06, "loss": 0.8619, "step": 1353 }, { "epoch": 0.03, "learning_rate": 4.255185417976116e-06, "loss": 1.007, "step": 1354 }, { "epoch": 0.03, "learning_rate": 4.258328095537399e-06, "loss": 1.0529, "step": 1355 }, { "epoch": 0.03, "learning_rate": 4.2614707730986806e-06, "loss": 1.1018, "step": 1356 }, { "epoch": 0.03, "learning_rate": 4.264613450659963e-06, "loss": 1.1381, "step": 1357 }, { "epoch": 0.03, "learning_rate": 4.267756128221245e-06, "loss": 0.9441, "step": 1358 }, { "epoch": 0.03, "learning_rate": 4.270898805782527e-06, "loss": 0.9573, "step": 1359 }, { "epoch": 0.03, "learning_rate": 4.27404148334381e-06, "loss": 0.7575, "step": 1360 }, { "epoch": 0.03, "learning_rate": 4.277184160905092e-06, "loss": 1.0319, "step": 1361 }, { "epoch": 0.03, "learning_rate": 4.2803268384663734e-06, "loss": 1.2633, "step": 1362 }, { "epoch": 0.03, "learning_rate": 4.283469516027655e-06, "loss": 1.1516, "step": 1363 }, { "epoch": 0.03, "learning_rate": 4.286612193588938e-06, "loss": 0.7985, "step": 1364 }, { "epoch": 0.03, "learning_rate": 4.28975487115022e-06, "loss": 0.7659, "step": 1365 }, { "epoch": 0.03, "learning_rate": 4.292897548711503e-06, "loss": 0.9211, "step": 1366 }, { "epoch": 0.03, "learning_rate": 4.2960402262727845e-06, "loss": 0.9012, "step": 1367 }, { "epoch": 0.03, "learning_rate": 4.299182903834067e-06, "loss": 1.124, "step": 1368 }, { "epoch": 0.03, "learning_rate": 4.302325581395349e-06, "loss": 1.1323, "step": 1369 }, { "epoch": 0.03, "learning_rate": 4.305468258956632e-06, "loss": 0.9235, "step": 1370 }, { "epoch": 0.03, "learning_rate": 4.308610936517914e-06, "loss": 0.9207, "step": 1371 }, { "epoch": 0.03, "learning_rate": 4.311753614079196e-06, "loss": 0.8451, "step": 1372 }, { "epoch": 0.03, "learning_rate": 4.314896291640478e-06, "loss": 0.9451, "step": 1373 }, { "epoch": 0.03, "learning_rate": 4.31803896920176e-06, "loss": 1.1654, "step": 1374 }, { "epoch": 0.03, "learning_rate": 4.321181646763043e-06, "loss": 1.1489, "step": 1375 }, { "epoch": 0.03, "learning_rate": 4.324324324324325e-06, "loss": 0.8658, "step": 1376 }, { "epoch": 0.03, "learning_rate": 4.3274670018856065e-06, "loss": 0.9703, "step": 1377 }, { "epoch": 0.03, "learning_rate": 4.330609679446889e-06, "loss": 1.1593, "step": 1378 }, { "epoch": 0.03, "learning_rate": 4.333752357008171e-06, "loss": 1.0432, "step": 1379 }, { "epoch": 0.03, "learning_rate": 4.336895034569453e-06, "loss": 1.0425, "step": 1380 }, { "epoch": 0.03, "learning_rate": 4.340037712130736e-06, "loss": 1.0761, "step": 1381 }, { "epoch": 0.03, "learning_rate": 4.3431803896920175e-06, "loss": 1.2067, "step": 1382 }, { "epoch": 0.03, "learning_rate": 4.3463230672533e-06, "loss": 0.8131, "step": 1383 }, { "epoch": 0.03, "learning_rate": 4.349465744814582e-06, "loss": 0.9924, "step": 1384 }, { "epoch": 0.03, "learning_rate": 4.352608422375865e-06, "loss": 0.9048, "step": 1385 }, { "epoch": 0.03, "learning_rate": 4.355751099937147e-06, "loss": 0.9923, "step": 1386 }, { "epoch": 0.03, "learning_rate": 4.358893777498429e-06, "loss": 1.017, "step": 1387 }, { "epoch": 0.03, "learning_rate": 4.362036455059711e-06, "loss": 1.1425, "step": 1388 }, { "epoch": 0.03, "learning_rate": 4.365179132620994e-06, "loss": 0.8184, "step": 1389 }, { "epoch": 0.03, "learning_rate": 4.368321810182276e-06, "loss": 0.9193, "step": 1390 }, { "epoch": 0.03, "learning_rate": 4.371464487743558e-06, "loss": 0.8987, "step": 1391 }, { "epoch": 0.03, "learning_rate": 4.37460716530484e-06, "loss": 0.9332, "step": 1392 }, { "epoch": 0.03, "learning_rate": 4.377749842866122e-06, "loss": 0.9365, "step": 1393 }, { "epoch": 0.03, "learning_rate": 4.380892520427404e-06, "loss": 1.3259, "step": 1394 }, { "epoch": 0.03, "learning_rate": 4.384035197988687e-06, "loss": 1.0312, "step": 1395 }, { "epoch": 0.03, "learning_rate": 4.387177875549969e-06, "loss": 0.9489, "step": 1396 }, { "epoch": 0.03, "learning_rate": 4.3903205531112515e-06, "loss": 0.8973, "step": 1397 }, { "epoch": 0.03, "learning_rate": 4.393463230672533e-06, "loss": 0.9067, "step": 1398 }, { "epoch": 0.03, "learning_rate": 4.396605908233816e-06, "loss": 1.0388, "step": 1399 }, { "epoch": 0.03, "learning_rate": 4.399748585795098e-06, "loss": 1.1964, "step": 1400 }, { "epoch": 0.03, "learning_rate": 4.40289126335638e-06, "loss": 0.9374, "step": 1401 }, { "epoch": 0.03, "learning_rate": 4.4060339409176625e-06, "loss": 0.7857, "step": 1402 }, { "epoch": 0.03, "learning_rate": 4.409176618478944e-06, "loss": 1.0397, "step": 1403 }, { "epoch": 0.03, "learning_rate": 4.412319296040227e-06, "loss": 0.9763, "step": 1404 }, { "epoch": 0.03, "learning_rate": 4.415461973601509e-06, "loss": 0.986, "step": 1405 }, { "epoch": 0.03, "learning_rate": 4.418604651162791e-06, "loss": 1.1385, "step": 1406 }, { "epoch": 0.03, "learning_rate": 4.421747328724073e-06, "loss": 1.0836, "step": 1407 }, { "epoch": 0.03, "learning_rate": 4.424890006285355e-06, "loss": 1.1028, "step": 1408 }, { "epoch": 0.03, "learning_rate": 4.428032683846637e-06, "loss": 0.9783, "step": 1409 }, { "epoch": 0.03, "learning_rate": 4.43117536140792e-06, "loss": 0.8911, "step": 1410 }, { "epoch": 0.03, "learning_rate": 4.434318038969202e-06, "loss": 0.9558, "step": 1411 }, { "epoch": 0.03, "learning_rate": 4.4374607165304845e-06, "loss": 1.1379, "step": 1412 }, { "epoch": 0.03, "learning_rate": 4.440603394091766e-06, "loss": 1.2212, "step": 1413 }, { "epoch": 0.03, "learning_rate": 4.443746071653049e-06, "loss": 0.8972, "step": 1414 }, { "epoch": 0.03, "learning_rate": 4.446888749214331e-06, "loss": 0.7976, "step": 1415 }, { "epoch": 0.03, "learning_rate": 4.450031426775614e-06, "loss": 0.9966, "step": 1416 }, { "epoch": 0.03, "learning_rate": 4.4531741043368956e-06, "loss": 0.9464, "step": 1417 }, { "epoch": 0.03, "learning_rate": 4.4563167818981774e-06, "loss": 1.0117, "step": 1418 }, { "epoch": 0.03, "learning_rate": 4.45945945945946e-06, "loss": 1.2591, "step": 1419 }, { "epoch": 0.03, "learning_rate": 4.462602137020742e-06, "loss": 0.8933, "step": 1420 }, { "epoch": 0.03, "learning_rate": 4.465744814582024e-06, "loss": 0.8892, "step": 1421 }, { "epoch": 0.03, "learning_rate": 4.468887492143307e-06, "loss": 1.1658, "step": 1422 }, { "epoch": 0.03, "learning_rate": 4.4720301697045885e-06, "loss": 1.1083, "step": 1423 }, { "epoch": 0.03, "learning_rate": 4.47517284726587e-06, "loss": 0.8931, "step": 1424 }, { "epoch": 0.03, "learning_rate": 4.478315524827153e-06, "loss": 1.231, "step": 1425 }, { "epoch": 0.03, "learning_rate": 4.481458202388435e-06, "loss": 1.142, "step": 1426 }, { "epoch": 0.03, "learning_rate": 4.484600879949718e-06, "loss": 0.6625, "step": 1427 }, { "epoch": 0.03, "learning_rate": 4.4877435575109995e-06, "loss": 0.9799, "step": 1428 }, { "epoch": 0.03, "learning_rate": 4.490886235072282e-06, "loss": 1.0215, "step": 1429 }, { "epoch": 0.03, "learning_rate": 4.494028912633564e-06, "loss": 0.9741, "step": 1430 }, { "epoch": 0.03, "learning_rate": 4.497171590194847e-06, "loss": 1.1279, "step": 1431 }, { "epoch": 0.03, "learning_rate": 4.500314267756129e-06, "loss": 0.9953, "step": 1432 }, { "epoch": 0.03, "learning_rate": 4.503456945317411e-06, "loss": 0.7249, "step": 1433 }, { "epoch": 0.03, "learning_rate": 4.506599622878693e-06, "loss": 0.9725, "step": 1434 }, { "epoch": 0.03, "learning_rate": 4.509742300439975e-06, "loss": 1.001, "step": 1435 }, { "epoch": 0.03, "learning_rate": 4.512884978001257e-06, "loss": 1.0327, "step": 1436 }, { "epoch": 0.03, "learning_rate": 4.51602765556254e-06, "loss": 1.1702, "step": 1437 }, { "epoch": 0.03, "learning_rate": 4.5191703331238215e-06, "loss": 0.9439, "step": 1438 }, { "epoch": 0.03, "learning_rate": 4.522313010685104e-06, "loss": 0.9931, "step": 1439 }, { "epoch": 0.03, "learning_rate": 4.525455688246386e-06, "loss": 0.9331, "step": 1440 }, { "epoch": 0.03, "learning_rate": 4.528598365807669e-06, "loss": 0.8726, "step": 1441 }, { "epoch": 0.03, "learning_rate": 4.531741043368951e-06, "loss": 1.0234, "step": 1442 }, { "epoch": 0.03, "learning_rate": 4.5348837209302326e-06, "loss": 1.2224, "step": 1443 }, { "epoch": 0.03, "learning_rate": 4.538026398491515e-06, "loss": 1.2252, "step": 1444 }, { "epoch": 0.03, "learning_rate": 4.541169076052797e-06, "loss": 1.0419, "step": 1445 }, { "epoch": 0.03, "learning_rate": 4.54431175361408e-06, "loss": 1.0157, "step": 1446 }, { "epoch": 0.03, "learning_rate": 4.547454431175362e-06, "loss": 0.9302, "step": 1447 }, { "epoch": 0.03, "learning_rate": 4.5505971087366444e-06, "loss": 0.9778, "step": 1448 }, { "epoch": 0.03, "learning_rate": 4.553739786297926e-06, "loss": 1.4026, "step": 1449 }, { "epoch": 0.03, "learning_rate": 4.556882463859208e-06, "loss": 1.2654, "step": 1450 }, { "epoch": 0.03, "learning_rate": 4.560025141420491e-06, "loss": 1.1558, "step": 1451 }, { "epoch": 0.03, "learning_rate": 4.563167818981773e-06, "loss": 0.9923, "step": 1452 }, { "epoch": 0.03, "learning_rate": 4.566310496543055e-06, "loss": 1.0092, "step": 1453 }, { "epoch": 0.03, "learning_rate": 4.569453174104337e-06, "loss": 0.9649, "step": 1454 }, { "epoch": 0.03, "learning_rate": 4.572595851665619e-06, "loss": 0.7249, "step": 1455 }, { "epoch": 0.03, "learning_rate": 4.575738529226902e-06, "loss": 1.1607, "step": 1456 }, { "epoch": 0.03, "learning_rate": 4.578881206788184e-06, "loss": 0.8123, "step": 1457 }, { "epoch": 0.03, "learning_rate": 4.5820238843494665e-06, "loss": 1.0239, "step": 1458 }, { "epoch": 0.03, "learning_rate": 4.585166561910748e-06, "loss": 1.0264, "step": 1459 }, { "epoch": 0.03, "learning_rate": 4.588309239472031e-06, "loss": 1.0719, "step": 1460 }, { "epoch": 0.03, "learning_rate": 4.591451917033313e-06, "loss": 1.046, "step": 1461 }, { "epoch": 0.03, "learning_rate": 4.594594594594596e-06, "loss": 1.2761, "step": 1462 }, { "epoch": 0.03, "learning_rate": 4.5977372721558775e-06, "loss": 0.9346, "step": 1463 }, { "epoch": 0.03, "learning_rate": 4.600879949717159e-06, "loss": 1.1836, "step": 1464 }, { "epoch": 0.03, "learning_rate": 4.604022627278441e-06, "loss": 0.7466, "step": 1465 }, { "epoch": 0.03, "learning_rate": 4.607165304839724e-06, "loss": 0.9378, "step": 1466 }, { "epoch": 0.03, "learning_rate": 4.610307982401006e-06, "loss": 1.0245, "step": 1467 }, { "epoch": 0.03, "learning_rate": 4.613450659962288e-06, "loss": 1.1527, "step": 1468 }, { "epoch": 0.03, "learning_rate": 4.61659333752357e-06, "loss": 0.95, "step": 1469 }, { "epoch": 0.03, "learning_rate": 4.619736015084852e-06, "loss": 0.9789, "step": 1470 }, { "epoch": 0.03, "learning_rate": 4.622878692646135e-06, "loss": 0.9301, "step": 1471 }, { "epoch": 0.03, "learning_rate": 4.626021370207417e-06, "loss": 0.8643, "step": 1472 }, { "epoch": 0.03, "learning_rate": 4.6291640477686995e-06, "loss": 0.9028, "step": 1473 }, { "epoch": 0.03, "learning_rate": 4.632306725329981e-06, "loss": 1.1351, "step": 1474 }, { "epoch": 0.03, "learning_rate": 4.635449402891264e-06, "loss": 1.2505, "step": 1475 }, { "epoch": 0.03, "learning_rate": 4.638592080452546e-06, "loss": 0.8688, "step": 1476 }, { "epoch": 0.03, "learning_rate": 4.641734758013829e-06, "loss": 0.8701, "step": 1477 }, { "epoch": 0.03, "learning_rate": 4.6448774355751106e-06, "loss": 0.9518, "step": 1478 }, { "epoch": 0.03, "learning_rate": 4.6480201131363924e-06, "loss": 0.7967, "step": 1479 }, { "epoch": 0.03, "learning_rate": 4.651162790697675e-06, "loss": 1.1152, "step": 1480 }, { "epoch": 0.03, "learning_rate": 4.654305468258957e-06, "loss": 1.1196, "step": 1481 }, { "epoch": 0.03, "learning_rate": 4.657448145820239e-06, "loss": 1.0035, "step": 1482 }, { "epoch": 0.03, "learning_rate": 4.660590823381522e-06, "loss": 1.1637, "step": 1483 }, { "epoch": 0.03, "learning_rate": 4.6637335009428035e-06, "loss": 1.1779, "step": 1484 }, { "epoch": 0.03, "learning_rate": 4.666876178504085e-06, "loss": 0.9852, "step": 1485 }, { "epoch": 0.03, "learning_rate": 4.670018856065368e-06, "loss": 1.1404, "step": 1486 }, { "epoch": 0.03, "learning_rate": 4.67316153362665e-06, "loss": 1.3105, "step": 1487 }, { "epoch": 0.03, "learning_rate": 4.676304211187933e-06, "loss": 1.1274, "step": 1488 }, { "epoch": 0.03, "learning_rate": 4.6794468887492145e-06, "loss": 0.9982, "step": 1489 }, { "epoch": 0.03, "learning_rate": 4.682589566310497e-06, "loss": 0.8507, "step": 1490 }, { "epoch": 0.03, "learning_rate": 4.685732243871779e-06, "loss": 1.1374, "step": 1491 }, { "epoch": 0.03, "learning_rate": 4.688874921433062e-06, "loss": 1.0634, "step": 1492 }, { "epoch": 0.03, "learning_rate": 4.692017598994344e-06, "loss": 1.1861, "step": 1493 }, { "epoch": 0.03, "learning_rate": 4.6951602765556255e-06, "loss": 1.0273, "step": 1494 }, { "epoch": 0.03, "learning_rate": 4.698302954116908e-06, "loss": 0.9991, "step": 1495 }, { "epoch": 0.03, "learning_rate": 4.70144563167819e-06, "loss": 0.9584, "step": 1496 }, { "epoch": 0.03, "learning_rate": 4.704588309239472e-06, "loss": 1.176, "step": 1497 }, { "epoch": 0.03, "learning_rate": 4.707730986800755e-06, "loss": 0.9737, "step": 1498 }, { "epoch": 0.03, "learning_rate": 4.7108736643620365e-06, "loss": 0.9615, "step": 1499 }, { "epoch": 0.03, "learning_rate": 4.714016341923319e-06, "loss": 1.1819, "step": 1500 }, { "epoch": 0.03, "learning_rate": 4.717159019484601e-06, "loss": 1.1443, "step": 1501 }, { "epoch": 0.03, "learning_rate": 4.720301697045884e-06, "loss": 0.9321, "step": 1502 }, { "epoch": 0.03, "learning_rate": 4.723444374607166e-06, "loss": 0.749, "step": 1503 }, { "epoch": 0.03, "learning_rate": 4.726587052168448e-06, "loss": 0.9339, "step": 1504 }, { "epoch": 0.03, "learning_rate": 4.72972972972973e-06, "loss": 1.0021, "step": 1505 }, { "epoch": 0.03, "learning_rate": 4.732872407291013e-06, "loss": 1.0067, "step": 1506 }, { "epoch": 0.03, "learning_rate": 4.736015084852295e-06, "loss": 1.0827, "step": 1507 }, { "epoch": 0.03, "learning_rate": 4.739157762413577e-06, "loss": 1.1535, "step": 1508 }, { "epoch": 0.03, "learning_rate": 4.742300439974859e-06, "loss": 1.0161, "step": 1509 }, { "epoch": 0.03, "learning_rate": 4.745443117536141e-06, "loss": 0.9359, "step": 1510 }, { "epoch": 0.03, "learning_rate": 4.748585795097423e-06, "loss": 1.211, "step": 1511 }, { "epoch": 0.03, "learning_rate": 4.751728472658705e-06, "loss": 1.1047, "step": 1512 }, { "epoch": 0.03, "learning_rate": 4.754871150219988e-06, "loss": 0.9033, "step": 1513 }, { "epoch": 0.03, "learning_rate": 4.75801382778127e-06, "loss": 0.6956, "step": 1514 }, { "epoch": 0.03, "learning_rate": 4.761156505342552e-06, "loss": 1.075, "step": 1515 }, { "epoch": 0.03, "learning_rate": 4.764299182903834e-06, "loss": 0.8818, "step": 1516 }, { "epoch": 0.03, "learning_rate": 4.767441860465117e-06, "loss": 1.0526, "step": 1517 }, { "epoch": 0.03, "learning_rate": 4.770584538026399e-06, "loss": 1.0573, "step": 1518 }, { "epoch": 0.03, "learning_rate": 4.7737272155876815e-06, "loss": 1.2299, "step": 1519 }, { "epoch": 0.03, "learning_rate": 4.776869893148963e-06, "loss": 1.1223, "step": 1520 }, { "epoch": 0.03, "learning_rate": 4.780012570710246e-06, "loss": 0.9717, "step": 1521 }, { "epoch": 0.03, "learning_rate": 4.783155248271528e-06, "loss": 0.8892, "step": 1522 }, { "epoch": 0.03, "learning_rate": 4.78629792583281e-06, "loss": 1.0914, "step": 1523 }, { "epoch": 0.03, "learning_rate": 4.7894406033940925e-06, "loss": 1.1879, "step": 1524 }, { "epoch": 0.03, "learning_rate": 4.792583280955374e-06, "loss": 1.0748, "step": 1525 }, { "epoch": 0.03, "learning_rate": 4.795725958516656e-06, "loss": 1.071, "step": 1526 }, { "epoch": 0.03, "learning_rate": 4.798868636077939e-06, "loss": 0.7417, "step": 1527 }, { "epoch": 0.03, "learning_rate": 4.802011313639221e-06, "loss": 0.8862, "step": 1528 }, { "epoch": 0.03, "learning_rate": 4.805153991200503e-06, "loss": 0.9319, "step": 1529 }, { "epoch": 0.03, "learning_rate": 4.808296668761785e-06, "loss": 0.9287, "step": 1530 }, { "epoch": 0.03, "learning_rate": 4.811439346323067e-06, "loss": 1.2853, "step": 1531 }, { "epoch": 0.03, "learning_rate": 4.81458202388435e-06, "loss": 0.9591, "step": 1532 }, { "epoch": 0.03, "learning_rate": 4.817724701445632e-06, "loss": 0.8653, "step": 1533 }, { "epoch": 0.03, "learning_rate": 4.8208673790069146e-06, "loss": 0.9592, "step": 1534 }, { "epoch": 0.03, "learning_rate": 4.8240100565681964e-06, "loss": 0.9463, "step": 1535 }, { "epoch": 0.03, "learning_rate": 4.827152734129479e-06, "loss": 0.978, "step": 1536 }, { "epoch": 0.03, "learning_rate": 4.830295411690761e-06, "loss": 1.1407, "step": 1537 }, { "epoch": 0.03, "learning_rate": 4.833438089252043e-06, "loss": 1.2871, "step": 1538 }, { "epoch": 0.03, "learning_rate": 4.836580766813326e-06, "loss": 0.9311, "step": 1539 }, { "epoch": 0.03, "learning_rate": 4.8397234443746074e-06, "loss": 1.1248, "step": 1540 }, { "epoch": 0.03, "learning_rate": 4.842866121935889e-06, "loss": 0.9875, "step": 1541 }, { "epoch": 0.03, "learning_rate": 4.846008799497172e-06, "loss": 0.9886, "step": 1542 }, { "epoch": 0.03, "learning_rate": 4.849151477058454e-06, "loss": 1.1179, "step": 1543 }, { "epoch": 0.03, "learning_rate": 4.852294154619737e-06, "loss": 1.2452, "step": 1544 }, { "epoch": 0.03, "learning_rate": 4.8554368321810185e-06, "loss": 0.875, "step": 1545 }, { "epoch": 0.03, "learning_rate": 4.858579509742301e-06, "loss": 0.9106, "step": 1546 }, { "epoch": 0.03, "learning_rate": 4.861722187303583e-06, "loss": 0.8013, "step": 1547 }, { "epoch": 0.03, "learning_rate": 4.864864864864866e-06, "loss": 0.9832, "step": 1548 }, { "epoch": 0.03, "learning_rate": 4.868007542426148e-06, "loss": 0.8381, "step": 1549 }, { "epoch": 0.03, "learning_rate": 4.8711502199874295e-06, "loss": 1.1805, "step": 1550 }, { "epoch": 0.03, "learning_rate": 4.874292897548712e-06, "loss": 1.1351, "step": 1551 }, { "epoch": 0.03, "learning_rate": 4.877435575109994e-06, "loss": 0.5865, "step": 1552 }, { "epoch": 0.03, "learning_rate": 4.880578252671277e-06, "loss": 0.8726, "step": 1553 }, { "epoch": 0.03, "learning_rate": 4.883720930232559e-06, "loss": 1.0565, "step": 1554 }, { "epoch": 0.03, "learning_rate": 4.8868636077938405e-06, "loss": 1.06, "step": 1555 }, { "epoch": 0.03, "learning_rate": 4.890006285355122e-06, "loss": 1.2842, "step": 1556 }, { "epoch": 0.03, "learning_rate": 4.893148962916405e-06, "loss": 0.8689, "step": 1557 }, { "epoch": 0.03, "learning_rate": 4.896291640477687e-06, "loss": 0.9763, "step": 1558 }, { "epoch": 0.03, "learning_rate": 4.89943431803897e-06, "loss": 0.863, "step": 1559 }, { "epoch": 0.03, "learning_rate": 4.9025769956002515e-06, "loss": 0.8089, "step": 1560 }, { "epoch": 0.03, "learning_rate": 4.905719673161534e-06, "loss": 1.0579, "step": 1561 }, { "epoch": 0.03, "learning_rate": 4.908862350722816e-06, "loss": 1.0696, "step": 1562 }, { "epoch": 0.03, "learning_rate": 4.912005028284099e-06, "loss": 1.2589, "step": 1563 }, { "epoch": 0.03, "learning_rate": 4.915147705845381e-06, "loss": 0.933, "step": 1564 }, { "epoch": 0.03, "learning_rate": 4.918290383406663e-06, "loss": 1.1069, "step": 1565 }, { "epoch": 0.03, "learning_rate": 4.921433060967945e-06, "loss": 1.027, "step": 1566 }, { "epoch": 0.03, "learning_rate": 4.924575738529227e-06, "loss": 1.0121, "step": 1567 }, { "epoch": 0.03, "learning_rate": 4.92771841609051e-06, "loss": 1.2827, "step": 1568 }, { "epoch": 0.03, "learning_rate": 4.930861093651792e-06, "loss": 1.1112, "step": 1569 }, { "epoch": 0.03, "learning_rate": 4.934003771213074e-06, "loss": 1.0571, "step": 1570 }, { "epoch": 0.03, "learning_rate": 4.937146448774356e-06, "loss": 0.9673, "step": 1571 }, { "epoch": 0.03, "learning_rate": 4.940289126335638e-06, "loss": 1.0016, "step": 1572 }, { "epoch": 0.03, "learning_rate": 4.94343180389692e-06, "loss": 0.9779, "step": 1573 }, { "epoch": 0.03, "learning_rate": 4.946574481458203e-06, "loss": 1.1196, "step": 1574 }, { "epoch": 0.03, "learning_rate": 4.949717159019485e-06, "loss": 1.2184, "step": 1575 }, { "epoch": 0.03, "learning_rate": 4.952859836580767e-06, "loss": 1.1135, "step": 1576 }, { "epoch": 0.03, "learning_rate": 4.956002514142049e-06, "loss": 0.9836, "step": 1577 }, { "epoch": 0.03, "learning_rate": 4.959145191703332e-06, "loss": 0.8796, "step": 1578 }, { "epoch": 0.03, "learning_rate": 4.962287869264614e-06, "loss": 0.9099, "step": 1579 }, { "epoch": 0.03, "learning_rate": 4.9654305468258965e-06, "loss": 0.9687, "step": 1580 }, { "epoch": 0.03, "learning_rate": 4.968573224387178e-06, "loss": 1.333, "step": 1581 }, { "epoch": 0.03, "learning_rate": 4.971715901948461e-06, "loss": 0.9408, "step": 1582 }, { "epoch": 0.03, "learning_rate": 4.974858579509743e-06, "loss": 1.0333, "step": 1583 }, { "epoch": 0.03, "learning_rate": 4.978001257071025e-06, "loss": 1.0742, "step": 1584 }, { "epoch": 0.03, "learning_rate": 4.981143934632307e-06, "loss": 0.9309, "step": 1585 }, { "epoch": 0.03, "learning_rate": 4.984286612193589e-06, "loss": 0.9882, "step": 1586 }, { "epoch": 0.03, "learning_rate": 4.987429289754871e-06, "loss": 1.1993, "step": 1587 }, { "epoch": 0.03, "learning_rate": 4.990571967316154e-06, "loss": 1.1161, "step": 1588 }, { "epoch": 0.03, "learning_rate": 4.993714644877436e-06, "loss": 0.681, "step": 1589 }, { "epoch": 0.03, "learning_rate": 4.9968573224387185e-06, "loss": 0.9024, "step": 1590 }, { "epoch": 0.03, "learning_rate": 5e-06, "loss": 0.9939, "step": 1591 }, { "epoch": 0.03, "learning_rate": 4.999999995332539e-06, "loss": 1.1035, "step": 1592 }, { "epoch": 0.03, "learning_rate": 4.999999981330153e-06, "loss": 1.2289, "step": 1593 }, { "epoch": 0.03, "learning_rate": 4.999999957992846e-06, "loss": 1.0718, "step": 1594 }, { "epoch": 0.03, "learning_rate": 4.999999925320614e-06, "loss": 0.9224, "step": 1595 }, { "epoch": 0.03, "learning_rate": 4.999999883313459e-06, "loss": 1.1184, "step": 1596 }, { "epoch": 0.03, "learning_rate": 4.999999831971382e-06, "loss": 1.0529, "step": 1597 }, { "epoch": 0.03, "learning_rate": 4.999999771294382e-06, "loss": 0.8725, "step": 1598 }, { "epoch": 0.03, "learning_rate": 4.999999701282459e-06, "loss": 0.9771, "step": 1599 }, { "epoch": 0.03, "learning_rate": 4.999999621935614e-06, "loss": 1.1838, "step": 1600 }, { "epoch": 0.03, "learning_rate": 4.999999533253848e-06, "loss": 1.084, "step": 1601 }, { "epoch": 0.03, "learning_rate": 4.999999435237159e-06, "loss": 0.9578, "step": 1602 }, { "epoch": 0.03, "learning_rate": 4.999999327885549e-06, "loss": 0.9954, "step": 1603 }, { "epoch": 0.03, "learning_rate": 4.999999211199019e-06, "loss": 0.8792, "step": 1604 }, { "epoch": 0.03, "learning_rate": 4.999999085177568e-06, "loss": 1.1431, "step": 1605 }, { "epoch": 0.03, "learning_rate": 4.999998949821197e-06, "loss": 1.3456, "step": 1606 }, { "epoch": 0.03, "learning_rate": 4.999998805129906e-06, "loss": 1.0781, "step": 1607 }, { "epoch": 0.03, "learning_rate": 4.999998651103697e-06, "loss": 0.8344, "step": 1608 }, { "epoch": 0.03, "learning_rate": 4.99999848774257e-06, "loss": 1.0341, "step": 1609 }, { "epoch": 0.03, "learning_rate": 4.9999983150465245e-06, "loss": 0.9046, "step": 1610 }, { "epoch": 0.03, "learning_rate": 4.999998133015562e-06, "loss": 1.1248, "step": 1611 }, { "epoch": 0.03, "learning_rate": 4.999997941649683e-06, "loss": 1.1213, "step": 1612 }, { "epoch": 0.03, "learning_rate": 4.99999774094889e-06, "loss": 1.1373, "step": 1613 }, { "epoch": 0.03, "learning_rate": 4.99999753091318e-06, "loss": 1.1271, "step": 1614 }, { "epoch": 0.03, "learning_rate": 4.999997311542557e-06, "loss": 0.9613, "step": 1615 }, { "epoch": 0.03, "learning_rate": 4.99999708283702e-06, "loss": 0.9586, "step": 1616 }, { "epoch": 0.03, "learning_rate": 4.999996844796571e-06, "loss": 1.0369, "step": 1617 }, { "epoch": 0.03, "learning_rate": 4.999996597421211e-06, "loss": 1.1457, "step": 1618 }, { "epoch": 0.03, "learning_rate": 4.99999634071094e-06, "loss": 1.2128, "step": 1619 }, { "epoch": 0.03, "learning_rate": 4.999996074665758e-06, "loss": 0.9042, "step": 1620 }, { "epoch": 0.03, "learning_rate": 4.999995799285669e-06, "loss": 0.8655, "step": 1621 }, { "epoch": 0.03, "learning_rate": 4.9999955145706715e-06, "loss": 1.0455, "step": 1622 }, { "epoch": 0.03, "learning_rate": 4.999995220520767e-06, "loss": 1.1566, "step": 1623 }, { "epoch": 0.03, "learning_rate": 4.999994917135958e-06, "loss": 1.1622, "step": 1624 }, { "epoch": 0.03, "learning_rate": 4.999994604416244e-06, "loss": 1.0972, "step": 1625 }, { "epoch": 0.03, "learning_rate": 4.999994282361627e-06, "loss": 0.92, "step": 1626 }, { "epoch": 0.03, "learning_rate": 4.999993950972108e-06, "loss": 0.9213, "step": 1627 }, { "epoch": 0.03, "learning_rate": 4.999993610247688e-06, "loss": 0.8884, "step": 1628 }, { "epoch": 0.03, "learning_rate": 4.999993260188369e-06, "loss": 0.9815, "step": 1629 }, { "epoch": 0.03, "learning_rate": 4.9999929007941515e-06, "loss": 1.2551, "step": 1630 }, { "epoch": 0.03, "learning_rate": 4.999992532065038e-06, "loss": 1.1216, "step": 1631 }, { "epoch": 0.03, "learning_rate": 4.999992154001028e-06, "loss": 1.0925, "step": 1632 }, { "epoch": 0.03, "learning_rate": 4.999991766602124e-06, "loss": 0.9579, "step": 1633 }, { "epoch": 0.03, "learning_rate": 4.999991369868328e-06, "loss": 1.0662, "step": 1634 }, { "epoch": 0.03, "learning_rate": 4.9999909637996405e-06, "loss": 1.0462, "step": 1635 }, { "epoch": 0.03, "learning_rate": 4.999990548396063e-06, "loss": 1.115, "step": 1636 }, { "epoch": 0.03, "learning_rate": 4.999990123657598e-06, "loss": 1.2252, "step": 1637 }, { "epoch": 0.03, "learning_rate": 4.999989689584246e-06, "loss": 1.1115, "step": 1638 }, { "epoch": 0.03, "learning_rate": 4.999989246176009e-06, "loss": 1.0482, "step": 1639 }, { "epoch": 0.03, "learning_rate": 4.99998879343289e-06, "loss": 0.9917, "step": 1640 }, { "epoch": 0.03, "learning_rate": 4.999988331354889e-06, "loss": 0.9507, "step": 1641 }, { "epoch": 0.03, "learning_rate": 4.999987859942008e-06, "loss": 0.9108, "step": 1642 }, { "epoch": 0.03, "learning_rate": 4.999987379194249e-06, "loss": 1.0851, "step": 1643 }, { "epoch": 0.03, "learning_rate": 4.999986889111613e-06, "loss": 1.1525, "step": 1644 }, { "epoch": 0.03, "learning_rate": 4.999986389694104e-06, "loss": 0.9325, "step": 1645 }, { "epoch": 0.03, "learning_rate": 4.999985880941721e-06, "loss": 1.0599, "step": 1646 }, { "epoch": 0.03, "learning_rate": 4.999985362854469e-06, "loss": 1.0426, "step": 1647 }, { "epoch": 0.03, "learning_rate": 4.999984835432347e-06, "loss": 0.9378, "step": 1648 }, { "epoch": 0.03, "learning_rate": 4.999984298675359e-06, "loss": 1.1078, "step": 1649 }, { "epoch": 0.03, "learning_rate": 4.999983752583506e-06, "loss": 1.3647, "step": 1650 }, { "epoch": 0.03, "learning_rate": 4.99998319715679e-06, "loss": 0.9031, "step": 1651 }, { "epoch": 0.03, "learning_rate": 4.999982632395215e-06, "loss": 0.8463, "step": 1652 }, { "epoch": 0.03, "learning_rate": 4.999982058298779e-06, "loss": 1.1206, "step": 1653 }, { "epoch": 0.03, "learning_rate": 4.999981474867489e-06, "loss": 0.9165, "step": 1654 }, { "epoch": 0.03, "learning_rate": 4.9999808821013436e-06, "loss": 0.9688, "step": 1655 }, { "epoch": 0.03, "learning_rate": 4.9999802800003465e-06, "loss": 1.1884, "step": 1656 }, { "epoch": 0.03, "learning_rate": 4.9999796685645e-06, "loss": 0.9324, "step": 1657 }, { "epoch": 0.03, "learning_rate": 4.999979047793805e-06, "loss": 0.953, "step": 1658 }, { "epoch": 0.03, "learning_rate": 4.9999784176882655e-06, "loss": 1.027, "step": 1659 }, { "epoch": 0.03, "learning_rate": 4.999977778247883e-06, "loss": 1.2924, "step": 1660 }, { "epoch": 0.03, "learning_rate": 4.99997712947266e-06, "loss": 1.0975, "step": 1661 }, { "epoch": 0.03, "learning_rate": 4.9999764713626e-06, "loss": 1.0325, "step": 1662 }, { "epoch": 0.03, "learning_rate": 4.9999758039177034e-06, "loss": 1.0893, "step": 1663 }, { "epoch": 0.03, "learning_rate": 4.9999751271379745e-06, "loss": 0.9348, "step": 1664 }, { "epoch": 0.03, "learning_rate": 4.999974441023415e-06, "loss": 1.137, "step": 1665 }, { "epoch": 0.03, "learning_rate": 4.999973745574029e-06, "loss": 0.8333, "step": 1666 }, { "epoch": 0.03, "learning_rate": 4.999973040789815e-06, "loss": 1.0095, "step": 1667 }, { "epoch": 0.03, "learning_rate": 4.99997232667078e-06, "loss": 1.1686, "step": 1668 }, { "epoch": 0.03, "learning_rate": 4.999971603216924e-06, "loss": 1.1801, "step": 1669 }, { "epoch": 0.03, "learning_rate": 4.999970870428252e-06, "loss": 0.9084, "step": 1670 }, { "epoch": 0.03, "learning_rate": 4.999970128304764e-06, "loss": 1.0507, "step": 1671 }, { "epoch": 0.03, "learning_rate": 4.999969376846465e-06, "loss": 1.0039, "step": 1672 }, { "epoch": 0.03, "learning_rate": 4.999968616053357e-06, "loss": 1.0148, "step": 1673 }, { "epoch": 0.03, "learning_rate": 4.999967845925443e-06, "loss": 1.0669, "step": 1674 }, { "epoch": 0.03, "learning_rate": 4.999967066462725e-06, "loss": 0.9344, "step": 1675 }, { "epoch": 0.03, "learning_rate": 4.999966277665207e-06, "loss": 0.9953, "step": 1676 }, { "epoch": 0.03, "learning_rate": 4.999965479532892e-06, "loss": 0.8823, "step": 1677 }, { "epoch": 0.03, "learning_rate": 4.9999646720657824e-06, "loss": 0.9462, "step": 1678 }, { "epoch": 0.03, "learning_rate": 4.999963855263881e-06, "loss": 0.8339, "step": 1679 }, { "epoch": 0.03, "learning_rate": 4.999963029127191e-06, "loss": 0.9733, "step": 1680 }, { "epoch": 0.03, "learning_rate": 4.999962193655716e-06, "loss": 1.2757, "step": 1681 }, { "epoch": 0.03, "learning_rate": 4.999961348849459e-06, "loss": 1.0832, "step": 1682 }, { "epoch": 0.03, "learning_rate": 4.999960494708423e-06, "loss": 0.9738, "step": 1683 }, { "epoch": 0.03, "learning_rate": 4.999959631232611e-06, "loss": 1.0134, "step": 1684 }, { "epoch": 0.03, "learning_rate": 4.999958758422027e-06, "loss": 1.0795, "step": 1685 }, { "epoch": 0.03, "learning_rate": 4.999957876276672e-06, "loss": 1.0237, "step": 1686 }, { "epoch": 0.03, "learning_rate": 4.9999569847965525e-06, "loss": 1.1865, "step": 1687 }, { "epoch": 0.03, "learning_rate": 4.999956083981669e-06, "loss": 1.0945, "step": 1688 }, { "epoch": 0.03, "learning_rate": 4.999955173832027e-06, "loss": 0.799, "step": 1689 }, { "epoch": 0.03, "learning_rate": 4.999954254347629e-06, "loss": 0.9192, "step": 1690 }, { "epoch": 0.03, "learning_rate": 4.999953325528479e-06, "loss": 0.9908, "step": 1691 }, { "epoch": 0.03, "learning_rate": 4.999952387374579e-06, "loss": 0.9173, "step": 1692 }, { "epoch": 0.03, "learning_rate": 4.999951439885934e-06, "loss": 1.0961, "step": 1693 }, { "epoch": 0.03, "learning_rate": 4.999950483062547e-06, "loss": 1.2491, "step": 1694 }, { "epoch": 0.03, "learning_rate": 4.999949516904421e-06, "loss": 1.0078, "step": 1695 }, { "epoch": 0.03, "learning_rate": 4.99994854141156e-06, "loss": 0.9654, "step": 1696 }, { "epoch": 0.03, "learning_rate": 4.9999475565839686e-06, "loss": 1.0412, "step": 1697 }, { "epoch": 0.03, "learning_rate": 4.999946562421649e-06, "loss": 1.0081, "step": 1698 }, { "epoch": 0.03, "learning_rate": 4.9999455589246056e-06, "loss": 1.0997, "step": 1699 }, { "epoch": 0.03, "learning_rate": 4.999944546092842e-06, "loss": 1.1071, "step": 1700 }, { "epoch": 0.03, "learning_rate": 4.9999435239263624e-06, "loss": 0.8339, "step": 1701 }, { "epoch": 0.03, "learning_rate": 4.999942492425171e-06, "loss": 0.958, "step": 1702 }, { "epoch": 0.03, "learning_rate": 4.9999414515892705e-06, "loss": 0.9933, "step": 1703 }, { "epoch": 0.03, "learning_rate": 4.999940401418665e-06, "loss": 1.0509, "step": 1704 }, { "epoch": 0.03, "learning_rate": 4.999939341913359e-06, "loss": 1.0332, "step": 1705 }, { "epoch": 0.03, "learning_rate": 4.999938273073356e-06, "loss": 0.9817, "step": 1706 }, { "epoch": 0.03, "learning_rate": 4.999937194898661e-06, "loss": 0.8988, "step": 1707 }, { "epoch": 0.03, "learning_rate": 4.999936107389276e-06, "loss": 1.0566, "step": 1708 }, { "epoch": 0.03, "learning_rate": 4.999935010545206e-06, "loss": 1.159, "step": 1709 }, { "epoch": 0.03, "learning_rate": 4.9999339043664565e-06, "loss": 0.8004, "step": 1710 }, { "epoch": 0.03, "learning_rate": 4.999932788853029e-06, "loss": 1.2232, "step": 1711 }, { "epoch": 0.03, "learning_rate": 4.9999316640049304e-06, "loss": 1.1609, "step": 1712 }, { "epoch": 0.03, "learning_rate": 4.9999305298221635e-06, "loss": 1.2143, "step": 1713 }, { "epoch": 0.03, "learning_rate": 4.999929386304732e-06, "loss": 1.0246, "step": 1714 }, { "epoch": 0.03, "learning_rate": 4.999928233452641e-06, "loss": 0.9345, "step": 1715 }, { "epoch": 0.03, "learning_rate": 4.9999270712658945e-06, "loss": 0.9492, "step": 1716 }, { "epoch": 0.03, "learning_rate": 4.999925899744497e-06, "loss": 0.9512, "step": 1717 }, { "epoch": 0.03, "learning_rate": 4.999924718888454e-06, "loss": 1.327, "step": 1718 }, { "epoch": 0.03, "learning_rate": 4.999923528697768e-06, "loss": 1.0217, "step": 1719 }, { "epoch": 0.03, "learning_rate": 4.999922329172443e-06, "loss": 0.8664, "step": 1720 }, { "epoch": 0.03, "learning_rate": 4.999921120312486e-06, "loss": 0.9211, "step": 1721 }, { "epoch": 0.03, "learning_rate": 4.9999199021179e-06, "loss": 0.7712, "step": 1722 }, { "epoch": 0.03, "learning_rate": 4.9999186745886895e-06, "loss": 1.0143, "step": 1723 }, { "epoch": 0.03, "learning_rate": 4.999917437724859e-06, "loss": 0.9064, "step": 1724 }, { "epoch": 0.03, "learning_rate": 4.999916191526414e-06, "loss": 1.0682, "step": 1725 }, { "epoch": 0.03, "learning_rate": 4.9999149359933586e-06, "loss": 1.0838, "step": 1726 }, { "epoch": 0.03, "learning_rate": 4.999913671125698e-06, "loss": 0.925, "step": 1727 }, { "epoch": 0.03, "learning_rate": 4.999912396923435e-06, "loss": 0.8932, "step": 1728 }, { "epoch": 0.03, "learning_rate": 4.999911113386577e-06, "loss": 1.1853, "step": 1729 }, { "epoch": 0.03, "learning_rate": 4.999909820515127e-06, "loss": 1.1824, "step": 1730 }, { "epoch": 0.03, "learning_rate": 4.99990851830909e-06, "loss": 0.9745, "step": 1731 }, { "epoch": 0.03, "learning_rate": 4.999907206768472e-06, "loss": 1.1814, "step": 1732 }, { "epoch": 0.03, "learning_rate": 4.999905885893277e-06, "loss": 0.9621, "step": 1733 }, { "epoch": 0.03, "learning_rate": 4.99990455568351e-06, "loss": 0.9789, "step": 1734 }, { "epoch": 0.03, "learning_rate": 4.999903216139176e-06, "loss": 0.9067, "step": 1735 }, { "epoch": 0.03, "learning_rate": 4.999901867260279e-06, "loss": 0.948, "step": 1736 }, { "epoch": 0.03, "learning_rate": 4.999900509046827e-06, "loss": 1.3283, "step": 1737 }, { "epoch": 0.03, "learning_rate": 4.9998991414988214e-06, "loss": 0.9966, "step": 1738 }, { "epoch": 0.03, "learning_rate": 4.999897764616271e-06, "loss": 0.9908, "step": 1739 }, { "epoch": 0.03, "learning_rate": 4.999896378399177e-06, "loss": 1.052, "step": 1740 }, { "epoch": 0.03, "learning_rate": 4.999894982847547e-06, "loss": 0.8521, "step": 1741 }, { "epoch": 0.03, "learning_rate": 4.999893577961387e-06, "loss": 0.9622, "step": 1742 }, { "epoch": 0.03, "learning_rate": 4.9998921637407e-06, "loss": 1.077, "step": 1743 }, { "epoch": 0.03, "learning_rate": 4.999890740185493e-06, "loss": 1.2213, "step": 1744 }, { "epoch": 0.03, "learning_rate": 4.999889307295769e-06, "loss": 1.1053, "step": 1745 }, { "epoch": 0.03, "learning_rate": 4.999887865071537e-06, "loss": 1.1165, "step": 1746 }, { "epoch": 0.03, "learning_rate": 4.999886413512799e-06, "loss": 1.0569, "step": 1747 }, { "epoch": 0.03, "learning_rate": 4.999884952619563e-06, "loss": 0.911, "step": 1748 }, { "epoch": 0.03, "learning_rate": 4.999883482391832e-06, "loss": 1.192, "step": 1749 }, { "epoch": 0.03, "learning_rate": 4.999882002829613e-06, "loss": 1.1898, "step": 1750 }, { "epoch": 0.03, "learning_rate": 4.999880513932911e-06, "loss": 1.2797, "step": 1751 }, { "epoch": 0.03, "learning_rate": 4.999879015701733e-06, "loss": 0.7438, "step": 1752 }, { "epoch": 0.03, "learning_rate": 4.999877508136082e-06, "loss": 1.0152, "step": 1753 }, { "epoch": 0.03, "learning_rate": 4.9998759912359665e-06, "loss": 1.0884, "step": 1754 }, { "epoch": 0.03, "learning_rate": 4.999874465001389e-06, "loss": 0.9691, "step": 1755 }, { "epoch": 0.03, "learning_rate": 4.9998729294323575e-06, "loss": 1.4146, "step": 1756 }, { "epoch": 0.03, "learning_rate": 4.999871384528879e-06, "loss": 1.016, "step": 1757 }, { "epoch": 0.03, "learning_rate": 4.999869830290955e-06, "loss": 0.8448, "step": 1758 }, { "epoch": 0.03, "learning_rate": 4.999868266718594e-06, "loss": 0.9155, "step": 1759 }, { "epoch": 0.03, "learning_rate": 4.999866693811803e-06, "loss": 1.0929, "step": 1760 }, { "epoch": 0.03, "learning_rate": 4.999865111570585e-06, "loss": 1.2159, "step": 1761 }, { "epoch": 0.03, "learning_rate": 4.9998635199949474e-06, "loss": 1.0726, "step": 1762 }, { "epoch": 0.03, "learning_rate": 4.999861919084897e-06, "loss": 1.0197, "step": 1763 }, { "epoch": 0.03, "learning_rate": 4.9998603088404386e-06, "loss": 0.9963, "step": 1764 }, { "epoch": 0.03, "learning_rate": 4.999858689261577e-06, "loss": 0.8674, "step": 1765 }, { "epoch": 0.03, "learning_rate": 4.999857060348322e-06, "loss": 0.9738, "step": 1766 }, { "epoch": 0.03, "learning_rate": 4.9998554221006754e-06, "loss": 0.949, "step": 1767 }, { "epoch": 0.03, "learning_rate": 4.999853774518646e-06, "loss": 1.2358, "step": 1768 }, { "epoch": 0.03, "learning_rate": 4.99985211760224e-06, "loss": 1.1458, "step": 1769 }, { "epoch": 0.03, "learning_rate": 4.999850451351462e-06, "loss": 0.9387, "step": 1770 }, { "epoch": 0.03, "learning_rate": 4.99984877576632e-06, "loss": 1.1385, "step": 1771 }, { "epoch": 0.03, "learning_rate": 4.999847090846818e-06, "loss": 1.069, "step": 1772 }, { "epoch": 0.03, "learning_rate": 4.9998453965929645e-06, "loss": 0.773, "step": 1773 }, { "epoch": 0.03, "learning_rate": 4.9998436930047645e-06, "loss": 1.0866, "step": 1774 }, { "epoch": 0.03, "learning_rate": 4.999841980082225e-06, "loss": 1.2744, "step": 1775 }, { "epoch": 0.03, "learning_rate": 4.999840257825352e-06, "loss": 0.9791, "step": 1776 }, { "epoch": 0.03, "learning_rate": 4.999838526234152e-06, "loss": 0.8254, "step": 1777 }, { "epoch": 0.03, "learning_rate": 4.9998367853086324e-06, "loss": 0.7762, "step": 1778 }, { "epoch": 0.03, "learning_rate": 4.999835035048798e-06, "loss": 1.1093, "step": 1779 }, { "epoch": 0.03, "learning_rate": 4.9998332754546564e-06, "loss": 1.1101, "step": 1780 }, { "epoch": 0.03, "learning_rate": 4.999831506526215e-06, "loss": 1.1923, "step": 1781 }, { "epoch": 0.03, "learning_rate": 4.9998297282634775e-06, "loss": 1.0633, "step": 1782 }, { "epoch": 0.03, "learning_rate": 4.999827940666454e-06, "loss": 0.7479, "step": 1783 }, { "epoch": 0.03, "learning_rate": 4.999826143735149e-06, "loss": 1.0578, "step": 1784 }, { "epoch": 0.03, "learning_rate": 4.99982433746957e-06, "loss": 0.8752, "step": 1785 }, { "epoch": 0.03, "learning_rate": 4.999822521869724e-06, "loss": 0.9971, "step": 1786 }, { "epoch": 0.03, "learning_rate": 4.999820696935617e-06, "loss": 1.2626, "step": 1787 }, { "epoch": 0.03, "learning_rate": 4.999818862667255e-06, "loss": 1.1432, "step": 1788 }, { "epoch": 0.03, "learning_rate": 4.999817019064648e-06, "loss": 1.0125, "step": 1789 }, { "epoch": 0.03, "learning_rate": 4.9998151661278e-06, "loss": 0.9831, "step": 1790 }, { "epoch": 0.03, "learning_rate": 4.999813303856718e-06, "loss": 0.9397, "step": 1791 }, { "epoch": 0.03, "learning_rate": 4.999811432251411e-06, "loss": 0.8645, "step": 1792 }, { "epoch": 0.03, "learning_rate": 4.999809551311885e-06, "loss": 1.1019, "step": 1793 }, { "epoch": 0.03, "learning_rate": 4.999807661038145e-06, "loss": 1.1896, "step": 1794 }, { "epoch": 0.03, "learning_rate": 4.999805761430201e-06, "loss": 0.8092, "step": 1795 }, { "epoch": 0.03, "learning_rate": 4.9998038524880595e-06, "loss": 0.7824, "step": 1796 }, { "epoch": 0.03, "learning_rate": 4.999801934211726e-06, "loss": 0.82, "step": 1797 }, { "epoch": 0.03, "learning_rate": 4.999800006601209e-06, "loss": 0.8913, "step": 1798 }, { "epoch": 0.03, "learning_rate": 4.999798069656515e-06, "loss": 0.9724, "step": 1799 }, { "epoch": 0.03, "learning_rate": 4.999796123377653e-06, "loss": 1.1956, "step": 1800 }, { "epoch": 0.03, "learning_rate": 4.999794167764628e-06, "loss": 0.9939, "step": 1801 }, { "epoch": 0.03, "learning_rate": 4.999792202817448e-06, "loss": 0.8468, "step": 1802 }, { "epoch": 0.03, "learning_rate": 4.999790228536121e-06, "loss": 1.004, "step": 1803 }, { "epoch": 0.03, "learning_rate": 4.999788244920654e-06, "loss": 1.0403, "step": 1804 }, { "epoch": 0.03, "learning_rate": 4.999786251971054e-06, "loss": 1.0468, "step": 1805 }, { "epoch": 0.03, "learning_rate": 4.99978424968733e-06, "loss": 1.355, "step": 1806 }, { "epoch": 0.03, "learning_rate": 4.9997822380694865e-06, "loss": 0.799, "step": 1807 }, { "epoch": 0.03, "learning_rate": 4.999780217117534e-06, "loss": 1.0793, "step": 1808 }, { "epoch": 0.03, "learning_rate": 4.9997781868314774e-06, "loss": 0.9576, "step": 1809 }, { "epoch": 0.03, "learning_rate": 4.999776147211327e-06, "loss": 0.9472, "step": 1810 }, { "epoch": 0.03, "learning_rate": 4.999774098257089e-06, "loss": 0.9733, "step": 1811 }, { "epoch": 0.03, "learning_rate": 4.999772039968771e-06, "loss": 1.3118, "step": 1812 }, { "epoch": 0.03, "learning_rate": 4.9997699723463805e-06, "loss": 0.8775, "step": 1813 }, { "epoch": 0.03, "learning_rate": 4.999767895389926e-06, "loss": 0.9072, "step": 1814 }, { "epoch": 0.03, "learning_rate": 4.999765809099414e-06, "loss": 0.9851, "step": 1815 }, { "epoch": 0.03, "learning_rate": 4.999763713474854e-06, "loss": 0.8884, "step": 1816 }, { "epoch": 0.03, "learning_rate": 4.999761608516253e-06, "loss": 0.9473, "step": 1817 }, { "epoch": 0.03, "learning_rate": 4.999759494223618e-06, "loss": 1.101, "step": 1818 }, { "epoch": 0.03, "learning_rate": 4.9997573705969585e-06, "loss": 1.1447, "step": 1819 }, { "epoch": 0.03, "learning_rate": 4.999755237636281e-06, "loss": 0.9385, "step": 1820 }, { "epoch": 0.03, "learning_rate": 4.999753095341594e-06, "loss": 1.0262, "step": 1821 }, { "epoch": 0.03, "learning_rate": 4.9997509437129065e-06, "loss": 0.8976, "step": 1822 }, { "epoch": 0.03, "learning_rate": 4.999748782750225e-06, "loss": 0.9599, "step": 1823 }, { "epoch": 0.03, "learning_rate": 4.999746612453558e-06, "loss": 0.9937, "step": 1824 }, { "epoch": 0.03, "learning_rate": 4.999744432822914e-06, "loss": 1.1072, "step": 1825 }, { "epoch": 0.03, "learning_rate": 4.999742243858301e-06, "loss": 0.865, "step": 1826 }, { "epoch": 0.03, "learning_rate": 4.999740045559727e-06, "loss": 1.0281, "step": 1827 }, { "epoch": 0.03, "learning_rate": 4.999737837927201e-06, "loss": 0.8832, "step": 1828 }, { "epoch": 0.03, "learning_rate": 4.999735620960729e-06, "loss": 0.853, "step": 1829 }, { "epoch": 0.03, "learning_rate": 4.999733394660322e-06, "loss": 1.1737, "step": 1830 }, { "epoch": 0.03, "learning_rate": 4.999731159025988e-06, "loss": 1.239, "step": 1831 }, { "epoch": 0.03, "learning_rate": 4.999728914057733e-06, "loss": 1.1696, "step": 1832 }, { "epoch": 0.03, "learning_rate": 4.999726659755567e-06, "loss": 1.0068, "step": 1833 }, { "epoch": 0.03, "learning_rate": 4.999724396119498e-06, "loss": 0.8796, "step": 1834 }, { "epoch": 0.03, "learning_rate": 4.9997221231495365e-06, "loss": 0.8439, "step": 1835 }, { "epoch": 0.03, "learning_rate": 4.999719840845688e-06, "loss": 1.0507, "step": 1836 }, { "epoch": 0.03, "learning_rate": 4.999717549207962e-06, "loss": 1.0632, "step": 1837 }, { "epoch": 0.03, "learning_rate": 4.999715248236368e-06, "loss": 1.0062, "step": 1838 }, { "epoch": 0.03, "learning_rate": 4.999712937930913e-06, "loss": 0.9303, "step": 1839 }, { "epoch": 0.03, "learning_rate": 4.999710618291608e-06, "loss": 0.8994, "step": 1840 }, { "epoch": 0.03, "learning_rate": 4.999708289318459e-06, "loss": 0.9216, "step": 1841 }, { "epoch": 0.03, "learning_rate": 4.999705951011476e-06, "loss": 1.0643, "step": 1842 }, { "epoch": 0.03, "learning_rate": 4.999703603370668e-06, "loss": 1.0656, "step": 1843 }, { "epoch": 0.03, "learning_rate": 4.999701246396042e-06, "loss": 1.1543, "step": 1844 }, { "epoch": 0.03, "learning_rate": 4.99969888008761e-06, "loss": 1.0995, "step": 1845 }, { "epoch": 0.03, "learning_rate": 4.999696504445379e-06, "loss": 1.1035, "step": 1846 }, { "epoch": 0.03, "learning_rate": 4.999694119469357e-06, "loss": 0.9337, "step": 1847 }, { "epoch": 0.03, "learning_rate": 4.999691725159555e-06, "loss": 1.0884, "step": 1848 }, { "epoch": 0.03, "learning_rate": 4.999689321515979e-06, "loss": 1.0796, "step": 1849 }, { "epoch": 0.03, "learning_rate": 4.99968690853864e-06, "loss": 1.1296, "step": 1850 }, { "epoch": 0.03, "learning_rate": 4.999684486227548e-06, "loss": 0.8917, "step": 1851 }, { "epoch": 0.03, "learning_rate": 4.99968205458271e-06, "loss": 1.04, "step": 1852 }, { "epoch": 0.03, "learning_rate": 4.999679613604136e-06, "loss": 0.7884, "step": 1853 }, { "epoch": 0.03, "learning_rate": 4.999677163291835e-06, "loss": 0.9825, "step": 1854 }, { "epoch": 0.03, "learning_rate": 4.999674703645816e-06, "loss": 1.171, "step": 1855 }, { "epoch": 0.04, "learning_rate": 4.999672234666088e-06, "loss": 1.1411, "step": 1856 }, { "epoch": 0.04, "learning_rate": 4.999669756352661e-06, "loss": 0.8875, "step": 1857 }, { "epoch": 0.04, "learning_rate": 4.999667268705544e-06, "loss": 1.0266, "step": 1858 }, { "epoch": 0.04, "learning_rate": 4.999664771724745e-06, "loss": 1.0344, "step": 1859 }, { "epoch": 0.04, "learning_rate": 4.999662265410275e-06, "loss": 0.9412, "step": 1860 }, { "epoch": 0.04, "learning_rate": 4.999659749762143e-06, "loss": 1.0066, "step": 1861 }, { "epoch": 0.04, "learning_rate": 4.9996572247803575e-06, "loss": 1.0432, "step": 1862 }, { "epoch": 0.04, "learning_rate": 4.999654690464929e-06, "loss": 1.0287, "step": 1863 }, { "epoch": 0.04, "learning_rate": 4.999652146815867e-06, "loss": 1.006, "step": 1864 }, { "epoch": 0.04, "learning_rate": 4.99964959383318e-06, "loss": 0.9397, "step": 1865 }, { "epoch": 0.04, "learning_rate": 4.999647031516878e-06, "loss": 1.0097, "step": 1866 }, { "epoch": 0.04, "learning_rate": 4.99964445986697e-06, "loss": 1.061, "step": 1867 }, { "epoch": 0.04, "learning_rate": 4.999641878883467e-06, "loss": 0.8653, "step": 1868 }, { "epoch": 0.04, "learning_rate": 4.999639288566378e-06, "loss": 0.8571, "step": 1869 }, { "epoch": 0.04, "learning_rate": 4.9996366889157126e-06, "loss": 1.0322, "step": 1870 }, { "epoch": 0.04, "learning_rate": 4.9996340799314805e-06, "loss": 0.9828, "step": 1871 }, { "epoch": 0.04, "learning_rate": 4.999631461613691e-06, "loss": 1.0566, "step": 1872 }, { "epoch": 0.04, "learning_rate": 4.999628833962354e-06, "loss": 0.9747, "step": 1873 }, { "epoch": 0.04, "learning_rate": 4.9996261969774795e-06, "loss": 0.9587, "step": 1874 }, { "epoch": 0.04, "learning_rate": 4.999623550659078e-06, "loss": 1.2123, "step": 1875 }, { "epoch": 0.04, "learning_rate": 4.999620895007159e-06, "loss": 0.9456, "step": 1876 }, { "epoch": 0.04, "learning_rate": 4.999618230021731e-06, "loss": 1.0312, "step": 1877 }, { "epoch": 0.04, "learning_rate": 4.999615555702806e-06, "loss": 0.9922, "step": 1878 }, { "epoch": 0.04, "learning_rate": 4.999612872050393e-06, "loss": 1.0322, "step": 1879 }, { "epoch": 0.04, "learning_rate": 4.9996101790645025e-06, "loss": 0.9974, "step": 1880 }, { "epoch": 0.04, "learning_rate": 4.999607476745144e-06, "loss": 1.3098, "step": 1881 }, { "epoch": 0.04, "learning_rate": 4.999604765092329e-06, "loss": 1.0722, "step": 1882 }, { "epoch": 0.04, "learning_rate": 4.999602044106064e-06, "loss": 0.8734, "step": 1883 }, { "epoch": 0.04, "learning_rate": 4.999599313786363e-06, "loss": 0.9609, "step": 1884 }, { "epoch": 0.04, "learning_rate": 4.999596574133235e-06, "loss": 0.9027, "step": 1885 }, { "epoch": 0.04, "learning_rate": 4.99959382514669e-06, "loss": 0.9023, "step": 1886 }, { "epoch": 0.04, "learning_rate": 4.999591066826738e-06, "loss": 1.013, "step": 1887 }, { "epoch": 0.04, "learning_rate": 4.999588299173391e-06, "loss": 0.9935, "step": 1888 }, { "epoch": 0.04, "learning_rate": 4.999585522186655e-06, "loss": 0.9223, "step": 1889 }, { "epoch": 0.04, "learning_rate": 4.999582735866545e-06, "loss": 0.9785, "step": 1890 }, { "epoch": 0.04, "learning_rate": 4.9995799402130695e-06, "loss": 0.879, "step": 1891 }, { "epoch": 0.04, "learning_rate": 4.999577135226239e-06, "loss": 0.8885, "step": 1892 }, { "epoch": 0.04, "learning_rate": 4.999574320906065e-06, "loss": 1.0565, "step": 1893 }, { "epoch": 0.04, "learning_rate": 4.999571497252556e-06, "loss": 1.1261, "step": 1894 }, { "epoch": 0.04, "learning_rate": 4.999568664265725e-06, "loss": 0.8137, "step": 1895 }, { "epoch": 0.04, "learning_rate": 4.99956582194558e-06, "loss": 0.8983, "step": 1896 }, { "epoch": 0.04, "learning_rate": 4.999562970292134e-06, "loss": 1.0596, "step": 1897 }, { "epoch": 0.04, "learning_rate": 4.999560109305395e-06, "loss": 0.7692, "step": 1898 }, { "epoch": 0.04, "learning_rate": 4.999557238985376e-06, "loss": 0.9682, "step": 1899 }, { "epoch": 0.04, "learning_rate": 4.999554359332087e-06, "loss": 1.1212, "step": 1900 }, { "epoch": 0.04, "learning_rate": 4.9995514703455385e-06, "loss": 0.7949, "step": 1901 }, { "epoch": 0.04, "learning_rate": 4.999548572025741e-06, "loss": 1.121, "step": 1902 }, { "epoch": 0.04, "learning_rate": 4.999545664372706e-06, "loss": 0.9943, "step": 1903 }, { "epoch": 0.04, "learning_rate": 4.999542747386445e-06, "loss": 1.0279, "step": 1904 }, { "epoch": 0.04, "learning_rate": 4.999539821066967e-06, "loss": 1.0022, "step": 1905 }, { "epoch": 0.04, "learning_rate": 4.999536885414285e-06, "loss": 0.9752, "step": 1906 }, { "epoch": 0.04, "learning_rate": 4.999533940428407e-06, "loss": 1.0695, "step": 1907 }, { "epoch": 0.04, "learning_rate": 4.999530986109347e-06, "loss": 1.0342, "step": 1908 }, { "epoch": 0.04, "learning_rate": 4.999528022457116e-06, "loss": 0.8014, "step": 1909 }, { "epoch": 0.04, "learning_rate": 4.999525049471723e-06, "loss": 0.8597, "step": 1910 }, { "epoch": 0.04, "learning_rate": 4.99952206715318e-06, "loss": 0.9138, "step": 1911 }, { "epoch": 0.04, "learning_rate": 4.9995190755014986e-06, "loss": 1.014, "step": 1912 }, { "epoch": 0.04, "learning_rate": 4.999516074516689e-06, "loss": 1.1207, "step": 1913 }, { "epoch": 0.04, "learning_rate": 4.999513064198764e-06, "loss": 0.8625, "step": 1914 }, { "epoch": 0.04, "learning_rate": 4.999510044547733e-06, "loss": 1.0737, "step": 1915 }, { "epoch": 0.04, "learning_rate": 4.999507015563608e-06, "loss": 0.9028, "step": 1916 }, { "epoch": 0.04, "learning_rate": 4.9995039772464015e-06, "loss": 0.8961, "step": 1917 }, { "epoch": 0.04, "learning_rate": 4.999500929596123e-06, "loss": 1.1121, "step": 1918 }, { "epoch": 0.04, "learning_rate": 4.999497872612785e-06, "loss": 1.1133, "step": 1919 }, { "epoch": 0.04, "learning_rate": 4.999494806296398e-06, "loss": 0.9767, "step": 1920 }, { "epoch": 0.04, "learning_rate": 4.999491730646974e-06, "loss": 1.0815, "step": 1921 }, { "epoch": 0.04, "learning_rate": 4.999488645664526e-06, "loss": 1.0143, "step": 1922 }, { "epoch": 0.04, "learning_rate": 4.999485551349062e-06, "loss": 0.9296, "step": 1923 }, { "epoch": 0.04, "learning_rate": 4.999482447700597e-06, "loss": 1.031, "step": 1924 }, { "epoch": 0.04, "learning_rate": 4.99947933471914e-06, "loss": 1.0756, "step": 1925 }, { "epoch": 0.04, "learning_rate": 4.999476212404705e-06, "loss": 0.9343, "step": 1926 }, { "epoch": 0.04, "learning_rate": 4.9994730807573024e-06, "loss": 0.9678, "step": 1927 }, { "epoch": 0.04, "learning_rate": 4.999469939776944e-06, "loss": 0.9608, "step": 1928 }, { "epoch": 0.04, "learning_rate": 4.99946678946364e-06, "loss": 0.92, "step": 1929 }, { "epoch": 0.04, "learning_rate": 4.999463629817405e-06, "loss": 1.1167, "step": 1930 }, { "epoch": 0.04, "learning_rate": 4.9994604608382495e-06, "loss": 1.2597, "step": 1931 }, { "epoch": 0.04, "learning_rate": 4.9994572825261845e-06, "loss": 0.8833, "step": 1932 }, { "epoch": 0.04, "learning_rate": 4.999454094881223e-06, "loss": 0.9628, "step": 1933 }, { "epoch": 0.04, "learning_rate": 4.999450897903377e-06, "loss": 0.9174, "step": 1934 }, { "epoch": 0.04, "learning_rate": 4.999447691592657e-06, "loss": 0.9384, "step": 1935 }, { "epoch": 0.04, "learning_rate": 4.999444475949077e-06, "loss": 1.0092, "step": 1936 }, { "epoch": 0.04, "learning_rate": 4.999441250972647e-06, "loss": 0.9731, "step": 1937 }, { "epoch": 0.04, "learning_rate": 4.999438016663381e-06, "loss": 0.8572, "step": 1938 }, { "epoch": 0.04, "learning_rate": 4.999434773021289e-06, "loss": 0.8946, "step": 1939 }, { "epoch": 0.04, "learning_rate": 4.999431520046385e-06, "loss": 0.8142, "step": 1940 }, { "epoch": 0.04, "learning_rate": 4.99942825773868e-06, "loss": 1.0073, "step": 1941 }, { "epoch": 0.04, "learning_rate": 4.999424986098187e-06, "loss": 0.9194, "step": 1942 }, { "epoch": 0.04, "learning_rate": 4.999421705124917e-06, "loss": 1.2682, "step": 1943 }, { "epoch": 0.04, "learning_rate": 4.9994184148188835e-06, "loss": 1.2228, "step": 1944 }, { "epoch": 0.04, "learning_rate": 4.999415115180098e-06, "loss": 0.9803, "step": 1945 }, { "epoch": 0.04, "learning_rate": 4.999411806208573e-06, "loss": 1.0167, "step": 1946 }, { "epoch": 0.04, "learning_rate": 4.999408487904321e-06, "loss": 0.9204, "step": 1947 }, { "epoch": 0.04, "learning_rate": 4.999405160267355e-06, "loss": 0.9773, "step": 1948 }, { "epoch": 0.04, "learning_rate": 4.999401823297686e-06, "loss": 1.0959, "step": 1949 }, { "epoch": 0.04, "learning_rate": 4.999398476995327e-06, "loss": 1.0934, "step": 1950 }, { "epoch": 0.04, "learning_rate": 4.999395121360292e-06, "loss": 0.9653, "step": 1951 }, { "epoch": 0.04, "learning_rate": 4.9993917563925906e-06, "loss": 0.9504, "step": 1952 }, { "epoch": 0.04, "learning_rate": 4.999388382092238e-06, "loss": 1.0279, "step": 1953 }, { "epoch": 0.04, "learning_rate": 4.999384998459246e-06, "loss": 1.0342, "step": 1954 }, { "epoch": 0.04, "learning_rate": 4.999381605493627e-06, "loss": 1.0391, "step": 1955 }, { "epoch": 0.04, "learning_rate": 4.999378203195393e-06, "loss": 1.1188, "step": 1956 }, { "epoch": 0.04, "learning_rate": 4.999374791564558e-06, "loss": 1.0175, "step": 1957 }, { "epoch": 0.04, "learning_rate": 4.999371370601133e-06, "loss": 0.9691, "step": 1958 }, { "epoch": 0.04, "learning_rate": 4.999367940305134e-06, "loss": 1.1392, "step": 1959 }, { "epoch": 0.04, "learning_rate": 4.9993645006765704e-06, "loss": 0.8798, "step": 1960 }, { "epoch": 0.04, "learning_rate": 4.999361051715457e-06, "loss": 0.8727, "step": 1961 }, { "epoch": 0.04, "learning_rate": 4.999357593421806e-06, "loss": 1.202, "step": 1962 }, { "epoch": 0.04, "learning_rate": 4.99935412579563e-06, "loss": 0.8295, "step": 1963 }, { "epoch": 0.04, "learning_rate": 4.999350648836943e-06, "loss": 0.849, "step": 1964 }, { "epoch": 0.04, "learning_rate": 4.9993471625457555e-06, "loss": 0.9734, "step": 1965 }, { "epoch": 0.04, "learning_rate": 4.999343666922084e-06, "loss": 0.9155, "step": 1966 }, { "epoch": 0.04, "learning_rate": 4.9993401619659395e-06, "loss": 1.0341, "step": 1967 }, { "epoch": 0.04, "learning_rate": 4.999336647677335e-06, "loss": 1.1567, "step": 1968 }, { "epoch": 0.04, "learning_rate": 4.9993331240562845e-06, "loss": 1.1866, "step": 1969 }, { "epoch": 0.04, "learning_rate": 4.999329591102802e-06, "loss": 0.7064, "step": 1970 }, { "epoch": 0.04, "learning_rate": 4.999326048816897e-06, "loss": 0.8455, "step": 1971 }, { "epoch": 0.04, "learning_rate": 4.999322497198586e-06, "loss": 0.9583, "step": 1972 }, { "epoch": 0.04, "learning_rate": 4.999318936247883e-06, "loss": 0.9456, "step": 1973 }, { "epoch": 0.04, "learning_rate": 4.999315365964799e-06, "loss": 0.9895, "step": 1974 }, { "epoch": 0.04, "learning_rate": 4.999311786349347e-06, "loss": 1.0821, "step": 1975 }, { "epoch": 0.04, "learning_rate": 4.999308197401542e-06, "loss": 1.1078, "step": 1976 }, { "epoch": 0.04, "learning_rate": 4.999304599121396e-06, "loss": 0.9527, "step": 1977 }, { "epoch": 0.04, "learning_rate": 4.999300991508925e-06, "loss": 1.062, "step": 1978 }, { "epoch": 0.04, "learning_rate": 4.999297374564139e-06, "loss": 0.9314, "step": 1979 }, { "epoch": 0.04, "learning_rate": 4.999293748287055e-06, "loss": 1.123, "step": 1980 }, { "epoch": 0.04, "learning_rate": 4.999290112677683e-06, "loss": 1.2587, "step": 1981 }, { "epoch": 0.04, "learning_rate": 4.99928646773604e-06, "loss": 1.0898, "step": 1982 }, { "epoch": 0.04, "learning_rate": 4.999282813462136e-06, "loss": 0.8279, "step": 1983 }, { "epoch": 0.04, "learning_rate": 4.999279149855988e-06, "loss": 0.9006, "step": 1984 }, { "epoch": 0.04, "learning_rate": 4.999275476917609e-06, "loss": 0.8201, "step": 1985 }, { "epoch": 0.04, "learning_rate": 4.99927179464701e-06, "loss": 0.993, "step": 1986 }, { "epoch": 0.04, "learning_rate": 4.999268103044208e-06, "loss": 1.0628, "step": 1987 }, { "epoch": 0.04, "learning_rate": 4.9992644021092156e-06, "loss": 1.0317, "step": 1988 }, { "epoch": 0.04, "learning_rate": 4.999260691842046e-06, "loss": 0.8529, "step": 1989 }, { "epoch": 0.04, "learning_rate": 4.999256972242714e-06, "loss": 0.8425, "step": 1990 }, { "epoch": 0.04, "learning_rate": 4.9992532433112326e-06, "loss": 1.0824, "step": 1991 }, { "epoch": 0.04, "learning_rate": 4.999249505047617e-06, "loss": 1.0649, "step": 1992 }, { "epoch": 0.04, "learning_rate": 4.99924575745188e-06, "loss": 1.3013, "step": 1993 }, { "epoch": 0.04, "learning_rate": 4.999242000524036e-06, "loss": 0.8559, "step": 1994 }, { "epoch": 0.04, "learning_rate": 4.999238234264098e-06, "loss": 0.8567, "step": 1995 }, { "epoch": 0.04, "learning_rate": 4.999234458672082e-06, "loss": 0.8454, "step": 1996 }, { "epoch": 0.04, "learning_rate": 4.999230673748001e-06, "loss": 1.0924, "step": 1997 }, { "epoch": 0.04, "learning_rate": 4.99922687949187e-06, "loss": 1.0488, "step": 1998 }, { "epoch": 0.04, "learning_rate": 4.999223075903702e-06, "loss": 1.066, "step": 1999 }, { "epoch": 0.04, "learning_rate": 4.999219262983511e-06, "loss": 1.0874, "step": 2000 }, { "epoch": 0.04, "learning_rate": 4.999215440731313e-06, "loss": 0.9946, "step": 2001 }, { "epoch": 0.04, "learning_rate": 4.99921160914712e-06, "loss": 1.0459, "step": 2002 }, { "epoch": 0.04, "learning_rate": 4.999207768230948e-06, "loss": 0.9843, "step": 2003 }, { "epoch": 0.04, "learning_rate": 4.9992039179828115e-06, "loss": 0.9846, "step": 2004 }, { "epoch": 0.04, "learning_rate": 4.999200058402723e-06, "loss": 0.952, "step": 2005 }, { "epoch": 0.04, "learning_rate": 4.9991961894907e-06, "loss": 1.0157, "step": 2006 }, { "epoch": 0.04, "learning_rate": 4.999192311246753e-06, "loss": 0.6832, "step": 2007 }, { "epoch": 0.04, "learning_rate": 4.999188423670899e-06, "loss": 0.8381, "step": 2008 }, { "epoch": 0.04, "learning_rate": 4.9991845267631525e-06, "loss": 0.8697, "step": 2009 }, { "epoch": 0.04, "learning_rate": 4.999180620523527e-06, "loss": 0.9619, "step": 2010 }, { "epoch": 0.04, "learning_rate": 4.999176704952039e-06, "loss": 1.1588, "step": 2011 }, { "epoch": 0.04, "learning_rate": 4.9991727800487004e-06, "loss": 0.9976, "step": 2012 }, { "epoch": 0.04, "learning_rate": 4.999168845813528e-06, "loss": 0.9909, "step": 2013 }, { "epoch": 0.04, "learning_rate": 4.999164902246535e-06, "loss": 0.8737, "step": 2014 }, { "epoch": 0.04, "learning_rate": 4.9991609493477376e-06, "loss": 1.0318, "step": 2015 }, { "epoch": 0.04, "learning_rate": 4.99915698711715e-06, "loss": 0.8815, "step": 2016 }, { "epoch": 0.04, "learning_rate": 4.999153015554786e-06, "loss": 0.887, "step": 2017 }, { "epoch": 0.04, "learning_rate": 4.999149034660663e-06, "loss": 1.1517, "step": 2018 }, { "epoch": 0.04, "learning_rate": 4.999145044434792e-06, "loss": 1.2054, "step": 2019 }, { "epoch": 0.04, "learning_rate": 4.999141044877192e-06, "loss": 1.1964, "step": 2020 }, { "epoch": 0.04, "learning_rate": 4.999137035987874e-06, "loss": 1.0398, "step": 2021 }, { "epoch": 0.04, "learning_rate": 4.999133017766856e-06, "loss": 1.2041, "step": 2022 }, { "epoch": 0.04, "learning_rate": 4.9991289902141516e-06, "loss": 1.0527, "step": 2023 }, { "epoch": 0.04, "learning_rate": 4.999124953329777e-06, "loss": 1.463, "step": 2024 }, { "epoch": 0.04, "learning_rate": 4.999120907113746e-06, "loss": 1.0904, "step": 2025 }, { "epoch": 0.04, "learning_rate": 4.999116851566073e-06, "loss": 1.1296, "step": 2026 }, { "epoch": 0.04, "learning_rate": 4.999112786686776e-06, "loss": 0.8461, "step": 2027 }, { "epoch": 0.04, "learning_rate": 4.999108712475868e-06, "loss": 0.8158, "step": 2028 }, { "epoch": 0.04, "learning_rate": 4.999104628933364e-06, "loss": 1.1053, "step": 2029 }, { "epoch": 0.04, "learning_rate": 4.99910053605928e-06, "loss": 1.0966, "step": 2030 }, { "epoch": 0.04, "learning_rate": 4.9990964338536315e-06, "loss": 1.2255, "step": 2031 }, { "epoch": 0.04, "learning_rate": 4.999092322316435e-06, "loss": 0.6582, "step": 2032 }, { "epoch": 0.04, "learning_rate": 4.999088201447702e-06, "loss": 0.927, "step": 2033 }, { "epoch": 0.04, "learning_rate": 4.999084071247452e-06, "loss": 0.8253, "step": 2034 }, { "epoch": 0.04, "learning_rate": 4.999079931715698e-06, "loss": 0.8519, "step": 2035 }, { "epoch": 0.04, "learning_rate": 4.999075782852456e-06, "loss": 0.9525, "step": 2036 }, { "epoch": 0.04, "learning_rate": 4.999071624657742e-06, "loss": 1.1376, "step": 2037 }, { "epoch": 0.04, "learning_rate": 4.999067457131571e-06, "loss": 1.1054, "step": 2038 }, { "epoch": 0.04, "learning_rate": 4.999063280273958e-06, "loss": 1.0667, "step": 2039 }, { "epoch": 0.04, "learning_rate": 4.99905909408492e-06, "loss": 1.0241, "step": 2040 }, { "epoch": 0.04, "learning_rate": 4.999054898564473e-06, "loss": 0.7993, "step": 2041 }, { "epoch": 0.04, "learning_rate": 4.999050693712631e-06, "loss": 0.7864, "step": 2042 }, { "epoch": 0.04, "learning_rate": 4.999046479529409e-06, "loss": 1.1709, "step": 2043 }, { "epoch": 0.04, "learning_rate": 4.9990422560148255e-06, "loss": 1.132, "step": 2044 }, { "epoch": 0.04, "learning_rate": 4.999038023168894e-06, "loss": 0.9973, "step": 2045 }, { "epoch": 0.04, "learning_rate": 4.999033780991632e-06, "loss": 0.8548, "step": 2046 }, { "epoch": 0.04, "learning_rate": 4.999029529483053e-06, "loss": 0.8892, "step": 2047 }, { "epoch": 0.04, "learning_rate": 4.999025268643176e-06, "loss": 0.9008, "step": 2048 }, { "epoch": 0.04, "learning_rate": 4.999020998472015e-06, "loss": 1.0322, "step": 2049 }, { "epoch": 0.04, "learning_rate": 4.999016718969586e-06, "loss": 1.3525, "step": 2050 }, { "epoch": 0.04, "learning_rate": 4.999012430135904e-06, "loss": 1.1969, "step": 2051 }, { "epoch": 0.04, "learning_rate": 4.9990081319709885e-06, "loss": 0.8668, "step": 2052 }, { "epoch": 0.04, "learning_rate": 4.999003824474852e-06, "loss": 0.9232, "step": 2053 }, { "epoch": 0.04, "learning_rate": 4.998999507647512e-06, "loss": 1.0925, "step": 2054 }, { "epoch": 0.04, "learning_rate": 4.998995181488984e-06, "loss": 0.9805, "step": 2055 }, { "epoch": 0.04, "learning_rate": 4.998990845999285e-06, "loss": 1.2201, "step": 2056 }, { "epoch": 0.04, "learning_rate": 4.998986501178431e-06, "loss": 0.9491, "step": 2057 }, { "epoch": 0.04, "learning_rate": 4.998982147026438e-06, "loss": 0.9646, "step": 2058 }, { "epoch": 0.04, "learning_rate": 4.998977783543322e-06, "loss": 0.9631, "step": 2059 }, { "epoch": 0.04, "learning_rate": 4.998973410729099e-06, "loss": 0.9766, "step": 2060 }, { "epoch": 0.04, "learning_rate": 4.998969028583787e-06, "loss": 0.8524, "step": 2061 }, { "epoch": 0.04, "learning_rate": 4.998964637107401e-06, "loss": 1.1208, "step": 2062 }, { "epoch": 0.04, "learning_rate": 4.9989602362999565e-06, "loss": 1.2088, "step": 2063 }, { "epoch": 0.04, "learning_rate": 4.998955826161472e-06, "loss": 1.0018, "step": 2064 }, { "epoch": 0.04, "learning_rate": 4.998951406691963e-06, "loss": 1.075, "step": 2065 }, { "epoch": 0.04, "learning_rate": 4.9989469778914464e-06, "loss": 0.8628, "step": 2066 }, { "epoch": 0.04, "learning_rate": 4.998942539759939e-06, "loss": 1.0894, "step": 2067 }, { "epoch": 0.04, "learning_rate": 4.998938092297455e-06, "loss": 1.1426, "step": 2068 }, { "epoch": 0.04, "learning_rate": 4.998933635504014e-06, "loss": 1.1041, "step": 2069 }, { "epoch": 0.04, "learning_rate": 4.998929169379632e-06, "loss": 1.0583, "step": 2070 }, { "epoch": 0.04, "learning_rate": 4.998924693924324e-06, "loss": 0.9639, "step": 2071 }, { "epoch": 0.04, "learning_rate": 4.998920209138108e-06, "loss": 0.988, "step": 2072 }, { "epoch": 0.04, "learning_rate": 4.998915715021001e-06, "loss": 0.962, "step": 2073 }, { "epoch": 0.04, "learning_rate": 4.9989112115730184e-06, "loss": 1.1686, "step": 2074 }, { "epoch": 0.04, "learning_rate": 4.998906698794179e-06, "loss": 1.1896, "step": 2075 }, { "epoch": 0.04, "learning_rate": 4.998902176684498e-06, "loss": 1.1357, "step": 2076 }, { "epoch": 0.04, "learning_rate": 4.998897645243993e-06, "loss": 0.9198, "step": 2077 }, { "epoch": 0.04, "learning_rate": 4.998893104472681e-06, "loss": 1.0633, "step": 2078 }, { "epoch": 0.04, "learning_rate": 4.998888554370579e-06, "loss": 0.7776, "step": 2079 }, { "epoch": 0.04, "learning_rate": 4.9988839949377035e-06, "loss": 1.2126, "step": 2080 }, { "epoch": 0.04, "learning_rate": 4.9988794261740714e-06, "loss": 1.2131, "step": 2081 }, { "epoch": 0.04, "learning_rate": 4.9988748480797e-06, "loss": 1.002, "step": 2082 }, { "epoch": 0.04, "learning_rate": 4.998870260654607e-06, "loss": 1.0456, "step": 2083 }, { "epoch": 0.04, "learning_rate": 4.998865663898809e-06, "loss": 0.8184, "step": 2084 }, { "epoch": 0.04, "learning_rate": 4.9988610578123234e-06, "loss": 0.8906, "step": 2085 }, { "epoch": 0.04, "learning_rate": 4.998856442395167e-06, "loss": 0.9429, "step": 2086 }, { "epoch": 0.04, "learning_rate": 4.998851817647357e-06, "loss": 1.1821, "step": 2087 }, { "epoch": 0.04, "learning_rate": 4.9988471835689114e-06, "loss": 1.1547, "step": 2088 }, { "epoch": 0.04, "learning_rate": 4.998842540159847e-06, "loss": 0.9703, "step": 2089 }, { "epoch": 0.04, "learning_rate": 4.998837887420181e-06, "loss": 0.9925, "step": 2090 }, { "epoch": 0.04, "learning_rate": 4.998833225349931e-06, "loss": 0.9257, "step": 2091 }, { "epoch": 0.04, "learning_rate": 4.998828553949114e-06, "loss": 0.9471, "step": 2092 }, { "epoch": 0.04, "learning_rate": 4.9988238732177484e-06, "loss": 1.0677, "step": 2093 }, { "epoch": 0.04, "learning_rate": 4.998819183155851e-06, "loss": 1.2003, "step": 2094 }, { "epoch": 0.04, "learning_rate": 4.998814483763439e-06, "loss": 1.1359, "step": 2095 }, { "epoch": 0.04, "learning_rate": 4.99880977504053e-06, "loss": 1.0016, "step": 2096 }, { "epoch": 0.04, "learning_rate": 4.998805056987143e-06, "loss": 0.8975, "step": 2097 }, { "epoch": 0.04, "learning_rate": 4.998800329603294e-06, "loss": 0.8696, "step": 2098 }, { "epoch": 0.04, "learning_rate": 4.998795592889001e-06, "loss": 1.1611, "step": 2099 }, { "epoch": 0.04, "learning_rate": 4.998790846844282e-06, "loss": 1.221, "step": 2100 }, { "epoch": 0.04, "learning_rate": 4.9987860914691546e-06, "loss": 1.0376, "step": 2101 }, { "epoch": 0.04, "learning_rate": 4.998781326763637e-06, "loss": 1.0151, "step": 2102 }, { "epoch": 0.04, "learning_rate": 4.998776552727746e-06, "loss": 0.8779, "step": 2103 }, { "epoch": 0.04, "learning_rate": 4.9987717693615e-06, "loss": 0.9189, "step": 2104 }, { "epoch": 0.04, "learning_rate": 4.9987669766649174e-06, "loss": 1.1122, "step": 2105 }, { "epoch": 0.04, "learning_rate": 4.9987621746380146e-06, "loss": 1.2969, "step": 2106 }, { "epoch": 0.04, "learning_rate": 4.998757363280811e-06, "loss": 1.1682, "step": 2107 }, { "epoch": 0.04, "learning_rate": 4.998752542593324e-06, "loss": 1.0642, "step": 2108 }, { "epoch": 0.04, "learning_rate": 4.998747712575571e-06, "loss": 1.024, "step": 2109 }, { "epoch": 0.04, "learning_rate": 4.998742873227572e-06, "loss": 1.1284, "step": 2110 }, { "epoch": 0.04, "learning_rate": 4.998738024549342e-06, "loss": 0.8748, "step": 2111 }, { "epoch": 0.04, "learning_rate": 4.998733166540902e-06, "loss": 1.1201, "step": 2112 }, { "epoch": 0.04, "learning_rate": 4.998728299202269e-06, "loss": 1.08, "step": 2113 }, { "epoch": 0.04, "learning_rate": 4.998723422533461e-06, "loss": 1.0632, "step": 2114 }, { "epoch": 0.04, "learning_rate": 4.998718536534496e-06, "loss": 0.9608, "step": 2115 }, { "epoch": 0.04, "learning_rate": 4.998713641205393e-06, "loss": 0.9368, "step": 2116 }, { "epoch": 0.04, "learning_rate": 4.99870873654617e-06, "loss": 0.9988, "step": 2117 }, { "epoch": 0.04, "learning_rate": 4.998703822556844e-06, "loss": 1.1865, "step": 2118 }, { "epoch": 0.04, "learning_rate": 4.998698899237436e-06, "loss": 1.0469, "step": 2119 }, { "epoch": 0.04, "learning_rate": 4.998693966587962e-06, "loss": 1.0194, "step": 2120 }, { "epoch": 0.04, "learning_rate": 4.998689024608442e-06, "loss": 0.9626, "step": 2121 }, { "epoch": 0.04, "learning_rate": 4.998684073298893e-06, "loss": 1.1569, "step": 2122 }, { "epoch": 0.04, "learning_rate": 4.998679112659334e-06, "loss": 0.9813, "step": 2123 }, { "epoch": 0.04, "learning_rate": 4.998674142689785e-06, "loss": 1.0717, "step": 2124 }, { "epoch": 0.04, "learning_rate": 4.998669163390264e-06, "loss": 1.231, "step": 2125 }, { "epoch": 0.04, "learning_rate": 4.998664174760787e-06, "loss": 0.9508, "step": 2126 }, { "epoch": 0.04, "learning_rate": 4.9986591768013756e-06, "loss": 0.9029, "step": 2127 }, { "epoch": 0.04, "learning_rate": 4.998654169512047e-06, "loss": 1.0065, "step": 2128 }, { "epoch": 0.04, "learning_rate": 4.998649152892821e-06, "loss": 1.0385, "step": 2129 }, { "epoch": 0.04, "learning_rate": 4.998644126943715e-06, "loss": 0.9986, "step": 2130 }, { "epoch": 0.04, "learning_rate": 4.998639091664748e-06, "loss": 1.2236, "step": 2131 }, { "epoch": 0.04, "learning_rate": 4.998634047055942e-06, "loss": 1.0293, "step": 2132 }, { "epoch": 0.04, "learning_rate": 4.99862899311731e-06, "loss": 0.8329, "step": 2133 }, { "epoch": 0.04, "learning_rate": 4.998623929848875e-06, "loss": 0.8767, "step": 2134 }, { "epoch": 0.04, "learning_rate": 4.998618857250655e-06, "loss": 0.71, "step": 2135 }, { "epoch": 0.04, "learning_rate": 4.998613775322669e-06, "loss": 1.1262, "step": 2136 }, { "epoch": 0.04, "learning_rate": 4.998608684064935e-06, "loss": 1.2296, "step": 2137 }, { "epoch": 0.04, "learning_rate": 4.998603583477473e-06, "loss": 0.9865, "step": 2138 }, { "epoch": 0.04, "learning_rate": 4.998598473560302e-06, "loss": 0.9999, "step": 2139 }, { "epoch": 0.04, "learning_rate": 4.998593354313441e-06, "loss": 0.9907, "step": 2140 }, { "epoch": 0.04, "learning_rate": 4.998588225736909e-06, "loss": 0.9344, "step": 2141 }, { "epoch": 0.04, "learning_rate": 4.998583087830725e-06, "loss": 0.9724, "step": 2142 }, { "epoch": 0.04, "learning_rate": 4.998577940594908e-06, "loss": 1.0714, "step": 2143 }, { "epoch": 0.04, "learning_rate": 4.998572784029479e-06, "loss": 1.0396, "step": 2144 }, { "epoch": 0.04, "learning_rate": 4.998567618134455e-06, "loss": 0.9932, "step": 2145 }, { "epoch": 0.04, "learning_rate": 4.998562442909856e-06, "loss": 1.0335, "step": 2146 }, { "epoch": 0.04, "learning_rate": 4.998557258355702e-06, "loss": 0.9903, "step": 2147 }, { "epoch": 0.04, "learning_rate": 4.998552064472011e-06, "loss": 1.0074, "step": 2148 }, { "epoch": 0.04, "learning_rate": 4.9985468612588034e-06, "loss": 1.1719, "step": 2149 }, { "epoch": 0.04, "learning_rate": 4.9985416487160986e-06, "loss": 1.1304, "step": 2150 }, { "epoch": 0.04, "learning_rate": 4.998536426843915e-06, "loss": 1.2034, "step": 2151 }, { "epoch": 0.04, "learning_rate": 4.998531195642274e-06, "loss": 0.8758, "step": 2152 }, { "epoch": 0.04, "learning_rate": 4.998525955111194e-06, "loss": 0.9897, "step": 2153 }, { "epoch": 0.04, "learning_rate": 4.998520705250695e-06, "loss": 0.8771, "step": 2154 }, { "epoch": 0.04, "learning_rate": 4.998515446060796e-06, "loss": 1.0876, "step": 2155 }, { "epoch": 0.04, "learning_rate": 4.998510177541517e-06, "loss": 1.1329, "step": 2156 }, { "epoch": 0.04, "learning_rate": 4.998504899692878e-06, "loss": 0.9847, "step": 2157 }, { "epoch": 0.04, "learning_rate": 4.9984996125148965e-06, "loss": 1.1088, "step": 2158 }, { "epoch": 0.04, "learning_rate": 4.998494316007596e-06, "loss": 1.0917, "step": 2159 }, { "epoch": 0.04, "learning_rate": 4.998489010170993e-06, "loss": 0.7842, "step": 2160 }, { "epoch": 0.04, "learning_rate": 4.99848369500511e-06, "loss": 1.0104, "step": 2161 }, { "epoch": 0.04, "learning_rate": 4.998478370509964e-06, "loss": 1.1251, "step": 2162 }, { "epoch": 0.04, "learning_rate": 4.998473036685577e-06, "loss": 0.9352, "step": 2163 }, { "epoch": 0.04, "learning_rate": 4.998467693531969e-06, "loss": 0.8951, "step": 2164 }, { "epoch": 0.04, "learning_rate": 4.9984623410491586e-06, "loss": 0.8206, "step": 2165 }, { "epoch": 0.04, "learning_rate": 4.998456979237166e-06, "loss": 1.0173, "step": 2166 }, { "epoch": 0.04, "learning_rate": 4.998451608096012e-06, "loss": 0.8498, "step": 2167 }, { "epoch": 0.04, "learning_rate": 4.998446227625717e-06, "loss": 1.1638, "step": 2168 }, { "epoch": 0.04, "learning_rate": 4.998440837826299e-06, "loss": 1.1557, "step": 2169 }, { "epoch": 0.04, "learning_rate": 4.998435438697781e-06, "loss": 0.9537, "step": 2170 }, { "epoch": 0.04, "learning_rate": 4.9984300302401814e-06, "loss": 0.9136, "step": 2171 }, { "epoch": 0.04, "learning_rate": 4.9984246124535194e-06, "loss": 0.7774, "step": 2172 }, { "epoch": 0.04, "learning_rate": 4.998419185337819e-06, "loss": 0.8906, "step": 2173 }, { "epoch": 0.04, "learning_rate": 4.998413748893095e-06, "loss": 1.0157, "step": 2174 }, { "epoch": 0.04, "learning_rate": 4.998408303119372e-06, "loss": 0.9025, "step": 2175 }, { "epoch": 0.04, "learning_rate": 4.998402848016669e-06, "loss": 1.0743, "step": 2176 }, { "epoch": 0.04, "learning_rate": 4.9983973835850065e-06, "loss": 0.7629, "step": 2177 }, { "epoch": 0.04, "learning_rate": 4.998391909824405e-06, "loss": 0.8894, "step": 2178 }, { "epoch": 0.04, "learning_rate": 4.998386426734884e-06, "loss": 1.0587, "step": 2179 }, { "epoch": 0.04, "learning_rate": 4.998380934316465e-06, "loss": 1.0593, "step": 2180 }, { "epoch": 0.04, "learning_rate": 4.998375432569168e-06, "loss": 1.2956, "step": 2181 }, { "epoch": 0.04, "learning_rate": 4.998369921493015e-06, "loss": 1.0036, "step": 2182 }, { "epoch": 0.04, "learning_rate": 4.998364401088024e-06, "loss": 0.9829, "step": 2183 }, { "epoch": 0.04, "learning_rate": 4.998358871354217e-06, "loss": 1.0258, "step": 2184 }, { "epoch": 0.04, "learning_rate": 4.998353332291615e-06, "loss": 1.0234, "step": 2185 }, { "epoch": 0.04, "learning_rate": 4.998347783900238e-06, "loss": 0.9797, "step": 2186 }, { "epoch": 0.04, "learning_rate": 4.998342226180107e-06, "loss": 1.1451, "step": 2187 }, { "epoch": 0.04, "learning_rate": 4.998336659131242e-06, "loss": 1.0255, "step": 2188 }, { "epoch": 0.04, "learning_rate": 4.998331082753666e-06, "loss": 1.1974, "step": 2189 }, { "epoch": 0.04, "learning_rate": 4.998325497047397e-06, "loss": 1.0674, "step": 2190 }, { "epoch": 0.04, "learning_rate": 4.998319902012459e-06, "loss": 1.0844, "step": 2191 }, { "epoch": 0.04, "learning_rate": 4.9983142976488685e-06, "loss": 1.1071, "step": 2192 }, { "epoch": 0.04, "learning_rate": 4.998308683956651e-06, "loss": 1.1158, "step": 2193 }, { "epoch": 0.04, "learning_rate": 4.998303060935825e-06, "loss": 1.11, "step": 2194 }, { "epoch": 0.04, "learning_rate": 4.9982974285864116e-06, "loss": 0.922, "step": 2195 }, { "epoch": 0.04, "learning_rate": 4.998291786908432e-06, "loss": 0.8952, "step": 2196 }, { "epoch": 0.04, "learning_rate": 4.998286135901908e-06, "loss": 1.0637, "step": 2197 }, { "epoch": 0.04, "learning_rate": 4.99828047556686e-06, "loss": 1.1713, "step": 2198 }, { "epoch": 0.04, "learning_rate": 4.99827480590331e-06, "loss": 0.9599, "step": 2199 }, { "epoch": 0.04, "learning_rate": 4.998269126911278e-06, "loss": 1.2402, "step": 2200 }, { "epoch": 0.04, "learning_rate": 4.998263438590785e-06, "loss": 0.9955, "step": 2201 }, { "epoch": 0.04, "learning_rate": 4.998257740941854e-06, "loss": 0.9059, "step": 2202 }, { "epoch": 0.04, "learning_rate": 4.998252033964504e-06, "loss": 1.0371, "step": 2203 }, { "epoch": 0.04, "learning_rate": 4.998246317658758e-06, "loss": 0.8522, "step": 2204 }, { "epoch": 0.04, "learning_rate": 4.998240592024637e-06, "loss": 0.9926, "step": 2205 }, { "epoch": 0.04, "learning_rate": 4.9982348570621625e-06, "loss": 1.3098, "step": 2206 }, { "epoch": 0.04, "learning_rate": 4.998229112771355e-06, "loss": 1.1143, "step": 2207 }, { "epoch": 0.04, "learning_rate": 4.998223359152238e-06, "loss": 0.7163, "step": 2208 }, { "epoch": 0.04, "learning_rate": 4.998217596204829e-06, "loss": 1.0797, "step": 2209 }, { "epoch": 0.04, "learning_rate": 4.9982118239291546e-06, "loss": 0.8448, "step": 2210 }, { "epoch": 0.04, "learning_rate": 4.998206042325232e-06, "loss": 0.9203, "step": 2211 }, { "epoch": 0.04, "learning_rate": 4.998200251393086e-06, "loss": 1.0715, "step": 2212 }, { "epoch": 0.04, "learning_rate": 4.998194451132736e-06, "loss": 1.0749, "step": 2213 }, { "epoch": 0.04, "learning_rate": 4.998188641544206e-06, "loss": 0.9267, "step": 2214 }, { "epoch": 0.04, "learning_rate": 4.998182822627514e-06, "loss": 1.02, "step": 2215 }, { "epoch": 0.04, "learning_rate": 4.998176994382685e-06, "loss": 0.9164, "step": 2216 }, { "epoch": 0.04, "learning_rate": 4.9981711568097405e-06, "loss": 0.9329, "step": 2217 }, { "epoch": 0.04, "learning_rate": 4.9981653099087004e-06, "loss": 1.1425, "step": 2218 }, { "epoch": 0.04, "learning_rate": 4.998159453679588e-06, "loss": 1.1467, "step": 2219 }, { "epoch": 0.04, "learning_rate": 4.998153588122425e-06, "loss": 0.9529, "step": 2220 }, { "epoch": 0.04, "learning_rate": 4.998147713237232e-06, "loss": 0.8869, "step": 2221 }, { "epoch": 0.04, "learning_rate": 4.998141829024033e-06, "loss": 1.1325, "step": 2222 }, { "epoch": 0.04, "learning_rate": 4.9981359354828495e-06, "loss": 1.0394, "step": 2223 }, { "epoch": 0.04, "learning_rate": 4.998130032613703e-06, "loss": 0.9517, "step": 2224 }, { "epoch": 0.04, "learning_rate": 4.998124120416614e-06, "loss": 1.2171, "step": 2225 }, { "epoch": 0.04, "learning_rate": 4.998118198891607e-06, "loss": 1.0488, "step": 2226 }, { "epoch": 0.04, "learning_rate": 4.998112268038703e-06, "loss": 0.8118, "step": 2227 }, { "epoch": 0.04, "learning_rate": 4.998106327857925e-06, "loss": 0.9485, "step": 2228 }, { "epoch": 0.04, "learning_rate": 4.998100378349294e-06, "loss": 1.0045, "step": 2229 }, { "epoch": 0.04, "learning_rate": 4.998094419512833e-06, "loss": 1.1303, "step": 2230 }, { "epoch": 0.04, "learning_rate": 4.998088451348564e-06, "loss": 1.1493, "step": 2231 }, { "epoch": 0.04, "learning_rate": 4.99808247385651e-06, "loss": 1.0078, "step": 2232 }, { "epoch": 0.04, "learning_rate": 4.998076487036691e-06, "loss": 1.2086, "step": 2233 }, { "epoch": 0.04, "learning_rate": 4.998070490889133e-06, "loss": 0.7765, "step": 2234 }, { "epoch": 0.04, "learning_rate": 4.9980644854138555e-06, "loss": 0.7526, "step": 2235 }, { "epoch": 0.04, "learning_rate": 4.998058470610882e-06, "loss": 0.9755, "step": 2236 }, { "epoch": 0.04, "learning_rate": 4.998052446480234e-06, "loss": 1.0338, "step": 2237 }, { "epoch": 0.04, "learning_rate": 4.9980464130219356e-06, "loss": 1.0809, "step": 2238 }, { "epoch": 0.04, "learning_rate": 4.998040370236008e-06, "loss": 0.8893, "step": 2239 }, { "epoch": 0.04, "learning_rate": 4.998034318122475e-06, "loss": 0.809, "step": 2240 }, { "epoch": 0.04, "learning_rate": 4.998028256681356e-06, "loss": 1.0169, "step": 2241 }, { "epoch": 0.04, "learning_rate": 4.998022185912679e-06, "loss": 0.8633, "step": 2242 }, { "epoch": 0.04, "learning_rate": 4.998016105816462e-06, "loss": 0.8559, "step": 2243 }, { "epoch": 0.04, "learning_rate": 4.99801001639273e-06, "loss": 1.2089, "step": 2244 }, { "epoch": 0.04, "learning_rate": 4.9980039176415054e-06, "loss": 0.9699, "step": 2245 }, { "epoch": 0.04, "learning_rate": 4.997997809562811e-06, "loss": 0.9397, "step": 2246 }, { "epoch": 0.04, "learning_rate": 4.997991692156668e-06, "loss": 0.9747, "step": 2247 }, { "epoch": 0.04, "learning_rate": 4.997985565423103e-06, "loss": 1.0078, "step": 2248 }, { "epoch": 0.04, "learning_rate": 4.997979429362135e-06, "loss": 0.9453, "step": 2249 }, { "epoch": 0.04, "learning_rate": 4.997973283973788e-06, "loss": 1.0094, "step": 2250 }, { "epoch": 0.04, "learning_rate": 4.997967129258086e-06, "loss": 1.0492, "step": 2251 }, { "epoch": 0.04, "learning_rate": 4.997960965215051e-06, "loss": 0.8392, "step": 2252 }, { "epoch": 0.04, "learning_rate": 4.997954791844707e-06, "loss": 0.8975, "step": 2253 }, { "epoch": 0.04, "learning_rate": 4.997948609147075e-06, "loss": 0.908, "step": 2254 }, { "epoch": 0.04, "learning_rate": 4.997942417122181e-06, "loss": 1.0337, "step": 2255 }, { "epoch": 0.04, "learning_rate": 4.997936215770046e-06, "loss": 1.0663, "step": 2256 }, { "epoch": 0.04, "learning_rate": 4.997930005090694e-06, "loss": 1.0842, "step": 2257 }, { "epoch": 0.04, "learning_rate": 4.997923785084147e-06, "loss": 0.6822, "step": 2258 }, { "epoch": 0.04, "learning_rate": 4.99791755575043e-06, "loss": 1.1534, "step": 2259 }, { "epoch": 0.04, "learning_rate": 4.997911317089566e-06, "loss": 0.9708, "step": 2260 }, { "epoch": 0.04, "learning_rate": 4.997905069101576e-06, "loss": 1.0905, "step": 2261 }, { "epoch": 0.04, "learning_rate": 4.997898811786487e-06, "loss": 1.2418, "step": 2262 }, { "epoch": 0.04, "learning_rate": 4.99789254514432e-06, "loss": 1.212, "step": 2263 }, { "epoch": 0.04, "learning_rate": 4.997886269175097e-06, "loss": 0.9263, "step": 2264 }, { "epoch": 0.04, "learning_rate": 4.997879983878845e-06, "loss": 0.9399, "step": 2265 }, { "epoch": 0.04, "learning_rate": 4.997873689255586e-06, "loss": 0.9047, "step": 2266 }, { "epoch": 0.04, "learning_rate": 4.997867385305342e-06, "loss": 1.019, "step": 2267 }, { "epoch": 0.04, "learning_rate": 4.997861072028139e-06, "loss": 0.9815, "step": 2268 }, { "epoch": 0.04, "learning_rate": 4.9978547494239985e-06, "loss": 1.1105, "step": 2269 }, { "epoch": 0.04, "learning_rate": 4.997848417492944e-06, "loss": 0.9396, "step": 2270 }, { "epoch": 0.04, "learning_rate": 4.997842076235002e-06, "loss": 1.0163, "step": 2271 }, { "epoch": 0.04, "learning_rate": 4.997835725650193e-06, "loss": 1.0108, "step": 2272 }, { "epoch": 0.04, "learning_rate": 4.997829365738543e-06, "loss": 0.9337, "step": 2273 }, { "epoch": 0.04, "learning_rate": 4.997822996500074e-06, "loss": 1.1555, "step": 2274 }, { "epoch": 0.04, "learning_rate": 4.997816617934811e-06, "loss": 0.9682, "step": 2275 }, { "epoch": 0.04, "learning_rate": 4.997810230042777e-06, "loss": 0.8091, "step": 2276 }, { "epoch": 0.04, "learning_rate": 4.997803832823996e-06, "loss": 0.9676, "step": 2277 }, { "epoch": 0.04, "learning_rate": 4.997797426278492e-06, "loss": 1.0646, "step": 2278 }, { "epoch": 0.04, "learning_rate": 4.9977910104062895e-06, "loss": 0.9187, "step": 2279 }, { "epoch": 0.04, "learning_rate": 4.997784585207412e-06, "loss": 1.1119, "step": 2280 }, { "epoch": 0.04, "learning_rate": 4.997778150681883e-06, "loss": 1.2076, "step": 2281 }, { "epoch": 0.04, "learning_rate": 4.9977717068297275e-06, "loss": 1.1225, "step": 2282 }, { "epoch": 0.04, "learning_rate": 4.997765253650968e-06, "loss": 1.0205, "step": 2283 }, { "epoch": 0.04, "learning_rate": 4.997758791145631e-06, "loss": 1.082, "step": 2284 }, { "epoch": 0.04, "learning_rate": 4.997752319313739e-06, "loss": 1.0493, "step": 2285 }, { "epoch": 0.04, "learning_rate": 4.997745838155315e-06, "loss": 0.9445, "step": 2286 }, { "epoch": 0.04, "learning_rate": 4.997739347670386e-06, "loss": 0.9671, "step": 2287 }, { "epoch": 0.04, "learning_rate": 4.997732847858975e-06, "loss": 1.0966, "step": 2288 }, { "epoch": 0.04, "learning_rate": 4.997726338721105e-06, "loss": 1.0138, "step": 2289 }, { "epoch": 0.04, "learning_rate": 4.9977198202568025e-06, "loss": 0.8934, "step": 2290 }, { "epoch": 0.04, "learning_rate": 4.99771329246609e-06, "loss": 0.7627, "step": 2291 }, { "epoch": 0.04, "learning_rate": 4.997706755348993e-06, "loss": 0.9875, "step": 2292 }, { "epoch": 0.04, "learning_rate": 4.997700208905536e-06, "loss": 1.0259, "step": 2293 }, { "epoch": 0.04, "learning_rate": 4.997693653135742e-06, "loss": 1.0186, "step": 2294 }, { "epoch": 0.04, "learning_rate": 4.997687088039637e-06, "loss": 1.1537, "step": 2295 }, { "epoch": 0.04, "learning_rate": 4.997680513617245e-06, "loss": 0.7933, "step": 2296 }, { "epoch": 0.04, "learning_rate": 4.99767392986859e-06, "loss": 1.0447, "step": 2297 }, { "epoch": 0.04, "learning_rate": 4.997667336793698e-06, "loss": 1.0231, "step": 2298 }, { "epoch": 0.04, "learning_rate": 4.9976607343925935e-06, "loss": 1.1169, "step": 2299 }, { "epoch": 0.04, "learning_rate": 4.9976541226652985e-06, "loss": 1.2643, "step": 2300 }, { "epoch": 0.04, "learning_rate": 4.997647501611841e-06, "loss": 0.9677, "step": 2301 }, { "epoch": 0.04, "learning_rate": 4.997640871232244e-06, "loss": 1.1011, "step": 2302 }, { "epoch": 0.04, "learning_rate": 4.997634231526531e-06, "loss": 0.9142, "step": 2303 }, { "epoch": 0.04, "learning_rate": 4.9976275824947305e-06, "loss": 1.1206, "step": 2304 }, { "epoch": 0.04, "learning_rate": 4.997620924136865e-06, "loss": 0.8636, "step": 2305 }, { "epoch": 0.04, "learning_rate": 4.997614256452958e-06, "loss": 1.0391, "step": 2306 }, { "epoch": 0.04, "learning_rate": 4.997607579443037e-06, "loss": 0.8753, "step": 2307 }, { "epoch": 0.04, "learning_rate": 4.997600893107125e-06, "loss": 0.9754, "step": 2308 }, { "epoch": 0.04, "learning_rate": 4.997594197445249e-06, "loss": 1.0082, "step": 2309 }, { "epoch": 0.04, "learning_rate": 4.997587492457433e-06, "loss": 1.0005, "step": 2310 }, { "epoch": 0.04, "learning_rate": 4.997580778143701e-06, "loss": 0.9169, "step": 2311 }, { "epoch": 0.04, "learning_rate": 4.997574054504078e-06, "loss": 1.2164, "step": 2312 }, { "epoch": 0.04, "learning_rate": 4.997567321538592e-06, "loss": 1.0249, "step": 2313 }, { "epoch": 0.04, "learning_rate": 4.9975605792472655e-06, "loss": 0.8056, "step": 2314 }, { "epoch": 0.04, "learning_rate": 4.9975538276301245e-06, "loss": 1.1831, "step": 2315 }, { "epoch": 0.04, "learning_rate": 4.997547066687194e-06, "loss": 0.9287, "step": 2316 }, { "epoch": 0.04, "learning_rate": 4.997540296418499e-06, "loss": 1.1053, "step": 2317 }, { "epoch": 0.04, "learning_rate": 4.997533516824066e-06, "loss": 1.1021, "step": 2318 }, { "epoch": 0.04, "learning_rate": 4.997526727903919e-06, "loss": 1.2411, "step": 2319 }, { "epoch": 0.04, "learning_rate": 4.9975199296580825e-06, "loss": 0.8793, "step": 2320 }, { "epoch": 0.04, "learning_rate": 4.9975131220865845e-06, "loss": 0.9003, "step": 2321 }, { "epoch": 0.04, "learning_rate": 4.997506305189449e-06, "loss": 0.9758, "step": 2322 }, { "epoch": 0.04, "learning_rate": 4.997499478966701e-06, "loss": 1.0507, "step": 2323 }, { "epoch": 0.04, "learning_rate": 4.997492643418367e-06, "loss": 1.0414, "step": 2324 }, { "epoch": 0.04, "learning_rate": 4.997485798544472e-06, "loss": 1.1473, "step": 2325 }, { "epoch": 0.04, "learning_rate": 4.997478944345041e-06, "loss": 1.165, "step": 2326 }, { "epoch": 0.04, "learning_rate": 4.997472080820102e-06, "loss": 0.9477, "step": 2327 }, { "epoch": 0.04, "learning_rate": 4.997465207969677e-06, "loss": 1.0015, "step": 2328 }, { "epoch": 0.04, "learning_rate": 4.997458325793794e-06, "loss": 0.8978, "step": 2329 }, { "epoch": 0.04, "learning_rate": 4.997451434292478e-06, "loss": 0.9355, "step": 2330 }, { "epoch": 0.04, "learning_rate": 4.997444533465755e-06, "loss": 1.003, "step": 2331 }, { "epoch": 0.04, "learning_rate": 4.997437623313652e-06, "loss": 1.0204, "step": 2332 }, { "epoch": 0.04, "learning_rate": 4.997430703836192e-06, "loss": 0.7126, "step": 2333 }, { "epoch": 0.04, "learning_rate": 4.997423775033402e-06, "loss": 0.958, "step": 2334 }, { "epoch": 0.04, "learning_rate": 4.997416836905309e-06, "loss": 0.7828, "step": 2335 }, { "epoch": 0.04, "learning_rate": 4.997409889451937e-06, "loss": 0.8133, "step": 2336 }, { "epoch": 0.04, "learning_rate": 4.997402932673314e-06, "loss": 1.2706, "step": 2337 }, { "epoch": 0.04, "learning_rate": 4.997395966569465e-06, "loss": 1.1257, "step": 2338 }, { "epoch": 0.04, "learning_rate": 4.997388991140416e-06, "loss": 0.8815, "step": 2339 }, { "epoch": 0.04, "learning_rate": 4.997382006386194e-06, "loss": 0.8238, "step": 2340 }, { "epoch": 0.04, "learning_rate": 4.997375012306823e-06, "loss": 1.119, "step": 2341 }, { "epoch": 0.04, "learning_rate": 4.9973680089023304e-06, "loss": 0.9201, "step": 2342 }, { "epoch": 0.04, "learning_rate": 4.997360996172742e-06, "loss": 1.2729, "step": 2343 }, { "epoch": 0.04, "learning_rate": 4.997353974118085e-06, "loss": 1.1539, "step": 2344 }, { "epoch": 0.04, "learning_rate": 4.997346942738384e-06, "loss": 1.0964, "step": 2345 }, { "epoch": 0.04, "learning_rate": 4.997339902033667e-06, "loss": 0.9666, "step": 2346 }, { "epoch": 0.04, "learning_rate": 4.997332852003959e-06, "loss": 0.9594, "step": 2347 }, { "epoch": 0.04, "learning_rate": 4.9973257926492854e-06, "loss": 0.9956, "step": 2348 }, { "epoch": 0.04, "learning_rate": 4.9973187239696755e-06, "loss": 1.0966, "step": 2349 }, { "epoch": 0.04, "learning_rate": 4.997311645965154e-06, "loss": 1.2269, "step": 2350 }, { "epoch": 0.04, "learning_rate": 4.997304558635747e-06, "loss": 0.7933, "step": 2351 }, { "epoch": 0.04, "learning_rate": 4.99729746198148e-06, "loss": 0.9324, "step": 2352 }, { "epoch": 0.04, "learning_rate": 4.997290356002383e-06, "loss": 0.9594, "step": 2353 }, { "epoch": 0.04, "learning_rate": 4.997283240698479e-06, "loss": 0.9108, "step": 2354 }, { "epoch": 0.04, "learning_rate": 4.997276116069797e-06, "loss": 1.0797, "step": 2355 }, { "epoch": 0.04, "learning_rate": 4.997268982116362e-06, "loss": 0.9209, "step": 2356 }, { "epoch": 0.04, "learning_rate": 4.997261838838201e-06, "loss": 1.0598, "step": 2357 }, { "epoch": 0.04, "learning_rate": 4.997254686235341e-06, "loss": 0.8282, "step": 2358 }, { "epoch": 0.04, "learning_rate": 4.997247524307809e-06, "loss": 0.9254, "step": 2359 }, { "epoch": 0.04, "learning_rate": 4.997240353055631e-06, "loss": 1.1039, "step": 2360 }, { "epoch": 0.04, "learning_rate": 4.9972331724788335e-06, "loss": 1.0436, "step": 2361 }, { "epoch": 0.04, "learning_rate": 4.997225982577445e-06, "loss": 0.959, "step": 2362 }, { "epoch": 0.04, "learning_rate": 4.997218783351491e-06, "loss": 1.108, "step": 2363 }, { "epoch": 0.04, "learning_rate": 4.9972115748009984e-06, "loss": 1.0141, "step": 2364 }, { "epoch": 0.04, "learning_rate": 4.9972043569259945e-06, "loss": 1.0119, "step": 2365 }, { "epoch": 0.04, "learning_rate": 4.9971971297265055e-06, "loss": 0.9247, "step": 2366 }, { "epoch": 0.04, "learning_rate": 4.9971898932025585e-06, "loss": 0.9553, "step": 2367 }, { "epoch": 0.04, "learning_rate": 4.997182647354182e-06, "loss": 1.0199, "step": 2368 }, { "epoch": 0.04, "learning_rate": 4.997175392181403e-06, "loss": 1.0611, "step": 2369 }, { "epoch": 0.04, "learning_rate": 4.997168127684246e-06, "loss": 1.0549, "step": 2370 }, { "epoch": 0.04, "learning_rate": 4.997160853862741e-06, "loss": 0.8018, "step": 2371 }, { "epoch": 0.04, "learning_rate": 4.997153570716913e-06, "loss": 1.0179, "step": 2372 }, { "epoch": 0.04, "learning_rate": 4.99714627824679e-06, "loss": 0.9772, "step": 2373 }, { "epoch": 0.04, "learning_rate": 4.997138976452399e-06, "loss": 0.9792, "step": 2374 }, { "epoch": 0.04, "learning_rate": 4.997131665333769e-06, "loss": 1.0915, "step": 2375 }, { "epoch": 0.04, "learning_rate": 4.9971243448909255e-06, "loss": 0.8912, "step": 2376 }, { "epoch": 0.04, "learning_rate": 4.997117015123896e-06, "loss": 0.9666, "step": 2377 }, { "epoch": 0.04, "learning_rate": 4.997109676032708e-06, "loss": 0.8747, "step": 2378 }, { "epoch": 0.04, "learning_rate": 4.997102327617389e-06, "loss": 0.9233, "step": 2379 }, { "epoch": 0.04, "learning_rate": 4.997094969877967e-06, "loss": 1.0243, "step": 2380 }, { "epoch": 0.04, "learning_rate": 4.9970876028144685e-06, "loss": 1.2963, "step": 2381 }, { "epoch": 0.04, "learning_rate": 4.997080226426922e-06, "loss": 1.1926, "step": 2382 }, { "epoch": 0.04, "learning_rate": 4.997072840715354e-06, "loss": 0.9952, "step": 2383 }, { "epoch": 0.04, "learning_rate": 4.997065445679793e-06, "loss": 0.9924, "step": 2384 }, { "epoch": 0.04, "learning_rate": 4.997058041320265e-06, "loss": 1.0687, "step": 2385 }, { "epoch": 0.05, "learning_rate": 4.9970506276368e-06, "loss": 0.8896, "step": 2386 }, { "epoch": 0.05, "learning_rate": 4.9970432046294245e-06, "loss": 1.1547, "step": 2387 }, { "epoch": 0.05, "learning_rate": 4.997035772298165e-06, "loss": 0.9196, "step": 2388 }, { "epoch": 0.05, "learning_rate": 4.997028330643052e-06, "loss": 0.8693, "step": 2389 }, { "epoch": 0.05, "learning_rate": 4.997020879664112e-06, "loss": 1.1883, "step": 2390 }, { "epoch": 0.05, "learning_rate": 4.997013419361372e-06, "loss": 1.1262, "step": 2391 }, { "epoch": 0.05, "learning_rate": 4.99700594973486e-06, "loss": 0.8725, "step": 2392 }, { "epoch": 0.05, "learning_rate": 4.9969984707846044e-06, "loss": 0.9312, "step": 2393 }, { "epoch": 0.05, "learning_rate": 4.996990982510633e-06, "loss": 0.8753, "step": 2394 }, { "epoch": 0.05, "learning_rate": 4.996983484912974e-06, "loss": 1.0457, "step": 2395 }, { "epoch": 0.05, "learning_rate": 4.9969759779916555e-06, "loss": 0.9518, "step": 2396 }, { "epoch": 0.05, "learning_rate": 4.996968461746705e-06, "loss": 0.7665, "step": 2397 }, { "epoch": 0.05, "learning_rate": 4.996960936178151e-06, "loss": 1.0523, "step": 2398 }, { "epoch": 0.05, "learning_rate": 4.996953401286021e-06, "loss": 1.1733, "step": 2399 }, { "epoch": 0.05, "learning_rate": 4.996945857070345e-06, "loss": 0.9304, "step": 2400 }, { "epoch": 0.05, "learning_rate": 4.996938303531148e-06, "loss": 0.8415, "step": 2401 }, { "epoch": 0.05, "learning_rate": 4.996930740668461e-06, "loss": 0.9942, "step": 2402 }, { "epoch": 0.05, "learning_rate": 4.9969231684823105e-06, "loss": 0.962, "step": 2403 }, { "epoch": 0.05, "learning_rate": 4.996915586972725e-06, "loss": 1.1083, "step": 2404 }, { "epoch": 0.05, "learning_rate": 4.996907996139734e-06, "loss": 1.1027, "step": 2405 }, { "epoch": 0.05, "learning_rate": 4.996900395983365e-06, "loss": 1.1508, "step": 2406 }, { "epoch": 0.05, "learning_rate": 4.996892786503647e-06, "loss": 0.9096, "step": 2407 }, { "epoch": 0.05, "learning_rate": 4.996885167700607e-06, "loss": 0.8227, "step": 2408 }, { "epoch": 0.05, "learning_rate": 4.996877539574275e-06, "loss": 0.9612, "step": 2409 }, { "epoch": 0.05, "learning_rate": 4.996869902124679e-06, "loss": 0.8669, "step": 2410 }, { "epoch": 0.05, "learning_rate": 4.996862255351847e-06, "loss": 0.9207, "step": 2411 }, { "epoch": 0.05, "learning_rate": 4.996854599255807e-06, "loss": 1.2382, "step": 2412 }, { "epoch": 0.05, "learning_rate": 4.996846933836589e-06, "loss": 0.9065, "step": 2413 }, { "epoch": 0.05, "learning_rate": 4.996839259094222e-06, "loss": 0.8559, "step": 2414 }, { "epoch": 0.05, "learning_rate": 4.996831575028733e-06, "loss": 0.8471, "step": 2415 }, { "epoch": 0.05, "learning_rate": 4.996823881640152e-06, "loss": 0.834, "step": 2416 }, { "epoch": 0.05, "learning_rate": 4.996816178928507e-06, "loss": 0.9771, "step": 2417 }, { "epoch": 0.05, "learning_rate": 4.996808466893826e-06, "loss": 1.0546, "step": 2418 }, { "epoch": 0.05, "learning_rate": 4.9968007455361395e-06, "loss": 0.8676, "step": 2419 }, { "epoch": 0.05, "learning_rate": 4.996793014855476e-06, "loss": 0.9791, "step": 2420 }, { "epoch": 0.05, "learning_rate": 4.996785274851863e-06, "loss": 0.6642, "step": 2421 }, { "epoch": 0.05, "learning_rate": 4.9967775255253305e-06, "loss": 1.0531, "step": 2422 }, { "epoch": 0.05, "learning_rate": 4.996769766875908e-06, "loss": 1.0298, "step": 2423 }, { "epoch": 0.05, "learning_rate": 4.996761998903623e-06, "loss": 0.9694, "step": 2424 }, { "epoch": 0.05, "learning_rate": 4.996754221608506e-06, "loss": 1.1849, "step": 2425 }, { "epoch": 0.05, "learning_rate": 4.996746434990585e-06, "loss": 0.9384, "step": 2426 }, { "epoch": 0.05, "learning_rate": 4.996738639049889e-06, "loss": 0.8275, "step": 2427 }, { "epoch": 0.05, "learning_rate": 4.9967308337864475e-06, "loss": 1.0562, "step": 2428 }, { "epoch": 0.05, "learning_rate": 4.99672301920029e-06, "loss": 0.7932, "step": 2429 }, { "epoch": 0.05, "learning_rate": 4.996715195291445e-06, "loss": 0.8877, "step": 2430 }, { "epoch": 0.05, "learning_rate": 4.996707362059942e-06, "loss": 1.155, "step": 2431 }, { "epoch": 0.05, "learning_rate": 4.99669951950581e-06, "loss": 1.0533, "step": 2432 }, { "epoch": 0.05, "learning_rate": 4.99669166762908e-06, "loss": 0.9757, "step": 2433 }, { "epoch": 0.05, "learning_rate": 4.9966838064297785e-06, "loss": 1.0864, "step": 2434 }, { "epoch": 0.05, "learning_rate": 4.996675935907937e-06, "loss": 1.1221, "step": 2435 }, { "epoch": 0.05, "learning_rate": 4.996668056063583e-06, "loss": 1.043, "step": 2436 }, { "epoch": 0.05, "learning_rate": 4.9966601668967475e-06, "loss": 1.0156, "step": 2437 }, { "epoch": 0.05, "learning_rate": 4.996652268407459e-06, "loss": 1.0488, "step": 2438 }, { "epoch": 0.05, "learning_rate": 4.9966443605957485e-06, "loss": 0.771, "step": 2439 }, { "epoch": 0.05, "learning_rate": 4.996636443461645e-06, "loss": 0.8616, "step": 2440 }, { "epoch": 0.05, "learning_rate": 4.996628517005176e-06, "loss": 0.8579, "step": 2441 }, { "epoch": 0.05, "learning_rate": 4.9966205812263735e-06, "loss": 1.0199, "step": 2442 }, { "epoch": 0.05, "learning_rate": 4.996612636125266e-06, "loss": 1.0231, "step": 2443 }, { "epoch": 0.05, "learning_rate": 4.996604681701883e-06, "loss": 1.2661, "step": 2444 }, { "epoch": 0.05, "learning_rate": 4.996596717956256e-06, "loss": 1.1879, "step": 2445 }, { "epoch": 0.05, "learning_rate": 4.996588744888412e-06, "loss": 0.8585, "step": 2446 }, { "epoch": 0.05, "learning_rate": 4.996580762498383e-06, "loss": 1.0215, "step": 2447 }, { "epoch": 0.05, "learning_rate": 4.996572770786198e-06, "loss": 0.8109, "step": 2448 }, { "epoch": 0.05, "learning_rate": 4.996564769751887e-06, "loss": 1.0459, "step": 2449 }, { "epoch": 0.05, "learning_rate": 4.996556759395479e-06, "loss": 1.2755, "step": 2450 }, { "epoch": 0.05, "learning_rate": 4.996548739717005e-06, "loss": 1.2357, "step": 2451 }, { "epoch": 0.05, "learning_rate": 4.996540710716494e-06, "loss": 0.7621, "step": 2452 }, { "epoch": 0.05, "learning_rate": 4.996532672393978e-06, "loss": 0.9714, "step": 2453 }, { "epoch": 0.05, "learning_rate": 4.996524624749484e-06, "loss": 0.9062, "step": 2454 }, { "epoch": 0.05, "learning_rate": 4.996516567783044e-06, "loss": 1.2751, "step": 2455 }, { "epoch": 0.05, "learning_rate": 4.996508501494688e-06, "loss": 1.1334, "step": 2456 }, { "epoch": 0.05, "learning_rate": 4.996500425884446e-06, "loss": 1.0227, "step": 2457 }, { "epoch": 0.05, "learning_rate": 4.996492340952347e-06, "loss": 0.9178, "step": 2458 }, { "epoch": 0.05, "learning_rate": 4.996484246698423e-06, "loss": 0.853, "step": 2459 }, { "epoch": 0.05, "learning_rate": 4.996476143122704e-06, "loss": 0.9612, "step": 2460 }, { "epoch": 0.05, "learning_rate": 4.996468030225217e-06, "loss": 1.1218, "step": 2461 }, { "epoch": 0.05, "learning_rate": 4.996459908005997e-06, "loss": 1.1701, "step": 2462 }, { "epoch": 0.05, "learning_rate": 4.996451776465072e-06, "loss": 1.2157, "step": 2463 }, { "epoch": 0.05, "learning_rate": 4.9964436356024735e-06, "loss": 0.8865, "step": 2464 }, { "epoch": 0.05, "learning_rate": 4.996435485418229e-06, "loss": 0.8732, "step": 2465 }, { "epoch": 0.05, "learning_rate": 4.996427325912372e-06, "loss": 0.8422, "step": 2466 }, { "epoch": 0.05, "learning_rate": 4.996419157084932e-06, "loss": 0.9436, "step": 2467 }, { "epoch": 0.05, "learning_rate": 4.996410978935939e-06, "loss": 1.1846, "step": 2468 }, { "epoch": 0.05, "learning_rate": 4.996402791465425e-06, "loss": 1.0206, "step": 2469 }, { "epoch": 0.05, "learning_rate": 4.996394594673418e-06, "loss": 0.9934, "step": 2470 }, { "epoch": 0.05, "learning_rate": 4.996386388559952e-06, "loss": 1.0388, "step": 2471 }, { "epoch": 0.05, "learning_rate": 4.996378173125054e-06, "loss": 0.969, "step": 2472 }, { "epoch": 0.05, "learning_rate": 4.9963699483687575e-06, "loss": 1.0319, "step": 2473 }, { "epoch": 0.05, "learning_rate": 4.996361714291091e-06, "loss": 1.0294, "step": 2474 }, { "epoch": 0.05, "learning_rate": 4.996353470892088e-06, "loss": 1.2341, "step": 2475 }, { "epoch": 0.05, "learning_rate": 4.996345218171777e-06, "loss": 0.9739, "step": 2476 }, { "epoch": 0.05, "learning_rate": 4.996336956130189e-06, "loss": 0.8588, "step": 2477 }, { "epoch": 0.05, "learning_rate": 4.996328684767355e-06, "loss": 1.0137, "step": 2478 }, { "epoch": 0.05, "learning_rate": 4.996320404083307e-06, "loss": 0.9952, "step": 2479 }, { "epoch": 0.05, "learning_rate": 4.996312114078075e-06, "loss": 0.8556, "step": 2480 }, { "epoch": 0.05, "learning_rate": 4.9963038147516905e-06, "loss": 0.9481, "step": 2481 }, { "epoch": 0.05, "learning_rate": 4.996295506104184e-06, "loss": 1.028, "step": 2482 }, { "epoch": 0.05, "learning_rate": 4.996287188135586e-06, "loss": 0.8206, "step": 2483 }, { "epoch": 0.05, "learning_rate": 4.996278860845928e-06, "loss": 0.9423, "step": 2484 }, { "epoch": 0.05, "learning_rate": 4.996270524235242e-06, "loss": 0.972, "step": 2485 }, { "epoch": 0.05, "learning_rate": 4.996262178303558e-06, "loss": 0.9318, "step": 2486 }, { "epoch": 0.05, "learning_rate": 4.996253823050908e-06, "loss": 1.0916, "step": 2487 }, { "epoch": 0.05, "learning_rate": 4.996245458477323e-06, "loss": 0.9137, "step": 2488 }, { "epoch": 0.05, "learning_rate": 4.996237084582833e-06, "loss": 1.0225, "step": 2489 }, { "epoch": 0.05, "learning_rate": 4.996228701367471e-06, "loss": 1.0541, "step": 2490 }, { "epoch": 0.05, "learning_rate": 4.996220308831268e-06, "loss": 0.9404, "step": 2491 }, { "epoch": 0.05, "learning_rate": 4.996211906974253e-06, "loss": 0.8799, "step": 2492 }, { "epoch": 0.05, "learning_rate": 4.996203495796461e-06, "loss": 1.1533, "step": 2493 }, { "epoch": 0.05, "learning_rate": 4.9961950752979215e-06, "loss": 0.9086, "step": 2494 }, { "epoch": 0.05, "learning_rate": 4.996186645478665e-06, "loss": 1.1453, "step": 2495 }, { "epoch": 0.05, "learning_rate": 4.9961782063387256e-06, "loss": 1.0404, "step": 2496 }, { "epoch": 0.05, "learning_rate": 4.996169757878133e-06, "loss": 0.9088, "step": 2497 }, { "epoch": 0.05, "learning_rate": 4.996161300096919e-06, "loss": 0.8822, "step": 2498 }, { "epoch": 0.05, "learning_rate": 4.996152832995114e-06, "loss": 0.9948, "step": 2499 }, { "epoch": 0.05, "learning_rate": 4.996144356572752e-06, "loss": 1.2227, "step": 2500 }, { "epoch": 0.05, "learning_rate": 4.996135870829864e-06, "loss": 0.9102, "step": 2501 }, { "epoch": 0.05, "learning_rate": 4.9961273757664795e-06, "loss": 0.8559, "step": 2502 }, { "epoch": 0.05, "learning_rate": 4.9961188713826334e-06, "loss": 0.9181, "step": 2503 }, { "epoch": 0.05, "learning_rate": 4.996110357678355e-06, "loss": 0.9991, "step": 2504 }, { "epoch": 0.05, "learning_rate": 4.996101834653678e-06, "loss": 1.0787, "step": 2505 }, { "epoch": 0.05, "learning_rate": 4.9960933023086325e-06, "loss": 1.2021, "step": 2506 }, { "epoch": 0.05, "learning_rate": 4.996084760643251e-06, "loss": 0.8942, "step": 2507 }, { "epoch": 0.05, "learning_rate": 4.996076209657567e-06, "loss": 0.8279, "step": 2508 }, { "epoch": 0.05, "learning_rate": 4.9960676493516095e-06, "loss": 0.9865, "step": 2509 }, { "epoch": 0.05, "learning_rate": 4.996059079725412e-06, "loss": 0.9958, "step": 2510 }, { "epoch": 0.05, "learning_rate": 4.996050500779007e-06, "loss": 0.9416, "step": 2511 }, { "epoch": 0.05, "learning_rate": 4.996041912512426e-06, "loss": 1.0609, "step": 2512 }, { "epoch": 0.05, "learning_rate": 4.996033314925701e-06, "loss": 1.1297, "step": 2513 }, { "epoch": 0.05, "learning_rate": 4.996024708018864e-06, "loss": 0.9931, "step": 2514 }, { "epoch": 0.05, "learning_rate": 4.996016091791947e-06, "loss": 0.9673, "step": 2515 }, { "epoch": 0.05, "learning_rate": 4.996007466244983e-06, "loss": 0.9033, "step": 2516 }, { "epoch": 0.05, "learning_rate": 4.995998831378003e-06, "loss": 1.0727, "step": 2517 }, { "epoch": 0.05, "learning_rate": 4.99599018719104e-06, "loss": 1.0739, "step": 2518 }, { "epoch": 0.05, "learning_rate": 4.995981533684126e-06, "loss": 1.0201, "step": 2519 }, { "epoch": 0.05, "learning_rate": 4.995972870857294e-06, "loss": 0.9438, "step": 2520 }, { "epoch": 0.05, "learning_rate": 4.995964198710576e-06, "loss": 0.8405, "step": 2521 }, { "epoch": 0.05, "learning_rate": 4.9959555172440035e-06, "loss": 0.9697, "step": 2522 }, { "epoch": 0.05, "learning_rate": 4.9959468264576105e-06, "loss": 0.9039, "step": 2523 }, { "epoch": 0.05, "learning_rate": 4.9959381263514275e-06, "loss": 0.8931, "step": 2524 }, { "epoch": 0.05, "learning_rate": 4.995929416925489e-06, "loss": 1.2561, "step": 2525 }, { "epoch": 0.05, "learning_rate": 4.995920698179826e-06, "loss": 1.0666, "step": 2526 }, { "epoch": 0.05, "learning_rate": 4.995911970114472e-06, "loss": 0.8622, "step": 2527 }, { "epoch": 0.05, "learning_rate": 4.995903232729459e-06, "loss": 0.959, "step": 2528 }, { "epoch": 0.05, "learning_rate": 4.99589448602482e-06, "loss": 0.8411, "step": 2529 }, { "epoch": 0.05, "learning_rate": 4.995885730000587e-06, "loss": 0.9047, "step": 2530 }, { "epoch": 0.05, "learning_rate": 4.995876964656794e-06, "loss": 1.299, "step": 2531 }, { "epoch": 0.05, "learning_rate": 4.995868189993473e-06, "loss": 1.2379, "step": 2532 }, { "epoch": 0.05, "learning_rate": 4.995859406010656e-06, "loss": 0.8615, "step": 2533 }, { "epoch": 0.05, "learning_rate": 4.995850612708377e-06, "loss": 0.7419, "step": 2534 }, { "epoch": 0.05, "learning_rate": 4.995841810086668e-06, "loss": 1.0057, "step": 2535 }, { "epoch": 0.05, "learning_rate": 4.995832998145562e-06, "loss": 0.933, "step": 2536 }, { "epoch": 0.05, "learning_rate": 4.995824176885093e-06, "loss": 1.2712, "step": 2537 }, { "epoch": 0.05, "learning_rate": 4.995815346305293e-06, "loss": 0.9713, "step": 2538 }, { "epoch": 0.05, "learning_rate": 4.995806506406194e-06, "loss": 0.8776, "step": 2539 }, { "epoch": 0.05, "learning_rate": 4.995797657187831e-06, "loss": 0.9802, "step": 2540 }, { "epoch": 0.05, "learning_rate": 4.995788798650235e-06, "loss": 0.8569, "step": 2541 }, { "epoch": 0.05, "learning_rate": 4.995779930793441e-06, "loss": 1.1318, "step": 2542 }, { "epoch": 0.05, "learning_rate": 4.995771053617481e-06, "loss": 1.0898, "step": 2543 }, { "epoch": 0.05, "learning_rate": 4.995762167122388e-06, "loss": 0.924, "step": 2544 }, { "epoch": 0.05, "learning_rate": 4.995753271308196e-06, "loss": 0.9006, "step": 2545 }, { "epoch": 0.05, "learning_rate": 4.995744366174938e-06, "loss": 0.8673, "step": 2546 }, { "epoch": 0.05, "learning_rate": 4.995735451722647e-06, "loss": 0.9315, "step": 2547 }, { "epoch": 0.05, "learning_rate": 4.9957265279513566e-06, "loss": 0.8688, "step": 2548 }, { "epoch": 0.05, "learning_rate": 4.995717594861099e-06, "loss": 1.2169, "step": 2549 }, { "epoch": 0.05, "learning_rate": 4.99570865245191e-06, "loss": 1.2692, "step": 2550 }, { "epoch": 0.05, "learning_rate": 4.99569970072382e-06, "loss": 0.869, "step": 2551 }, { "epoch": 0.05, "learning_rate": 4.995690739676864e-06, "loss": 0.6845, "step": 2552 }, { "epoch": 0.05, "learning_rate": 4.995681769311075e-06, "loss": 0.9282, "step": 2553 }, { "epoch": 0.05, "learning_rate": 4.995672789626488e-06, "loss": 0.9985, "step": 2554 }, { "epoch": 0.05, "learning_rate": 4.995663800623134e-06, "loss": 0.996, "step": 2555 }, { "epoch": 0.05, "learning_rate": 4.995654802301049e-06, "loss": 1.1138, "step": 2556 }, { "epoch": 0.05, "learning_rate": 4.995645794660265e-06, "loss": 0.8227, "step": 2557 }, { "epoch": 0.05, "learning_rate": 4.9956367777008156e-06, "loss": 0.8141, "step": 2558 }, { "epoch": 0.05, "learning_rate": 4.995627751422736e-06, "loss": 0.949, "step": 2559 }, { "epoch": 0.05, "learning_rate": 4.995618715826058e-06, "loss": 0.9792, "step": 2560 }, { "epoch": 0.05, "learning_rate": 4.995609670910817e-06, "loss": 0.8926, "step": 2561 }, { "epoch": 0.05, "learning_rate": 4.995600616677045e-06, "loss": 1.0317, "step": 2562 }, { "epoch": 0.05, "learning_rate": 4.9955915531247775e-06, "loss": 1.0246, "step": 2563 }, { "epoch": 0.05, "learning_rate": 4.995582480254047e-06, "loss": 0.8686, "step": 2564 }, { "epoch": 0.05, "learning_rate": 4.995573398064889e-06, "loss": 1.045, "step": 2565 }, { "epoch": 0.05, "learning_rate": 4.995564306557337e-06, "loss": 0.9793, "step": 2566 }, { "epoch": 0.05, "learning_rate": 4.995555205731422e-06, "loss": 1.0486, "step": 2567 }, { "epoch": 0.05, "learning_rate": 4.995546095587183e-06, "loss": 1.1396, "step": 2568 }, { "epoch": 0.05, "learning_rate": 4.9955369761246495e-06, "loss": 1.1357, "step": 2569 }, { "epoch": 0.05, "learning_rate": 4.995527847343859e-06, "loss": 0.9573, "step": 2570 }, { "epoch": 0.05, "learning_rate": 4.995518709244842e-06, "loss": 1.0143, "step": 2571 }, { "epoch": 0.05, "learning_rate": 4.995509561827637e-06, "loss": 0.8653, "step": 2572 }, { "epoch": 0.05, "learning_rate": 4.995500405092274e-06, "loss": 0.9361, "step": 2573 }, { "epoch": 0.05, "learning_rate": 4.99549123903879e-06, "loss": 1.0085, "step": 2574 }, { "epoch": 0.05, "learning_rate": 4.995482063667218e-06, "loss": 1.1558, "step": 2575 }, { "epoch": 0.05, "learning_rate": 4.995472878977592e-06, "loss": 1.001, "step": 2576 }, { "epoch": 0.05, "learning_rate": 4.9954636849699474e-06, "loss": 0.9299, "step": 2577 }, { "epoch": 0.05, "learning_rate": 4.995454481644317e-06, "loss": 0.9277, "step": 2578 }, { "epoch": 0.05, "learning_rate": 4.995445269000737e-06, "loss": 1.0126, "step": 2579 }, { "epoch": 0.05, "learning_rate": 4.995436047039241e-06, "loss": 1.1818, "step": 2580 }, { "epoch": 0.05, "learning_rate": 4.995426815759863e-06, "loss": 1.3268, "step": 2581 }, { "epoch": 0.05, "learning_rate": 4.9954175751626375e-06, "loss": 1.0738, "step": 2582 }, { "epoch": 0.05, "learning_rate": 4.9954083252476e-06, "loss": 1.0116, "step": 2583 }, { "epoch": 0.05, "learning_rate": 4.9953990660147835e-06, "loss": 1.0571, "step": 2584 }, { "epoch": 0.05, "learning_rate": 4.995389797464224e-06, "loss": 1.143, "step": 2585 }, { "epoch": 0.05, "learning_rate": 4.995380519595955e-06, "loss": 1.0275, "step": 2586 }, { "epoch": 0.05, "learning_rate": 4.9953712324100125e-06, "loss": 1.2064, "step": 2587 }, { "epoch": 0.05, "learning_rate": 4.99536193590643e-06, "loss": 1.1005, "step": 2588 }, { "epoch": 0.05, "learning_rate": 4.995352630085242e-06, "loss": 1.0127, "step": 2589 }, { "epoch": 0.05, "learning_rate": 4.9953433149464836e-06, "loss": 0.99, "step": 2590 }, { "epoch": 0.05, "learning_rate": 4.99533399049019e-06, "loss": 1.1523, "step": 2591 }, { "epoch": 0.05, "learning_rate": 4.995324656716396e-06, "loss": 1.0781, "step": 2592 }, { "epoch": 0.05, "learning_rate": 4.995315313625137e-06, "loss": 1.2458, "step": 2593 }, { "epoch": 0.05, "learning_rate": 4.995305961216446e-06, "loss": 1.1763, "step": 2594 }, { "epoch": 0.05, "learning_rate": 4.995296599490359e-06, "loss": 0.8541, "step": 2595 }, { "epoch": 0.05, "learning_rate": 4.995287228446912e-06, "loss": 0.8688, "step": 2596 }, { "epoch": 0.05, "learning_rate": 4.9952778480861385e-06, "loss": 0.9352, "step": 2597 }, { "epoch": 0.05, "learning_rate": 4.995268458408073e-06, "loss": 0.9727, "step": 2598 }, { "epoch": 0.05, "learning_rate": 4.995259059412753e-06, "loss": 1.0677, "step": 2599 }, { "epoch": 0.05, "learning_rate": 4.9952496511002115e-06, "loss": 1.3555, "step": 2600 }, { "epoch": 0.05, "learning_rate": 4.995240233470485e-06, "loss": 1.0192, "step": 2601 }, { "epoch": 0.05, "learning_rate": 4.995230806523608e-06, "loss": 0.9164, "step": 2602 }, { "epoch": 0.05, "learning_rate": 4.995221370259615e-06, "loss": 0.6715, "step": 2603 }, { "epoch": 0.05, "learning_rate": 4.995211924678542e-06, "loss": 0.8386, "step": 2604 }, { "epoch": 0.05, "learning_rate": 4.9952024697804236e-06, "loss": 1.108, "step": 2605 }, { "epoch": 0.05, "learning_rate": 4.995193005565296e-06, "loss": 1.115, "step": 2606 }, { "epoch": 0.05, "learning_rate": 4.995183532033195e-06, "loss": 0.8257, "step": 2607 }, { "epoch": 0.05, "learning_rate": 4.9951740491841545e-06, "loss": 0.9175, "step": 2608 }, { "epoch": 0.05, "learning_rate": 4.995164557018211e-06, "loss": 1.0457, "step": 2609 }, { "epoch": 0.05, "learning_rate": 4.9951550555354e-06, "loss": 0.888, "step": 2610 }, { "epoch": 0.05, "learning_rate": 4.9951455447357556e-06, "loss": 1.1155, "step": 2611 }, { "epoch": 0.05, "learning_rate": 4.995136024619315e-06, "loss": 1.072, "step": 2612 }, { "epoch": 0.05, "learning_rate": 4.9951264951861125e-06, "loss": 1.1666, "step": 2613 }, { "epoch": 0.05, "learning_rate": 4.995116956436184e-06, "loss": 1.0449, "step": 2614 }, { "epoch": 0.05, "learning_rate": 4.995107408369565e-06, "loss": 0.8899, "step": 2615 }, { "epoch": 0.05, "learning_rate": 4.995097850986292e-06, "loss": 0.9402, "step": 2616 }, { "epoch": 0.05, "learning_rate": 4.9950882842864e-06, "loss": 0.9651, "step": 2617 }, { "epoch": 0.05, "learning_rate": 4.995078708269926e-06, "loss": 1.0272, "step": 2618 }, { "epoch": 0.05, "learning_rate": 4.995069122936903e-06, "loss": 1.1932, "step": 2619 }, { "epoch": 0.05, "learning_rate": 4.995059528287369e-06, "loss": 0.7903, "step": 2620 }, { "epoch": 0.05, "learning_rate": 4.995049924321359e-06, "loss": 1.0673, "step": 2621 }, { "epoch": 0.05, "learning_rate": 4.995040311038909e-06, "loss": 1.0141, "step": 2622 }, { "epoch": 0.05, "learning_rate": 4.995030688440056e-06, "loss": 0.9458, "step": 2623 }, { "epoch": 0.05, "learning_rate": 4.995021056524833e-06, "loss": 1.077, "step": 2624 }, { "epoch": 0.05, "learning_rate": 4.995011415293279e-06, "loss": 1.1441, "step": 2625 }, { "epoch": 0.05, "learning_rate": 4.995001764745429e-06, "loss": 1.143, "step": 2626 }, { "epoch": 0.05, "learning_rate": 4.99499210488132e-06, "loss": 0.9321, "step": 2627 }, { "epoch": 0.05, "learning_rate": 4.9949824357009845e-06, "loss": 0.9778, "step": 2628 }, { "epoch": 0.05, "learning_rate": 4.9949727572044625e-06, "loss": 1.0178, "step": 2629 }, { "epoch": 0.05, "learning_rate": 4.9949630693917885e-06, "loss": 0.9494, "step": 2630 }, { "epoch": 0.05, "learning_rate": 4.994953372263e-06, "loss": 1.015, "step": 2631 }, { "epoch": 0.05, "learning_rate": 4.99494366581813e-06, "loss": 0.9313, "step": 2632 }, { "epoch": 0.05, "learning_rate": 4.994933950057218e-06, "loss": 0.7882, "step": 2633 }, { "epoch": 0.05, "learning_rate": 4.994924224980299e-06, "loss": 0.8688, "step": 2634 }, { "epoch": 0.05, "learning_rate": 4.99491449058741e-06, "loss": 0.8613, "step": 2635 }, { "epoch": 0.05, "learning_rate": 4.994904746878586e-06, "loss": 1.085, "step": 2636 }, { "epoch": 0.05, "learning_rate": 4.994894993853865e-06, "loss": 0.9789, "step": 2637 }, { "epoch": 0.05, "learning_rate": 4.994885231513281e-06, "loss": 1.0547, "step": 2638 }, { "epoch": 0.05, "learning_rate": 4.994875459856874e-06, "loss": 1.1049, "step": 2639 }, { "epoch": 0.05, "learning_rate": 4.994865678884677e-06, "loss": 0.9473, "step": 2640 }, { "epoch": 0.05, "learning_rate": 4.994855888596729e-06, "loss": 0.9101, "step": 2641 }, { "epoch": 0.05, "learning_rate": 4.994846088993065e-06, "loss": 0.916, "step": 2642 }, { "epoch": 0.05, "learning_rate": 4.994836280073723e-06, "loss": 1.1742, "step": 2643 }, { "epoch": 0.05, "learning_rate": 4.994826461838737e-06, "loss": 1.2063, "step": 2644 }, { "epoch": 0.05, "learning_rate": 4.994816634288148e-06, "loss": 1.1725, "step": 2645 }, { "epoch": 0.05, "learning_rate": 4.9948067974219884e-06, "loss": 0.9899, "step": 2646 }, { "epoch": 0.05, "learning_rate": 4.994796951240297e-06, "loss": 1.1337, "step": 2647 }, { "epoch": 0.05, "learning_rate": 4.994787095743111e-06, "loss": 0.8811, "step": 2648 }, { "epoch": 0.05, "learning_rate": 4.994777230930466e-06, "loss": 1.1015, "step": 2649 }, { "epoch": 0.05, "learning_rate": 4.994767356802399e-06, "loss": 1.1533, "step": 2650 }, { "epoch": 0.05, "learning_rate": 4.994757473358947e-06, "loss": 0.9843, "step": 2651 }, { "epoch": 0.05, "learning_rate": 4.994747580600148e-06, "loss": 0.8442, "step": 2652 }, { "epoch": 0.05, "learning_rate": 4.994737678526038e-06, "loss": 0.9902, "step": 2653 }, { "epoch": 0.05, "learning_rate": 4.994727767136654e-06, "loss": 0.9652, "step": 2654 }, { "epoch": 0.05, "learning_rate": 4.994717846432032e-06, "loss": 0.9505, "step": 2655 }, { "epoch": 0.05, "learning_rate": 4.99470791641221e-06, "loss": 1.2771, "step": 2656 }, { "epoch": 0.05, "learning_rate": 4.994697977077226e-06, "loss": 1.2365, "step": 2657 }, { "epoch": 0.05, "learning_rate": 4.994688028427116e-06, "loss": 0.8694, "step": 2658 }, { "epoch": 0.05, "learning_rate": 4.994678070461918e-06, "loss": 0.8075, "step": 2659 }, { "epoch": 0.05, "learning_rate": 4.994668103181668e-06, "loss": 0.9161, "step": 2660 }, { "epoch": 0.05, "learning_rate": 4.994658126586403e-06, "loss": 1.0065, "step": 2661 }, { "epoch": 0.05, "learning_rate": 4.994648140676163e-06, "loss": 1.1195, "step": 2662 }, { "epoch": 0.05, "learning_rate": 4.994638145450982e-06, "loss": 0.9483, "step": 2663 }, { "epoch": 0.05, "learning_rate": 4.994628140910899e-06, "loss": 0.9597, "step": 2664 }, { "epoch": 0.05, "learning_rate": 4.9946181270559506e-06, "loss": 0.8582, "step": 2665 }, { "epoch": 0.05, "learning_rate": 4.994608103886174e-06, "loss": 1.0046, "step": 2666 }, { "epoch": 0.05, "learning_rate": 4.994598071401609e-06, "loss": 0.9625, "step": 2667 }, { "epoch": 0.05, "learning_rate": 4.99458802960229e-06, "loss": 1.0352, "step": 2668 }, { "epoch": 0.05, "learning_rate": 4.994577978488256e-06, "loss": 1.1684, "step": 2669 }, { "epoch": 0.05, "learning_rate": 4.994567918059544e-06, "loss": 0.9285, "step": 2670 }, { "epoch": 0.05, "learning_rate": 4.994557848316192e-06, "loss": 1.022, "step": 2671 }, { "epoch": 0.05, "learning_rate": 4.9945477692582385e-06, "loss": 0.9651, "step": 2672 }, { "epoch": 0.05, "learning_rate": 4.994537680885719e-06, "loss": 0.9258, "step": 2673 }, { "epoch": 0.05, "learning_rate": 4.994527583198672e-06, "loss": 1.1833, "step": 2674 }, { "epoch": 0.05, "learning_rate": 4.994517476197137e-06, "loss": 1.0613, "step": 2675 }, { "epoch": 0.05, "learning_rate": 4.99450735988115e-06, "loss": 1.0483, "step": 2676 }, { "epoch": 0.05, "learning_rate": 4.994497234250748e-06, "loss": 0.8525, "step": 2677 }, { "epoch": 0.05, "learning_rate": 4.9944870993059704e-06, "loss": 0.9965, "step": 2678 }, { "epoch": 0.05, "learning_rate": 4.994476955046854e-06, "loss": 0.8488, "step": 2679 }, { "epoch": 0.05, "learning_rate": 4.994466801473438e-06, "loss": 0.9603, "step": 2680 }, { "epoch": 0.05, "learning_rate": 4.994456638585759e-06, "loss": 1.1788, "step": 2681 }, { "epoch": 0.05, "learning_rate": 4.994446466383854e-06, "loss": 0.826, "step": 2682 }, { "epoch": 0.05, "learning_rate": 4.994436284867764e-06, "loss": 0.9893, "step": 2683 }, { "epoch": 0.05, "learning_rate": 4.994426094037525e-06, "loss": 0.901, "step": 2684 }, { "epoch": 0.05, "learning_rate": 4.994415893893175e-06, "loss": 0.8683, "step": 2685 }, { "epoch": 0.05, "learning_rate": 4.994405684434753e-06, "loss": 1.0256, "step": 2686 }, { "epoch": 0.05, "learning_rate": 4.9943954656622976e-06, "loss": 1.2193, "step": 2687 }, { "epoch": 0.05, "learning_rate": 4.994385237575845e-06, "loss": 1.0732, "step": 2688 }, { "epoch": 0.05, "learning_rate": 4.994375000175434e-06, "loss": 0.9147, "step": 2689 }, { "epoch": 0.05, "learning_rate": 4.994364753461104e-06, "loss": 0.9514, "step": 2690 }, { "epoch": 0.05, "learning_rate": 4.994354497432892e-06, "loss": 1.112, "step": 2691 }, { "epoch": 0.05, "learning_rate": 4.994344232090837e-06, "loss": 0.8881, "step": 2692 }, { "epoch": 0.05, "learning_rate": 4.994333957434977e-06, "loss": 1.1686, "step": 2693 }, { "epoch": 0.05, "learning_rate": 4.99432367346535e-06, "loss": 1.1999, "step": 2694 }, { "epoch": 0.05, "learning_rate": 4.994313380181996e-06, "loss": 1.0084, "step": 2695 }, { "epoch": 0.05, "learning_rate": 4.994303077584952e-06, "loss": 0.9053, "step": 2696 }, { "epoch": 0.05, "learning_rate": 4.9942927656742565e-06, "loss": 1.0984, "step": 2697 }, { "epoch": 0.05, "learning_rate": 4.994282444449948e-06, "loss": 1.1332, "step": 2698 }, { "epoch": 0.05, "learning_rate": 4.994272113912065e-06, "loss": 0.9934, "step": 2699 }, { "epoch": 0.05, "learning_rate": 4.994261774060648e-06, "loss": 1.2371, "step": 2700 }, { "epoch": 0.05, "learning_rate": 4.994251424895733e-06, "loss": 1.0723, "step": 2701 }, { "epoch": 0.05, "learning_rate": 4.9942410664173595e-06, "loss": 0.9532, "step": 2702 }, { "epoch": 0.05, "learning_rate": 4.994230698625567e-06, "loss": 0.9346, "step": 2703 }, { "epoch": 0.05, "learning_rate": 4.994220321520392e-06, "loss": 1.0663, "step": 2704 }, { "epoch": 0.05, "learning_rate": 4.994209935101877e-06, "loss": 0.9339, "step": 2705 }, { "epoch": 0.05, "learning_rate": 4.994199539370057e-06, "loss": 1.1631, "step": 2706 }, { "epoch": 0.05, "learning_rate": 4.994189134324973e-06, "loss": 1.1042, "step": 2707 }, { "epoch": 0.05, "learning_rate": 4.994178719966663e-06, "loss": 0.8663, "step": 2708 }, { "epoch": 0.05, "learning_rate": 4.994168296295166e-06, "loss": 0.8533, "step": 2709 }, { "epoch": 0.05, "learning_rate": 4.994157863310521e-06, "loss": 0.8435, "step": 2710 }, { "epoch": 0.05, "learning_rate": 4.994147421012768e-06, "loss": 0.9923, "step": 2711 }, { "epoch": 0.05, "learning_rate": 4.994136969401944e-06, "loss": 1.1809, "step": 2712 }, { "epoch": 0.05, "learning_rate": 4.99412650847809e-06, "loss": 0.9525, "step": 2713 }, { "epoch": 0.05, "learning_rate": 4.994116038241243e-06, "loss": 0.846, "step": 2714 }, { "epoch": 0.05, "learning_rate": 4.994105558691443e-06, "loss": 0.908, "step": 2715 }, { "epoch": 0.05, "learning_rate": 4.99409506982873e-06, "loss": 0.9375, "step": 2716 }, { "epoch": 0.05, "learning_rate": 4.994084571653143e-06, "loss": 1.0984, "step": 2717 }, { "epoch": 0.05, "learning_rate": 4.99407406416472e-06, "loss": 1.1478, "step": 2718 }, { "epoch": 0.05, "learning_rate": 4.994063547363501e-06, "loss": 1.1064, "step": 2719 }, { "epoch": 0.05, "learning_rate": 4.994053021249526e-06, "loss": 0.9073, "step": 2720 }, { "epoch": 0.05, "learning_rate": 4.994042485822832e-06, "loss": 0.887, "step": 2721 }, { "epoch": 0.05, "learning_rate": 4.99403194108346e-06, "loss": 0.9714, "step": 2722 }, { "epoch": 0.05, "learning_rate": 4.99402138703145e-06, "loss": 0.9615, "step": 2723 }, { "epoch": 0.05, "learning_rate": 4.99401082366684e-06, "loss": 1.0449, "step": 2724 }, { "epoch": 0.05, "learning_rate": 4.9940002509896706e-06, "loss": 1.2104, "step": 2725 }, { "epoch": 0.05, "learning_rate": 4.993989668999981e-06, "loss": 0.9659, "step": 2726 }, { "epoch": 0.05, "learning_rate": 4.993979077697809e-06, "loss": 0.7904, "step": 2727 }, { "epoch": 0.05, "learning_rate": 4.993968477083197e-06, "loss": 0.8714, "step": 2728 }, { "epoch": 0.05, "learning_rate": 4.993957867156182e-06, "loss": 1.0182, "step": 2729 }, { "epoch": 0.05, "learning_rate": 4.993947247916806e-06, "loss": 1.128, "step": 2730 }, { "epoch": 0.05, "learning_rate": 4.993936619365107e-06, "loss": 0.9667, "step": 2731 }, { "epoch": 0.05, "learning_rate": 4.993925981501126e-06, "loss": 1.0634, "step": 2732 }, { "epoch": 0.05, "learning_rate": 4.9939153343249e-06, "loss": 0.9558, "step": 2733 }, { "epoch": 0.05, "learning_rate": 4.993904677836472e-06, "loss": 0.8553, "step": 2734 }, { "epoch": 0.05, "learning_rate": 4.993894012035879e-06, "loss": 0.9969, "step": 2735 }, { "epoch": 0.05, "learning_rate": 4.993883336923164e-06, "loss": 0.858, "step": 2736 }, { "epoch": 0.05, "learning_rate": 4.993872652498364e-06, "loss": 0.9623, "step": 2737 }, { "epoch": 0.05, "learning_rate": 4.99386195876152e-06, "loss": 1.0987, "step": 2738 }, { "epoch": 0.05, "learning_rate": 4.993851255712672e-06, "loss": 1.0352, "step": 2739 }, { "epoch": 0.05, "learning_rate": 4.99384054335186e-06, "loss": 0.9397, "step": 2740 }, { "epoch": 0.05, "learning_rate": 4.993829821679124e-06, "loss": 0.9489, "step": 2741 }, { "epoch": 0.05, "learning_rate": 4.993819090694504e-06, "loss": 1.101, "step": 2742 }, { "epoch": 0.05, "learning_rate": 4.99380835039804e-06, "loss": 1.0765, "step": 2743 }, { "epoch": 0.05, "learning_rate": 4.993797600789771e-06, "loss": 1.0568, "step": 2744 }, { "epoch": 0.05, "learning_rate": 4.99378684186974e-06, "loss": 1.0123, "step": 2745 }, { "epoch": 0.05, "learning_rate": 4.993776073637984e-06, "loss": 0.9364, "step": 2746 }, { "epoch": 0.05, "learning_rate": 4.993765296094545e-06, "loss": 0.9392, "step": 2747 }, { "epoch": 0.05, "learning_rate": 4.9937545092394626e-06, "loss": 0.8505, "step": 2748 }, { "epoch": 0.05, "learning_rate": 4.993743713072778e-06, "loss": 0.9966, "step": 2749 }, { "epoch": 0.05, "learning_rate": 4.993732907594531e-06, "loss": 1.0881, "step": 2750 }, { "epoch": 0.05, "learning_rate": 4.99372209280476e-06, "loss": 0.9383, "step": 2751 }, { "epoch": 0.05, "learning_rate": 4.993711268703509e-06, "loss": 0.9072, "step": 2752 }, { "epoch": 0.05, "learning_rate": 4.993700435290816e-06, "loss": 0.8502, "step": 2753 }, { "epoch": 0.05, "learning_rate": 4.9936895925667215e-06, "loss": 0.7446, "step": 2754 }, { "epoch": 0.05, "learning_rate": 4.993678740531267e-06, "loss": 1.1566, "step": 2755 }, { "epoch": 0.05, "learning_rate": 4.9936678791844924e-06, "loss": 1.1096, "step": 2756 }, { "epoch": 0.05, "learning_rate": 4.9936570085264395e-06, "loss": 1.0303, "step": 2757 }, { "epoch": 0.05, "learning_rate": 4.993646128557147e-06, "loss": 1.0741, "step": 2758 }, { "epoch": 0.05, "learning_rate": 4.993635239276656e-06, "loss": 0.9648, "step": 2759 }, { "epoch": 0.05, "learning_rate": 4.993624340685007e-06, "loss": 1.0359, "step": 2760 }, { "epoch": 0.05, "learning_rate": 4.993613432782242e-06, "loss": 0.9688, "step": 2761 }, { "epoch": 0.05, "learning_rate": 4.993602515568401e-06, "loss": 1.2955, "step": 2762 }, { "epoch": 0.05, "learning_rate": 4.993591589043524e-06, "loss": 1.0609, "step": 2763 }, { "epoch": 0.05, "learning_rate": 4.9935806532076535e-06, "loss": 0.9961, "step": 2764 }, { "epoch": 0.05, "learning_rate": 4.993569708060828e-06, "loss": 0.8407, "step": 2765 }, { "epoch": 0.05, "learning_rate": 4.9935587536030905e-06, "loss": 0.8852, "step": 2766 }, { "epoch": 0.05, "learning_rate": 4.993547789834481e-06, "loss": 0.8705, "step": 2767 }, { "epoch": 0.05, "learning_rate": 4.99353681675504e-06, "loss": 1.1878, "step": 2768 }, { "epoch": 0.05, "learning_rate": 4.9935258343648095e-06, "loss": 0.9937, "step": 2769 }, { "epoch": 0.05, "learning_rate": 4.99351484266383e-06, "loss": 0.7997, "step": 2770 }, { "epoch": 0.05, "learning_rate": 4.993503841652142e-06, "loss": 0.891, "step": 2771 }, { "epoch": 0.05, "learning_rate": 4.993492831329788e-06, "loss": 0.961, "step": 2772 }, { "epoch": 0.05, "learning_rate": 4.993481811696807e-06, "loss": 0.906, "step": 2773 }, { "epoch": 0.05, "learning_rate": 4.9934707827532425e-06, "loss": 0.963, "step": 2774 }, { "epoch": 0.05, "learning_rate": 4.993459744499134e-06, "loss": 1.136, "step": 2775 }, { "epoch": 0.05, "learning_rate": 4.993448696934523e-06, "loss": 0.8707, "step": 2776 }, { "epoch": 0.05, "learning_rate": 4.993437640059452e-06, "loss": 0.9881, "step": 2777 }, { "epoch": 0.05, "learning_rate": 4.993426573873961e-06, "loss": 1.0052, "step": 2778 }, { "epoch": 0.05, "learning_rate": 4.9934154983780905e-06, "loss": 1.0029, "step": 2779 }, { "epoch": 0.05, "learning_rate": 4.993404413571884e-06, "loss": 1.0647, "step": 2780 }, { "epoch": 0.05, "learning_rate": 4.993393319455382e-06, "loss": 1.1412, "step": 2781 }, { "epoch": 0.05, "learning_rate": 4.993382216028625e-06, "loss": 1.2119, "step": 2782 }, { "epoch": 0.05, "learning_rate": 4.993371103291656e-06, "loss": 0.8403, "step": 2783 }, { "epoch": 0.05, "learning_rate": 4.9933599812445154e-06, "loss": 0.792, "step": 2784 }, { "epoch": 0.05, "learning_rate": 4.993348849887245e-06, "loss": 0.9162, "step": 2785 }, { "epoch": 0.05, "learning_rate": 4.993337709219887e-06, "loss": 0.9767, "step": 2786 }, { "epoch": 0.05, "learning_rate": 4.993326559242481e-06, "loss": 0.9968, "step": 2787 }, { "epoch": 0.05, "learning_rate": 4.993315399955072e-06, "loss": 1.0114, "step": 2788 }, { "epoch": 0.05, "learning_rate": 4.9933042313576985e-06, "loss": 0.7122, "step": 2789 }, { "epoch": 0.05, "learning_rate": 4.993293053450404e-06, "loss": 1.0216, "step": 2790 }, { "epoch": 0.05, "learning_rate": 4.993281866233229e-06, "loss": 0.9575, "step": 2791 }, { "epoch": 0.05, "learning_rate": 4.993270669706217e-06, "loss": 0.92, "step": 2792 }, { "epoch": 0.05, "learning_rate": 4.9932594638694075e-06, "loss": 1.1193, "step": 2793 }, { "epoch": 0.05, "learning_rate": 4.993248248722845e-06, "loss": 1.246, "step": 2794 }, { "epoch": 0.05, "learning_rate": 4.993237024266569e-06, "loss": 0.8428, "step": 2795 }, { "epoch": 0.05, "learning_rate": 4.993225790500622e-06, "loss": 0.9251, "step": 2796 }, { "epoch": 0.05, "learning_rate": 4.993214547425047e-06, "loss": 0.8477, "step": 2797 }, { "epoch": 0.05, "learning_rate": 4.993203295039886e-06, "loss": 0.9026, "step": 2798 }, { "epoch": 0.05, "learning_rate": 4.99319203334518e-06, "loss": 1.2482, "step": 2799 }, { "epoch": 0.05, "learning_rate": 4.993180762340971e-06, "loss": 1.1214, "step": 2800 }, { "epoch": 0.05, "learning_rate": 4.9931694820273015e-06, "loss": 1.0354, "step": 2801 }, { "epoch": 0.05, "learning_rate": 4.993158192404214e-06, "loss": 0.8364, "step": 2802 }, { "epoch": 0.05, "learning_rate": 4.993146893471749e-06, "loss": 0.9482, "step": 2803 }, { "epoch": 0.05, "learning_rate": 4.993135585229951e-06, "loss": 0.8655, "step": 2804 }, { "epoch": 0.05, "learning_rate": 4.993124267678862e-06, "loss": 1.0292, "step": 2805 }, { "epoch": 0.05, "learning_rate": 4.993112940818522e-06, "loss": 1.2242, "step": 2806 }, { "epoch": 0.05, "learning_rate": 4.993101604648975e-06, "loss": 0.9326, "step": 2807 }, { "epoch": 0.05, "learning_rate": 4.993090259170263e-06, "loss": 0.8167, "step": 2808 }, { "epoch": 0.05, "learning_rate": 4.993078904382429e-06, "loss": 0.8077, "step": 2809 }, { "epoch": 0.05, "learning_rate": 4.993067540285514e-06, "loss": 0.8836, "step": 2810 }, { "epoch": 0.05, "learning_rate": 4.993056166879562e-06, "loss": 0.9594, "step": 2811 }, { "epoch": 0.05, "learning_rate": 4.993044784164614e-06, "loss": 1.1695, "step": 2812 }, { "epoch": 0.05, "learning_rate": 4.993033392140714e-06, "loss": 0.9249, "step": 2813 }, { "epoch": 0.05, "learning_rate": 4.993021990807903e-06, "loss": 0.8645, "step": 2814 }, { "epoch": 0.05, "learning_rate": 4.9930105801662244e-06, "loss": 0.9649, "step": 2815 }, { "epoch": 0.05, "learning_rate": 4.992999160215721e-06, "loss": 0.9796, "step": 2816 }, { "epoch": 0.05, "learning_rate": 4.992987730956435e-06, "loss": 1.0475, "step": 2817 }, { "epoch": 0.05, "learning_rate": 4.99297629238841e-06, "loss": 1.141, "step": 2818 }, { "epoch": 0.05, "learning_rate": 4.992964844511688e-06, "loss": 1.1432, "step": 2819 }, { "epoch": 0.05, "learning_rate": 4.99295338732631e-06, "loss": 1.0332, "step": 2820 }, { "epoch": 0.05, "learning_rate": 4.992941920832321e-06, "loss": 0.8682, "step": 2821 }, { "epoch": 0.05, "learning_rate": 4.992930445029764e-06, "loss": 0.9958, "step": 2822 }, { "epoch": 0.05, "learning_rate": 4.992918959918682e-06, "loss": 0.9262, "step": 2823 }, { "epoch": 0.05, "learning_rate": 4.992907465499116e-06, "loss": 1.1375, "step": 2824 }, { "epoch": 0.05, "learning_rate": 4.99289596177111e-06, "loss": 1.0169, "step": 2825 }, { "epoch": 0.05, "learning_rate": 4.992884448734707e-06, "loss": 1.0983, "step": 2826 }, { "epoch": 0.05, "learning_rate": 4.99287292638995e-06, "loss": 1.0059, "step": 2827 }, { "epoch": 0.05, "learning_rate": 4.992861394736882e-06, "loss": 0.949, "step": 2828 }, { "epoch": 0.05, "learning_rate": 4.992849853775545e-06, "loss": 0.974, "step": 2829 }, { "epoch": 0.05, "learning_rate": 4.992838303505983e-06, "loss": 0.9093, "step": 2830 }, { "epoch": 0.05, "learning_rate": 4.9928267439282405e-06, "loss": 1.1237, "step": 2831 }, { "epoch": 0.05, "learning_rate": 4.99281517504236e-06, "loss": 1.0201, "step": 2832 }, { "epoch": 0.05, "learning_rate": 4.992803596848382e-06, "loss": 0.9254, "step": 2833 }, { "epoch": 0.05, "learning_rate": 4.9927920093463535e-06, "loss": 0.8816, "step": 2834 }, { "epoch": 0.05, "learning_rate": 4.9927804125363145e-06, "loss": 1.0389, "step": 2835 }, { "epoch": 0.05, "learning_rate": 4.992768806418311e-06, "loss": 1.2348, "step": 2836 }, { "epoch": 0.05, "learning_rate": 4.992757190992385e-06, "loss": 1.0944, "step": 2837 }, { "epoch": 0.05, "learning_rate": 4.99274556625858e-06, "loss": 0.9605, "step": 2838 }, { "epoch": 0.05, "learning_rate": 4.99273393221694e-06, "loss": 0.9128, "step": 2839 }, { "epoch": 0.05, "learning_rate": 4.992722288867507e-06, "loss": 0.9981, "step": 2840 }, { "epoch": 0.05, "learning_rate": 4.9927106362103264e-06, "loss": 0.9189, "step": 2841 }, { "epoch": 0.05, "learning_rate": 4.992698974245439e-06, "loss": 0.934, "step": 2842 }, { "epoch": 0.05, "learning_rate": 4.992687302972891e-06, "loss": 0.9237, "step": 2843 }, { "epoch": 0.05, "learning_rate": 4.9926756223927255e-06, "loss": 1.0502, "step": 2844 }, { "epoch": 0.05, "learning_rate": 4.9926639325049855e-06, "loss": 1.074, "step": 2845 }, { "epoch": 0.05, "learning_rate": 4.9926522333097145e-06, "loss": 0.8852, "step": 2846 }, { "epoch": 0.05, "learning_rate": 4.992640524806957e-06, "loss": 1.0273, "step": 2847 }, { "epoch": 0.05, "learning_rate": 4.992628806996756e-06, "loss": 1.0228, "step": 2848 }, { "epoch": 0.05, "learning_rate": 4.992617079879155e-06, "loss": 0.97, "step": 2849 }, { "epoch": 0.05, "learning_rate": 4.992605343454198e-06, "loss": 1.0921, "step": 2850 }, { "epoch": 0.05, "learning_rate": 4.992593597721931e-06, "loss": 0.8122, "step": 2851 }, { "epoch": 0.05, "learning_rate": 4.992581842682394e-06, "loss": 0.9315, "step": 2852 }, { "epoch": 0.05, "learning_rate": 4.992570078335634e-06, "loss": 0.9442, "step": 2853 }, { "epoch": 0.05, "learning_rate": 4.992558304681693e-06, "loss": 0.7969, "step": 2854 }, { "epoch": 0.05, "learning_rate": 4.9925465217206155e-06, "loss": 1.0598, "step": 2855 }, { "epoch": 0.05, "learning_rate": 4.992534729452446e-06, "loss": 1.2484, "step": 2856 }, { "epoch": 0.05, "learning_rate": 4.992522927877228e-06, "loss": 0.9503, "step": 2857 }, { "epoch": 0.05, "learning_rate": 4.992511116995006e-06, "loss": 1.2063, "step": 2858 }, { "epoch": 0.05, "learning_rate": 4.992499296805825e-06, "loss": 0.8314, "step": 2859 }, { "epoch": 0.05, "learning_rate": 4.9924874673097265e-06, "loss": 0.9597, "step": 2860 }, { "epoch": 0.05, "learning_rate": 4.992475628506756e-06, "loss": 1.0268, "step": 2861 }, { "epoch": 0.05, "learning_rate": 4.99246378039696e-06, "loss": 1.2639, "step": 2862 }, { "epoch": 0.05, "learning_rate": 4.99245192298038e-06, "loss": 0.9844, "step": 2863 }, { "epoch": 0.05, "learning_rate": 4.9924400562570596e-06, "loss": 1.0077, "step": 2864 }, { "epoch": 0.05, "learning_rate": 4.992428180227045e-06, "loss": 0.8131, "step": 2865 }, { "epoch": 0.05, "learning_rate": 4.99241629489038e-06, "loss": 0.9748, "step": 2866 }, { "epoch": 0.05, "learning_rate": 4.99240440024711e-06, "loss": 1.1544, "step": 2867 }, { "epoch": 0.05, "learning_rate": 4.992392496297277e-06, "loss": 0.9965, "step": 2868 }, { "epoch": 0.05, "learning_rate": 4.992380583040927e-06, "loss": 1.1735, "step": 2869 }, { "epoch": 0.05, "learning_rate": 4.992368660478105e-06, "loss": 0.7441, "step": 2870 }, { "epoch": 0.05, "learning_rate": 4.9923567286088545e-06, "loss": 1.0699, "step": 2871 }, { "epoch": 0.05, "learning_rate": 4.9923447874332205e-06, "loss": 0.9912, "step": 2872 }, { "epoch": 0.05, "learning_rate": 4.9923328369512465e-06, "loss": 0.8136, "step": 2873 }, { "epoch": 0.05, "learning_rate": 4.992320877162979e-06, "loss": 1.0886, "step": 2874 }, { "epoch": 0.05, "learning_rate": 4.9923089080684625e-06, "loss": 0.8939, "step": 2875 }, { "epoch": 0.05, "learning_rate": 4.9922969296677404e-06, "loss": 0.9216, "step": 2876 }, { "epoch": 0.05, "learning_rate": 4.992284941960858e-06, "loss": 1.0708, "step": 2877 }, { "epoch": 0.05, "learning_rate": 4.992272944947859e-06, "loss": 0.9984, "step": 2878 }, { "epoch": 0.05, "learning_rate": 4.992260938628791e-06, "loss": 0.9136, "step": 2879 }, { "epoch": 0.05, "learning_rate": 4.9922489230036955e-06, "loss": 1.1014, "step": 2880 }, { "epoch": 0.05, "learning_rate": 4.9922368980726196e-06, "loss": 1.0153, "step": 2881 }, { "epoch": 0.05, "learning_rate": 4.992224863835608e-06, "loss": 1.0148, "step": 2882 }, { "epoch": 0.05, "learning_rate": 4.992212820292705e-06, "loss": 0.8997, "step": 2883 }, { "epoch": 0.05, "learning_rate": 4.9922007674439555e-06, "loss": 0.9852, "step": 2884 }, { "epoch": 0.05, "learning_rate": 4.992188705289404e-06, "loss": 1.0574, "step": 2885 }, { "epoch": 0.05, "learning_rate": 4.9921766338290975e-06, "loss": 0.8135, "step": 2886 }, { "epoch": 0.05, "learning_rate": 4.992164553063079e-06, "loss": 1.319, "step": 2887 }, { "epoch": 0.05, "learning_rate": 4.9921524629913944e-06, "loss": 1.1005, "step": 2888 }, { "epoch": 0.05, "learning_rate": 4.99214036361409e-06, "loss": 0.89, "step": 2889 }, { "epoch": 0.05, "learning_rate": 4.992128254931209e-06, "loss": 0.9182, "step": 2890 }, { "epoch": 0.05, "learning_rate": 4.992116136942798e-06, "loss": 0.9705, "step": 2891 }, { "epoch": 0.05, "learning_rate": 4.992104009648901e-06, "loss": 1.0251, "step": 2892 }, { "epoch": 0.05, "learning_rate": 4.992091873049565e-06, "loss": 1.3105, "step": 2893 }, { "epoch": 0.05, "learning_rate": 4.992079727144833e-06, "loss": 1.1409, "step": 2894 }, { "epoch": 0.05, "learning_rate": 4.992067571934754e-06, "loss": 0.8538, "step": 2895 }, { "epoch": 0.05, "learning_rate": 4.992055407419369e-06, "loss": 1.0238, "step": 2896 }, { "epoch": 0.05, "learning_rate": 4.9920432335987255e-06, "loss": 0.9714, "step": 2897 }, { "epoch": 0.05, "learning_rate": 4.99203105047287e-06, "loss": 1.046, "step": 2898 }, { "epoch": 0.05, "learning_rate": 4.992018858041847e-06, "loss": 1.1396, "step": 2899 }, { "epoch": 0.05, "learning_rate": 4.992006656305701e-06, "loss": 1.0267, "step": 2900 }, { "epoch": 0.05, "learning_rate": 4.99199444526448e-06, "loss": 1.0261, "step": 2901 }, { "epoch": 0.05, "learning_rate": 4.9919822249182275e-06, "loss": 0.7495, "step": 2902 }, { "epoch": 0.05, "learning_rate": 4.9919699952669885e-06, "loss": 1.0355, "step": 2903 }, { "epoch": 0.05, "learning_rate": 4.991957756310811e-06, "loss": 0.9631, "step": 2904 }, { "epoch": 0.05, "learning_rate": 4.99194550804974e-06, "loss": 0.9181, "step": 2905 }, { "epoch": 0.05, "learning_rate": 4.991933250483821e-06, "loss": 1.0889, "step": 2906 }, { "epoch": 0.05, "learning_rate": 4.9919209836130985e-06, "loss": 1.1941, "step": 2907 }, { "epoch": 0.05, "learning_rate": 4.99190870743762e-06, "loss": 1.0316, "step": 2908 }, { "epoch": 0.05, "learning_rate": 4.991896421957432e-06, "loss": 1.0029, "step": 2909 }, { "epoch": 0.05, "learning_rate": 4.991884127172578e-06, "loss": 0.9789, "step": 2910 }, { "epoch": 0.05, "learning_rate": 4.9918718230831045e-06, "loss": 1.0032, "step": 2911 }, { "epoch": 0.05, "learning_rate": 4.991859509689059e-06, "loss": 1.0579, "step": 2912 }, { "epoch": 0.05, "learning_rate": 4.991847186990486e-06, "loss": 0.9685, "step": 2913 }, { "epoch": 0.05, "learning_rate": 4.991834854987433e-06, "loss": 1.0416, "step": 2914 }, { "epoch": 0.05, "learning_rate": 4.991822513679944e-06, "loss": 0.9617, "step": 2915 }, { "epoch": 0.06, "learning_rate": 4.991810163068066e-06, "loss": 1.0167, "step": 2916 }, { "epoch": 0.06, "learning_rate": 4.991797803151846e-06, "loss": 0.882, "step": 2917 }, { "epoch": 0.06, "learning_rate": 4.991785433931329e-06, "loss": 1.2213, "step": 2918 }, { "epoch": 0.06, "learning_rate": 4.991773055406561e-06, "loss": 1.1745, "step": 2919 }, { "epoch": 0.06, "learning_rate": 4.99176066757759e-06, "loss": 0.9599, "step": 2920 }, { "epoch": 0.06, "learning_rate": 4.99174827044446e-06, "loss": 0.9501, "step": 2921 }, { "epoch": 0.06, "learning_rate": 4.991735864007219e-06, "loss": 1.0077, "step": 2922 }, { "epoch": 0.06, "learning_rate": 4.991723448265913e-06, "loss": 0.9245, "step": 2923 }, { "epoch": 0.06, "learning_rate": 4.9917110232205876e-06, "loss": 0.881, "step": 2924 }, { "epoch": 0.06, "learning_rate": 4.991698588871289e-06, "loss": 1.1052, "step": 2925 }, { "epoch": 0.06, "learning_rate": 4.991686145218065e-06, "loss": 1.0809, "step": 2926 }, { "epoch": 0.06, "learning_rate": 4.991673692260961e-06, "loss": 0.8175, "step": 2927 }, { "epoch": 0.06, "learning_rate": 4.991661230000025e-06, "loss": 0.9996, "step": 2928 }, { "epoch": 0.06, "learning_rate": 4.991648758435301e-06, "loss": 0.8223, "step": 2929 }, { "epoch": 0.06, "learning_rate": 4.991636277566837e-06, "loss": 0.9269, "step": 2930 }, { "epoch": 0.06, "learning_rate": 4.991623787394681e-06, "loss": 1.1992, "step": 2931 }, { "epoch": 0.06, "learning_rate": 4.991611287918876e-06, "loss": 0.9279, "step": 2932 }, { "epoch": 0.06, "learning_rate": 4.991598779139472e-06, "loss": 0.9963, "step": 2933 }, { "epoch": 0.06, "learning_rate": 4.991586261056515e-06, "loss": 0.9094, "step": 2934 }, { "epoch": 0.06, "learning_rate": 4.991573733670051e-06, "loss": 1.0731, "step": 2935 }, { "epoch": 0.06, "learning_rate": 4.991561196980126e-06, "loss": 1.1173, "step": 2936 }, { "epoch": 0.06, "learning_rate": 4.991548650986789e-06, "loss": 0.997, "step": 2937 }, { "epoch": 0.06, "learning_rate": 4.991536095690085e-06, "loss": 1.0703, "step": 2938 }, { "epoch": 0.06, "learning_rate": 4.991523531090062e-06, "loss": 0.795, "step": 2939 }, { "epoch": 0.06, "learning_rate": 4.991510957186767e-06, "loss": 0.8875, "step": 2940 }, { "epoch": 0.06, "learning_rate": 4.991498373980246e-06, "loss": 0.9639, "step": 2941 }, { "epoch": 0.06, "learning_rate": 4.991485781470547e-06, "loss": 1.0435, "step": 2942 }, { "epoch": 0.06, "learning_rate": 4.991473179657716e-06, "loss": 1.1834, "step": 2943 }, { "epoch": 0.06, "learning_rate": 4.9914605685418e-06, "loss": 0.9697, "step": 2944 }, { "epoch": 0.06, "learning_rate": 4.991447948122847e-06, "loss": 0.9719, "step": 2945 }, { "epoch": 0.06, "learning_rate": 4.991435318400904e-06, "loss": 0.914, "step": 2946 }, { "epoch": 0.06, "learning_rate": 4.991422679376018e-06, "loss": 0.9472, "step": 2947 }, { "epoch": 0.06, "learning_rate": 4.991410031048236e-06, "loss": 0.9364, "step": 2948 }, { "epoch": 0.06, "learning_rate": 4.991397373417605e-06, "loss": 1.0586, "step": 2949 }, { "epoch": 0.06, "learning_rate": 4.991384706484173e-06, "loss": 1.0916, "step": 2950 }, { "epoch": 0.06, "learning_rate": 4.991372030247986e-06, "loss": 1.1481, "step": 2951 }, { "epoch": 0.06, "learning_rate": 4.991359344709094e-06, "loss": 0.9803, "step": 2952 }, { "epoch": 0.06, "learning_rate": 4.991346649867541e-06, "loss": 1.0609, "step": 2953 }, { "epoch": 0.06, "learning_rate": 4.991333945723377e-06, "loss": 0.8951, "step": 2954 }, { "epoch": 0.06, "learning_rate": 4.991321232276648e-06, "loss": 0.987, "step": 2955 }, { "epoch": 0.06, "learning_rate": 4.991308509527402e-06, "loss": 1.0411, "step": 2956 }, { "epoch": 0.06, "learning_rate": 4.991295777475686e-06, "loss": 0.7998, "step": 2957 }, { "epoch": 0.06, "learning_rate": 4.991283036121548e-06, "loss": 0.8128, "step": 2958 }, { "epoch": 0.06, "learning_rate": 4.991270285465036e-06, "loss": 0.8497, "step": 2959 }, { "epoch": 0.06, "learning_rate": 4.991257525506197e-06, "loss": 1.0289, "step": 2960 }, { "epoch": 0.06, "learning_rate": 4.991244756245079e-06, "loss": 0.8086, "step": 2961 }, { "epoch": 0.06, "learning_rate": 4.9912319776817286e-06, "loss": 1.296, "step": 2962 }, { "epoch": 0.06, "learning_rate": 4.991219189816196e-06, "loss": 1.0208, "step": 2963 }, { "epoch": 0.06, "learning_rate": 4.991206392648526e-06, "loss": 0.8918, "step": 2964 }, { "epoch": 0.06, "learning_rate": 4.991193586178767e-06, "loss": 0.9347, "step": 2965 }, { "epoch": 0.06, "learning_rate": 4.991180770406969e-06, "loss": 0.9348, "step": 2966 }, { "epoch": 0.06, "learning_rate": 4.991167945333178e-06, "loss": 0.9582, "step": 2967 }, { "epoch": 0.06, "learning_rate": 4.991155110957442e-06, "loss": 1.0994, "step": 2968 }, { "epoch": 0.06, "learning_rate": 4.991142267279809e-06, "loss": 1.0027, "step": 2969 }, { "epoch": 0.06, "learning_rate": 4.991129414300327e-06, "loss": 0.8467, "step": 2970 }, { "epoch": 0.06, "learning_rate": 4.991116552019045e-06, "loss": 0.9877, "step": 2971 }, { "epoch": 0.06, "learning_rate": 4.99110368043601e-06, "loss": 0.9912, "step": 2972 }, { "epoch": 0.06, "learning_rate": 4.99109079955127e-06, "loss": 1.0361, "step": 2973 }, { "epoch": 0.06, "learning_rate": 4.9910779093648744e-06, "loss": 1.0164, "step": 2974 }, { "epoch": 0.06, "learning_rate": 4.991065009876869e-06, "loss": 1.1809, "step": 2975 }, { "epoch": 0.06, "learning_rate": 4.991052101087304e-06, "loss": 1.0189, "step": 2976 }, { "epoch": 0.06, "learning_rate": 4.991039182996225e-06, "loss": 0.9995, "step": 2977 }, { "epoch": 0.06, "learning_rate": 4.991026255603684e-06, "loss": 1.0989, "step": 2978 }, { "epoch": 0.06, "learning_rate": 4.9910133189097265e-06, "loss": 0.7271, "step": 2979 }, { "epoch": 0.06, "learning_rate": 4.991000372914402e-06, "loss": 0.95, "step": 2980 }, { "epoch": 0.06, "learning_rate": 4.990987417617759e-06, "loss": 1.018, "step": 2981 }, { "epoch": 0.06, "learning_rate": 4.990974453019845e-06, "loss": 1.0146, "step": 2982 }, { "epoch": 0.06, "learning_rate": 4.990961479120708e-06, "loss": 0.9246, "step": 2983 }, { "epoch": 0.06, "learning_rate": 4.990948495920397e-06, "loss": 1.0107, "step": 2984 }, { "epoch": 0.06, "learning_rate": 4.9909355034189625e-06, "loss": 0.8235, "step": 2985 }, { "epoch": 0.06, "learning_rate": 4.9909225016164495e-06, "loss": 0.9512, "step": 2986 }, { "epoch": 0.06, "learning_rate": 4.990909490512908e-06, "loss": 1.1443, "step": 2987 }, { "epoch": 0.06, "learning_rate": 4.990896470108388e-06, "loss": 1.1619, "step": 2988 }, { "epoch": 0.06, "learning_rate": 4.990883440402937e-06, "loss": 1.0112, "step": 2989 }, { "epoch": 0.06, "learning_rate": 4.990870401396603e-06, "loss": 0.9397, "step": 2990 }, { "epoch": 0.06, "learning_rate": 4.990857353089436e-06, "loss": 0.9126, "step": 2991 }, { "epoch": 0.06, "learning_rate": 4.990844295481484e-06, "loss": 0.8039, "step": 2992 }, { "epoch": 0.06, "learning_rate": 4.990831228572795e-06, "loss": 0.9835, "step": 2993 }, { "epoch": 0.06, "learning_rate": 4.990818152363419e-06, "loss": 1.1816, "step": 2994 }, { "epoch": 0.06, "learning_rate": 4.9908050668534044e-06, "loss": 1.0558, "step": 2995 }, { "epoch": 0.06, "learning_rate": 4.9907919720428e-06, "loss": 1.0055, "step": 2996 }, { "epoch": 0.06, "learning_rate": 4.990778867931654e-06, "loss": 1.0423, "step": 2997 }, { "epoch": 0.06, "learning_rate": 4.990765754520017e-06, "loss": 0.975, "step": 2998 }, { "epoch": 0.06, "learning_rate": 4.990752631807937e-06, "loss": 1.1774, "step": 2999 }, { "epoch": 0.06, "learning_rate": 4.990739499795463e-06, "loss": 1.3658, "step": 3000 }, { "epoch": 0.06, "learning_rate": 4.990726358482644e-06, "loss": 0.8747, "step": 3001 }, { "epoch": 0.06, "learning_rate": 4.990713207869529e-06, "loss": 0.9927, "step": 3002 }, { "epoch": 0.06, "learning_rate": 4.990700047956167e-06, "loss": 1.106, "step": 3003 }, { "epoch": 0.06, "learning_rate": 4.990686878742608e-06, "loss": 0.8291, "step": 3004 }, { "epoch": 0.06, "learning_rate": 4.9906737002289e-06, "loss": 0.9567, "step": 3005 }, { "epoch": 0.06, "learning_rate": 4.990660512415093e-06, "loss": 0.9908, "step": 3006 }, { "epoch": 0.06, "learning_rate": 4.990647315301236e-06, "loss": 1.0634, "step": 3007 }, { "epoch": 0.06, "learning_rate": 4.990634108887379e-06, "loss": 0.9618, "step": 3008 }, { "epoch": 0.06, "learning_rate": 4.9906208931735685e-06, "loss": 0.7997, "step": 3009 }, { "epoch": 0.06, "learning_rate": 4.990607668159858e-06, "loss": 0.9898, "step": 3010 }, { "epoch": 0.06, "learning_rate": 4.990594433846294e-06, "loss": 0.9872, "step": 3011 }, { "epoch": 0.06, "learning_rate": 4.990581190232927e-06, "loss": 1.1832, "step": 3012 }, { "epoch": 0.06, "learning_rate": 4.990567937319807e-06, "loss": 0.9783, "step": 3013 }, { "epoch": 0.06, "learning_rate": 4.990554675106981e-06, "loss": 0.7966, "step": 3014 }, { "epoch": 0.06, "learning_rate": 4.990541403594501e-06, "loss": 0.925, "step": 3015 }, { "epoch": 0.06, "learning_rate": 4.990528122782416e-06, "loss": 0.844, "step": 3016 }, { "epoch": 0.06, "learning_rate": 4.990514832670775e-06, "loss": 0.861, "step": 3017 }, { "epoch": 0.06, "learning_rate": 4.990501533259629e-06, "loss": 0.9582, "step": 3018 }, { "epoch": 0.06, "learning_rate": 4.990488224549025e-06, "loss": 1.0263, "step": 3019 }, { "epoch": 0.06, "learning_rate": 4.9904749065390155e-06, "loss": 0.9466, "step": 3020 }, { "epoch": 0.06, "learning_rate": 4.990461579229649e-06, "loss": 0.9637, "step": 3021 }, { "epoch": 0.06, "learning_rate": 4.990448242620974e-06, "loss": 0.9375, "step": 3022 }, { "epoch": 0.06, "learning_rate": 4.990434896713043e-06, "loss": 0.9559, "step": 3023 }, { "epoch": 0.06, "learning_rate": 4.990421541505905e-06, "loss": 1.1808, "step": 3024 }, { "epoch": 0.06, "learning_rate": 4.990408176999607e-06, "loss": 1.3267, "step": 3025 }, { "epoch": 0.06, "learning_rate": 4.990394803194203e-06, "loss": 0.9981, "step": 3026 }, { "epoch": 0.06, "learning_rate": 4.99038142008974e-06, "loss": 0.905, "step": 3027 }, { "epoch": 0.06, "learning_rate": 4.990368027686271e-06, "loss": 1.0922, "step": 3028 }, { "epoch": 0.06, "learning_rate": 4.990354625983843e-06, "loss": 0.9432, "step": 3029 }, { "epoch": 0.06, "learning_rate": 4.990341214982507e-06, "loss": 0.9378, "step": 3030 }, { "epoch": 0.06, "learning_rate": 4.990327794682314e-06, "loss": 1.1582, "step": 3031 }, { "epoch": 0.06, "learning_rate": 4.990314365083312e-06, "loss": 0.9763, "step": 3032 }, { "epoch": 0.06, "learning_rate": 4.990300926185554e-06, "loss": 1.0413, "step": 3033 }, { "epoch": 0.06, "learning_rate": 4.990287477989088e-06, "loss": 1.0574, "step": 3034 }, { "epoch": 0.06, "learning_rate": 4.990274020493965e-06, "loss": 0.8566, "step": 3035 }, { "epoch": 0.06, "learning_rate": 4.990260553700234e-06, "loss": 0.8005, "step": 3036 }, { "epoch": 0.06, "learning_rate": 4.990247077607948e-06, "loss": 1.0707, "step": 3037 }, { "epoch": 0.06, "learning_rate": 4.9902335922171555e-06, "loss": 1.0575, "step": 3038 }, { "epoch": 0.06, "learning_rate": 4.990220097527907e-06, "loss": 0.8068, "step": 3039 }, { "epoch": 0.06, "learning_rate": 4.9902065935402535e-06, "loss": 0.8204, "step": 3040 }, { "epoch": 0.06, "learning_rate": 4.990193080254244e-06, "loss": 0.9744, "step": 3041 }, { "epoch": 0.06, "learning_rate": 4.990179557669931e-06, "loss": 1.1531, "step": 3042 }, { "epoch": 0.06, "learning_rate": 4.990166025787362e-06, "loss": 1.1928, "step": 3043 }, { "epoch": 0.06, "learning_rate": 4.990152484606591e-06, "loss": 0.9937, "step": 3044 }, { "epoch": 0.06, "learning_rate": 4.990138934127666e-06, "loss": 1.0208, "step": 3045 }, { "epoch": 0.06, "learning_rate": 4.990125374350639e-06, "loss": 0.8124, "step": 3046 }, { "epoch": 0.06, "learning_rate": 4.990111805275561e-06, "loss": 0.945, "step": 3047 }, { "epoch": 0.06, "learning_rate": 4.9900982269024814e-06, "loss": 1.0076, "step": 3048 }, { "epoch": 0.06, "learning_rate": 4.990084639231451e-06, "loss": 1.2097, "step": 3049 }, { "epoch": 0.06, "learning_rate": 4.9900710422625206e-06, "loss": 1.2946, "step": 3050 }, { "epoch": 0.06, "learning_rate": 4.990057435995742e-06, "loss": 0.7395, "step": 3051 }, { "epoch": 0.06, "learning_rate": 4.990043820431165e-06, "loss": 0.9291, "step": 3052 }, { "epoch": 0.06, "learning_rate": 4.990030195568841e-06, "loss": 0.9236, "step": 3053 }, { "epoch": 0.06, "learning_rate": 4.99001656140882e-06, "loss": 1.0226, "step": 3054 }, { "epoch": 0.06, "learning_rate": 4.9900029179511544e-06, "loss": 0.9263, "step": 3055 }, { "epoch": 0.06, "learning_rate": 4.989989265195893e-06, "loss": 1.3044, "step": 3056 }, { "epoch": 0.06, "learning_rate": 4.989975603143089e-06, "loss": 1.1543, "step": 3057 }, { "epoch": 0.06, "learning_rate": 4.989961931792792e-06, "loss": 0.905, "step": 3058 }, { "epoch": 0.06, "learning_rate": 4.989948251145054e-06, "loss": 1.0479, "step": 3059 }, { "epoch": 0.06, "learning_rate": 4.989934561199925e-06, "loss": 0.9968, "step": 3060 }, { "epoch": 0.06, "learning_rate": 4.989920861957457e-06, "loss": 0.9054, "step": 3061 }, { "epoch": 0.06, "learning_rate": 4.989907153417701e-06, "loss": 0.9664, "step": 3062 }, { "epoch": 0.06, "learning_rate": 4.9898934355807074e-06, "loss": 1.1486, "step": 3063 }, { "epoch": 0.06, "learning_rate": 4.989879708446529e-06, "loss": 0.8341, "step": 3064 }, { "epoch": 0.06, "learning_rate": 4.989865972015215e-06, "loss": 1.0579, "step": 3065 }, { "epoch": 0.06, "learning_rate": 4.9898522262868185e-06, "loss": 0.9538, "step": 3066 }, { "epoch": 0.06, "learning_rate": 4.98983847126139e-06, "loss": 0.877, "step": 3067 }, { "epoch": 0.06, "learning_rate": 4.989824706938981e-06, "loss": 0.8275, "step": 3068 }, { "epoch": 0.06, "learning_rate": 4.989810933319643e-06, "loss": 0.9432, "step": 3069 }, { "epoch": 0.06, "learning_rate": 4.989797150403427e-06, "loss": 1.0398, "step": 3070 }, { "epoch": 0.06, "learning_rate": 4.989783358190385e-06, "loss": 0.927, "step": 3071 }, { "epoch": 0.06, "learning_rate": 4.989769556680568e-06, "loss": 1.0139, "step": 3072 }, { "epoch": 0.06, "learning_rate": 4.989755745874029e-06, "loss": 0.9642, "step": 3073 }, { "epoch": 0.06, "learning_rate": 4.989741925770817e-06, "loss": 0.8838, "step": 3074 }, { "epoch": 0.06, "learning_rate": 4.9897280963709845e-06, "loss": 1.0351, "step": 3075 }, { "epoch": 0.06, "learning_rate": 4.989714257674585e-06, "loss": 0.8913, "step": 3076 }, { "epoch": 0.06, "learning_rate": 4.989700409681668e-06, "loss": 0.9339, "step": 3077 }, { "epoch": 0.06, "learning_rate": 4.9896865523922866e-06, "loss": 0.8716, "step": 3078 }, { "epoch": 0.06, "learning_rate": 4.989672685806492e-06, "loss": 0.9738, "step": 3079 }, { "epoch": 0.06, "learning_rate": 4.9896588099243355e-06, "loss": 1.0805, "step": 3080 }, { "epoch": 0.06, "learning_rate": 4.98964492474587e-06, "loss": 1.2432, "step": 3081 }, { "epoch": 0.06, "learning_rate": 4.989631030271146e-06, "loss": 1.0682, "step": 3082 }, { "epoch": 0.06, "learning_rate": 4.9896171265002154e-06, "loss": 1.0269, "step": 3083 }, { "epoch": 0.06, "learning_rate": 4.989603213433132e-06, "loss": 1.0381, "step": 3084 }, { "epoch": 0.06, "learning_rate": 4.989589291069946e-06, "loss": 0.8075, "step": 3085 }, { "epoch": 0.06, "learning_rate": 4.98957535941071e-06, "loss": 0.906, "step": 3086 }, { "epoch": 0.06, "learning_rate": 4.989561418455477e-06, "loss": 0.9886, "step": 3087 }, { "epoch": 0.06, "learning_rate": 4.989547468204297e-06, "loss": 1.1287, "step": 3088 }, { "epoch": 0.06, "learning_rate": 4.9895335086572224e-06, "loss": 0.8645, "step": 3089 }, { "epoch": 0.06, "learning_rate": 4.989519539814306e-06, "loss": 1.0349, "step": 3090 }, { "epoch": 0.06, "learning_rate": 4.989505561675601e-06, "loss": 0.7534, "step": 3091 }, { "epoch": 0.06, "learning_rate": 4.989491574241158e-06, "loss": 1.0955, "step": 3092 }, { "epoch": 0.06, "learning_rate": 4.989477577511031e-06, "loss": 1.1472, "step": 3093 }, { "epoch": 0.06, "learning_rate": 4.989463571485269e-06, "loss": 1.199, "step": 3094 }, { "epoch": 0.06, "learning_rate": 4.989449556163928e-06, "loss": 0.9755, "step": 3095 }, { "epoch": 0.06, "learning_rate": 4.989435531547057e-06, "loss": 0.9068, "step": 3096 }, { "epoch": 0.06, "learning_rate": 4.989421497634712e-06, "loss": 0.8045, "step": 3097 }, { "epoch": 0.06, "learning_rate": 4.989407454426943e-06, "loss": 0.9982, "step": 3098 }, { "epoch": 0.06, "learning_rate": 4.989393401923802e-06, "loss": 1.1908, "step": 3099 }, { "epoch": 0.06, "learning_rate": 4.989379340125343e-06, "loss": 1.1175, "step": 3100 }, { "epoch": 0.06, "learning_rate": 4.989365269031617e-06, "loss": 1.0824, "step": 3101 }, { "epoch": 0.06, "learning_rate": 4.989351188642679e-06, "loss": 0.6606, "step": 3102 }, { "epoch": 0.06, "learning_rate": 4.989337098958579e-06, "loss": 0.8926, "step": 3103 }, { "epoch": 0.06, "learning_rate": 4.989322999979371e-06, "loss": 0.9283, "step": 3104 }, { "epoch": 0.06, "learning_rate": 4.989308891705107e-06, "loss": 1.0765, "step": 3105 }, { "epoch": 0.06, "learning_rate": 4.989294774135839e-06, "loss": 1.2771, "step": 3106 }, { "epoch": 0.06, "learning_rate": 4.989280647271622e-06, "loss": 1.0687, "step": 3107 }, { "epoch": 0.06, "learning_rate": 4.989266511112507e-06, "loss": 0.9925, "step": 3108 }, { "epoch": 0.06, "learning_rate": 4.989252365658547e-06, "loss": 0.8943, "step": 3109 }, { "epoch": 0.06, "learning_rate": 4.989238210909795e-06, "loss": 0.8666, "step": 3110 }, { "epoch": 0.06, "learning_rate": 4.989224046866304e-06, "loss": 0.998, "step": 3111 }, { "epoch": 0.06, "learning_rate": 4.989209873528127e-06, "loss": 1.0463, "step": 3112 }, { "epoch": 0.06, "learning_rate": 4.989195690895316e-06, "loss": 0.931, "step": 3113 }, { "epoch": 0.06, "learning_rate": 4.989181498967924e-06, "loss": 0.9564, "step": 3114 }, { "epoch": 0.06, "learning_rate": 4.989167297746006e-06, "loss": 0.7587, "step": 3115 }, { "epoch": 0.06, "learning_rate": 4.989153087229613e-06, "loss": 1.0289, "step": 3116 }, { "epoch": 0.06, "learning_rate": 4.989138867418799e-06, "loss": 0.8306, "step": 3117 }, { "epoch": 0.06, "learning_rate": 4.989124638313617e-06, "loss": 0.8817, "step": 3118 }, { "epoch": 0.06, "learning_rate": 4.989110399914119e-06, "loss": 1.0621, "step": 3119 }, { "epoch": 0.06, "learning_rate": 4.98909615222036e-06, "loss": 1.0587, "step": 3120 }, { "epoch": 0.06, "learning_rate": 4.989081895232391e-06, "loss": 0.857, "step": 3121 }, { "epoch": 0.06, "learning_rate": 4.989067628950269e-06, "loss": 0.978, "step": 3122 }, { "epoch": 0.06, "learning_rate": 4.989053353374043e-06, "loss": 0.8757, "step": 3123 }, { "epoch": 0.06, "learning_rate": 4.9890390685037685e-06, "loss": 1.0547, "step": 3124 }, { "epoch": 0.06, "learning_rate": 4.989024774339498e-06, "loss": 1.2765, "step": 3125 }, { "epoch": 0.06, "learning_rate": 4.9890104708812845e-06, "loss": 0.8421, "step": 3126 }, { "epoch": 0.06, "learning_rate": 4.988996158129183e-06, "loss": 0.9113, "step": 3127 }, { "epoch": 0.06, "learning_rate": 4.988981836083248e-06, "loss": 0.9473, "step": 3128 }, { "epoch": 0.06, "learning_rate": 4.988967504743529e-06, "loss": 1.0098, "step": 3129 }, { "epoch": 0.06, "learning_rate": 4.988953164110082e-06, "loss": 0.8546, "step": 3130 }, { "epoch": 0.06, "learning_rate": 4.98893881418296e-06, "loss": 1.0229, "step": 3131 }, { "epoch": 0.06, "learning_rate": 4.988924454962217e-06, "loss": 0.9527, "step": 3132 }, { "epoch": 0.06, "learning_rate": 4.988910086447907e-06, "loss": 0.9166, "step": 3133 }, { "epoch": 0.06, "learning_rate": 4.988895708640082e-06, "loss": 0.8656, "step": 3134 }, { "epoch": 0.06, "learning_rate": 4.988881321538799e-06, "loss": 1.1969, "step": 3135 }, { "epoch": 0.06, "learning_rate": 4.9888669251441065e-06, "loss": 1.1079, "step": 3136 }, { "epoch": 0.06, "learning_rate": 4.988852519456063e-06, "loss": 1.1923, "step": 3137 }, { "epoch": 0.06, "learning_rate": 4.98883810447472e-06, "loss": 1.1058, "step": 3138 }, { "epoch": 0.06, "learning_rate": 4.988823680200132e-06, "loss": 0.7438, "step": 3139 }, { "epoch": 0.06, "learning_rate": 4.988809246632353e-06, "loss": 0.9133, "step": 3140 }, { "epoch": 0.06, "learning_rate": 4.9887948037714356e-06, "loss": 0.9059, "step": 3141 }, { "epoch": 0.06, "learning_rate": 4.988780351617435e-06, "loss": 1.041, "step": 3142 }, { "epoch": 0.06, "learning_rate": 4.988765890170405e-06, "loss": 1.1438, "step": 3143 }, { "epoch": 0.06, "learning_rate": 4.9887514194304e-06, "loss": 1.0888, "step": 3144 }, { "epoch": 0.06, "learning_rate": 4.988736939397472e-06, "loss": 0.8024, "step": 3145 }, { "epoch": 0.06, "learning_rate": 4.988722450071679e-06, "loss": 0.9752, "step": 3146 }, { "epoch": 0.06, "learning_rate": 4.988707951453071e-06, "loss": 0.8837, "step": 3147 }, { "epoch": 0.06, "learning_rate": 4.988693443541704e-06, "loss": 1.1167, "step": 3148 }, { "epoch": 0.06, "learning_rate": 4.988678926337633e-06, "loss": 1.1029, "step": 3149 }, { "epoch": 0.06, "learning_rate": 4.98866439984091e-06, "loss": 0.9937, "step": 3150 }, { "epoch": 0.06, "learning_rate": 4.988649864051591e-06, "loss": 0.8687, "step": 3151 }, { "epoch": 0.06, "learning_rate": 4.988635318969729e-06, "loss": 0.9001, "step": 3152 }, { "epoch": 0.06, "learning_rate": 4.98862076459538e-06, "loss": 0.8509, "step": 3153 }, { "epoch": 0.06, "learning_rate": 4.988606200928596e-06, "loss": 1.0383, "step": 3154 }, { "epoch": 0.06, "learning_rate": 4.9885916279694345e-06, "loss": 0.8553, "step": 3155 }, { "epoch": 0.06, "learning_rate": 4.988577045717947e-06, "loss": 1.1555, "step": 3156 }, { "epoch": 0.06, "learning_rate": 4.988562454174189e-06, "loss": 1.1799, "step": 3157 }, { "epoch": 0.06, "learning_rate": 4.988547853338216e-06, "loss": 1.0651, "step": 3158 }, { "epoch": 0.06, "learning_rate": 4.9885332432100804e-06, "loss": 0.9075, "step": 3159 }, { "epoch": 0.06, "learning_rate": 4.988518623789839e-06, "loss": 0.9981, "step": 3160 }, { "epoch": 0.06, "learning_rate": 4.988503995077545e-06, "loss": 0.8577, "step": 3161 }, { "epoch": 0.06, "learning_rate": 4.988489357073254e-06, "loss": 1.2635, "step": 3162 }, { "epoch": 0.06, "learning_rate": 4.988474709777019e-06, "loss": 0.8554, "step": 3163 }, { "epoch": 0.06, "learning_rate": 4.988460053188896e-06, "loss": 0.9026, "step": 3164 }, { "epoch": 0.06, "learning_rate": 4.98844538730894e-06, "loss": 0.9818, "step": 3165 }, { "epoch": 0.06, "learning_rate": 4.988430712137205e-06, "loss": 1.0841, "step": 3166 }, { "epoch": 0.06, "learning_rate": 4.988416027673746e-06, "loss": 1.0762, "step": 3167 }, { "epoch": 0.06, "learning_rate": 4.9884013339186174e-06, "loss": 1.0861, "step": 3168 }, { "epoch": 0.06, "learning_rate": 4.988386630871875e-06, "loss": 1.015, "step": 3169 }, { "epoch": 0.06, "learning_rate": 4.9883719185335735e-06, "loss": 0.945, "step": 3170 }, { "epoch": 0.06, "learning_rate": 4.988357196903767e-06, "loss": 0.8581, "step": 3171 }, { "epoch": 0.06, "learning_rate": 4.988342465982511e-06, "loss": 0.9077, "step": 3172 }, { "epoch": 0.06, "learning_rate": 4.9883277257698605e-06, "loss": 0.8629, "step": 3173 }, { "epoch": 0.06, "learning_rate": 4.988312976265871e-06, "loss": 0.9734, "step": 3174 }, { "epoch": 0.06, "learning_rate": 4.988298217470597e-06, "loss": 1.1397, "step": 3175 }, { "epoch": 0.06, "learning_rate": 4.988283449384094e-06, "loss": 1.0792, "step": 3176 }, { "epoch": 0.06, "learning_rate": 4.9882686720064155e-06, "loss": 0.8495, "step": 3177 }, { "epoch": 0.06, "learning_rate": 4.988253885337619e-06, "loss": 1.0378, "step": 3178 }, { "epoch": 0.06, "learning_rate": 4.9882390893777595e-06, "loss": 1.1332, "step": 3179 }, { "epoch": 0.06, "learning_rate": 4.988224284126891e-06, "loss": 1.0424, "step": 3180 }, { "epoch": 0.06, "learning_rate": 4.988209469585069e-06, "loss": 1.1986, "step": 3181 }, { "epoch": 0.06, "learning_rate": 4.98819464575235e-06, "loss": 1.1047, "step": 3182 }, { "epoch": 0.06, "learning_rate": 4.988179812628787e-06, "loss": 0.9634, "step": 3183 }, { "epoch": 0.06, "learning_rate": 4.988164970214438e-06, "loss": 0.9499, "step": 3184 }, { "epoch": 0.06, "learning_rate": 4.988150118509357e-06, "loss": 0.9357, "step": 3185 }, { "epoch": 0.06, "learning_rate": 4.9881352575136e-06, "loss": 0.8742, "step": 3186 }, { "epoch": 0.06, "learning_rate": 4.988120387227222e-06, "loss": 1.0876, "step": 3187 }, { "epoch": 0.06, "learning_rate": 4.9881055076502785e-06, "loss": 1.2155, "step": 3188 }, { "epoch": 0.06, "learning_rate": 4.9880906187828255e-06, "loss": 1.0182, "step": 3189 }, { "epoch": 0.06, "learning_rate": 4.988075720624919e-06, "loss": 0.8809, "step": 3190 }, { "epoch": 0.06, "learning_rate": 4.988060813176613e-06, "loss": 0.9521, "step": 3191 }, { "epoch": 0.06, "learning_rate": 4.988045896437964e-06, "loss": 0.9178, "step": 3192 }, { "epoch": 0.06, "learning_rate": 4.988030970409029e-06, "loss": 1.2318, "step": 3193 }, { "epoch": 0.06, "learning_rate": 4.988016035089863e-06, "loss": 1.0329, "step": 3194 }, { "epoch": 0.06, "learning_rate": 4.988001090480521e-06, "loss": 0.9101, "step": 3195 }, { "epoch": 0.06, "learning_rate": 4.987986136581059e-06, "loss": 0.8961, "step": 3196 }, { "epoch": 0.06, "learning_rate": 4.987971173391532e-06, "loss": 1.0169, "step": 3197 }, { "epoch": 0.06, "learning_rate": 4.987956200911998e-06, "loss": 0.9439, "step": 3198 }, { "epoch": 0.06, "learning_rate": 4.9879412191425114e-06, "loss": 1.3158, "step": 3199 }, { "epoch": 0.06, "learning_rate": 4.9879262280831295e-06, "loss": 1.0399, "step": 3200 }, { "epoch": 0.06, "learning_rate": 4.987911227733906e-06, "loss": 0.9493, "step": 3201 }, { "epoch": 0.06, "learning_rate": 4.9878962180949e-06, "loss": 0.9516, "step": 3202 }, { "epoch": 0.06, "learning_rate": 4.987881199166164e-06, "loss": 1.1976, "step": 3203 }, { "epoch": 0.06, "learning_rate": 4.987866170947757e-06, "loss": 0.9925, "step": 3204 }, { "epoch": 0.06, "learning_rate": 4.9878511334397336e-06, "loss": 1.0796, "step": 3205 }, { "epoch": 0.06, "learning_rate": 4.987836086642151e-06, "loss": 1.119, "step": 3206 }, { "epoch": 0.06, "learning_rate": 4.987821030555063e-06, "loss": 0.9375, "step": 3207 }, { "epoch": 0.06, "learning_rate": 4.987805965178529e-06, "loss": 0.8961, "step": 3208 }, { "epoch": 0.06, "learning_rate": 4.987790890512604e-06, "loss": 0.9719, "step": 3209 }, { "epoch": 0.06, "learning_rate": 4.987775806557343e-06, "loss": 0.8265, "step": 3210 }, { "epoch": 0.06, "learning_rate": 4.987760713312804e-06, "loss": 0.9056, "step": 3211 }, { "epoch": 0.06, "learning_rate": 4.987745610779043e-06, "loss": 1.0173, "step": 3212 }, { "epoch": 0.06, "learning_rate": 4.9877304989561155e-06, "loss": 1.0047, "step": 3213 }, { "epoch": 0.06, "learning_rate": 4.987715377844079e-06, "loss": 0.9512, "step": 3214 }, { "epoch": 0.06, "learning_rate": 4.98770024744299e-06, "loss": 0.7927, "step": 3215 }, { "epoch": 0.06, "learning_rate": 4.987685107752904e-06, "loss": 0.9536, "step": 3216 }, { "epoch": 0.06, "learning_rate": 4.987669958773878e-06, "loss": 0.9841, "step": 3217 }, { "epoch": 0.06, "learning_rate": 4.987654800505969e-06, "loss": 1.0417, "step": 3218 }, { "epoch": 0.06, "learning_rate": 4.9876396329492335e-06, "loss": 1.0021, "step": 3219 }, { "epoch": 0.06, "learning_rate": 4.987624456103728e-06, "loss": 1.0852, "step": 3220 }, { "epoch": 0.06, "learning_rate": 4.987609269969508e-06, "loss": 0.7628, "step": 3221 }, { "epoch": 0.06, "learning_rate": 4.987594074546632e-06, "loss": 0.9393, "step": 3222 }, { "epoch": 0.06, "learning_rate": 4.987578869835156e-06, "loss": 0.91, "step": 3223 }, { "epoch": 0.06, "learning_rate": 4.987563655835136e-06, "loss": 0.9846, "step": 3224 }, { "epoch": 0.06, "learning_rate": 4.987548432546631e-06, "loss": 1.1769, "step": 3225 }, { "epoch": 0.06, "learning_rate": 4.987533199969694e-06, "loss": 0.7743, "step": 3226 }, { "epoch": 0.06, "learning_rate": 4.987517958104386e-06, "loss": 0.8277, "step": 3227 }, { "epoch": 0.06, "learning_rate": 4.987502706950763e-06, "loss": 1.0798, "step": 3228 }, { "epoch": 0.06, "learning_rate": 4.987487446508879e-06, "loss": 0.9589, "step": 3229 }, { "epoch": 0.06, "learning_rate": 4.987472176778795e-06, "loss": 1.1636, "step": 3230 }, { "epoch": 0.06, "learning_rate": 4.987456897760566e-06, "loss": 1.2269, "step": 3231 }, { "epoch": 0.06, "learning_rate": 4.987441609454249e-06, "loss": 1.1173, "step": 3232 }, { "epoch": 0.06, "learning_rate": 4.987426311859901e-06, "loss": 0.9407, "step": 3233 }, { "epoch": 0.06, "learning_rate": 4.987411004977579e-06, "loss": 0.9544, "step": 3234 }, { "epoch": 0.06, "learning_rate": 4.987395688807341e-06, "loss": 0.8386, "step": 3235 }, { "epoch": 0.06, "learning_rate": 4.987380363349244e-06, "loss": 0.9368, "step": 3236 }, { "epoch": 0.06, "learning_rate": 4.987365028603345e-06, "loss": 1.209, "step": 3237 }, { "epoch": 0.06, "learning_rate": 4.9873496845697016e-06, "loss": 1.1279, "step": 3238 }, { "epoch": 0.06, "learning_rate": 4.987334331248369e-06, "loss": 0.944, "step": 3239 }, { "epoch": 0.06, "learning_rate": 4.987318968639408e-06, "loss": 0.8348, "step": 3240 }, { "epoch": 0.06, "learning_rate": 4.987303596742874e-06, "loss": 0.9882, "step": 3241 }, { "epoch": 0.06, "learning_rate": 4.987288215558824e-06, "loss": 0.9528, "step": 3242 }, { "epoch": 0.06, "learning_rate": 4.987272825087316e-06, "loss": 1.2251, "step": 3243 }, { "epoch": 0.06, "learning_rate": 4.987257425328409e-06, "loss": 1.1044, "step": 3244 }, { "epoch": 0.06, "learning_rate": 4.987242016282157e-06, "loss": 0.8309, "step": 3245 }, { "epoch": 0.06, "learning_rate": 4.987226597948621e-06, "loss": 0.98, "step": 3246 }, { "epoch": 0.06, "learning_rate": 4.987211170327857e-06, "loss": 0.7759, "step": 3247 }, { "epoch": 0.06, "learning_rate": 4.987195733419922e-06, "loss": 1.0422, "step": 3248 }, { "epoch": 0.06, "learning_rate": 4.987180287224875e-06, "loss": 0.826, "step": 3249 }, { "epoch": 0.06, "learning_rate": 4.987164831742772e-06, "loss": 1.0439, "step": 3250 }, { "epoch": 0.06, "learning_rate": 4.9871493669736735e-06, "loss": 0.9876, "step": 3251 }, { "epoch": 0.06, "learning_rate": 4.987133892917635e-06, "loss": 0.9244, "step": 3252 }, { "epoch": 0.06, "learning_rate": 4.987118409574714e-06, "loss": 1.1338, "step": 3253 }, { "epoch": 0.06, "learning_rate": 4.9871029169449695e-06, "loss": 1.0198, "step": 3254 }, { "epoch": 0.06, "learning_rate": 4.9870874150284585e-06, "loss": 1.0354, "step": 3255 }, { "epoch": 0.06, "learning_rate": 4.98707190382524e-06, "loss": 1.0929, "step": 3256 }, { "epoch": 0.06, "learning_rate": 4.987056383335372e-06, "loss": 0.9416, "step": 3257 }, { "epoch": 0.06, "learning_rate": 4.98704085355891e-06, "loss": 1.0615, "step": 3258 }, { "epoch": 0.06, "learning_rate": 4.987025314495915e-06, "loss": 1.0106, "step": 3259 }, { "epoch": 0.06, "learning_rate": 4.9870097661464434e-06, "loss": 1.0046, "step": 3260 }, { "epoch": 0.06, "learning_rate": 4.986994208510554e-06, "loss": 0.9888, "step": 3261 }, { "epoch": 0.06, "learning_rate": 4.986978641588304e-06, "loss": 1.0519, "step": 3262 }, { "epoch": 0.06, "learning_rate": 4.986963065379752e-06, "loss": 1.2354, "step": 3263 }, { "epoch": 0.06, "learning_rate": 4.986947479884956e-06, "loss": 1.0435, "step": 3264 }, { "epoch": 0.06, "learning_rate": 4.986931885103974e-06, "loss": 0.9267, "step": 3265 }, { "epoch": 0.06, "learning_rate": 4.986916281036865e-06, "loss": 0.9966, "step": 3266 }, { "epoch": 0.06, "learning_rate": 4.986900667683687e-06, "loss": 1.0261, "step": 3267 }, { "epoch": 0.06, "learning_rate": 4.986885045044498e-06, "loss": 1.0242, "step": 3268 }, { "epoch": 0.06, "learning_rate": 4.9868694131193575e-06, "loss": 1.1085, "step": 3269 }, { "epoch": 0.06, "learning_rate": 4.9868537719083215e-06, "loss": 1.0251, "step": 3270 }, { "epoch": 0.06, "learning_rate": 4.9868381214114504e-06, "loss": 0.9031, "step": 3271 }, { "epoch": 0.06, "learning_rate": 4.986822461628802e-06, "loss": 0.8771, "step": 3272 }, { "epoch": 0.06, "learning_rate": 4.986806792560435e-06, "loss": 0.8441, "step": 3273 }, { "epoch": 0.06, "learning_rate": 4.986791114206407e-06, "loss": 1.1312, "step": 3274 }, { "epoch": 0.06, "learning_rate": 4.9867754265667775e-06, "loss": 1.0825, "step": 3275 }, { "epoch": 0.06, "learning_rate": 4.986759729641605e-06, "loss": 0.9547, "step": 3276 }, { "epoch": 0.06, "learning_rate": 4.986744023430947e-06, "loss": 1.0443, "step": 3277 }, { "epoch": 0.06, "learning_rate": 4.986728307934864e-06, "loss": 1.0334, "step": 3278 }, { "epoch": 0.06, "learning_rate": 4.986712583153413e-06, "loss": 0.8243, "step": 3279 }, { "epoch": 0.06, "learning_rate": 4.986696849086655e-06, "loss": 0.8359, "step": 3280 }, { "epoch": 0.06, "learning_rate": 4.986681105734646e-06, "loss": 1.0269, "step": 3281 }, { "epoch": 0.06, "learning_rate": 4.986665353097446e-06, "loss": 0.9498, "step": 3282 }, { "epoch": 0.06, "learning_rate": 4.9866495911751146e-06, "loss": 0.8754, "step": 3283 }, { "epoch": 0.06, "learning_rate": 4.986633819967709e-06, "loss": 0.9857, "step": 3284 }, { "epoch": 0.06, "learning_rate": 4.986618039475289e-06, "loss": 1.1011, "step": 3285 }, { "epoch": 0.06, "learning_rate": 4.9866022496979135e-06, "loss": 0.9033, "step": 3286 }, { "epoch": 0.06, "learning_rate": 4.986586450635642e-06, "loss": 1.2705, "step": 3287 }, { "epoch": 0.06, "learning_rate": 4.986570642288533e-06, "loss": 0.9719, "step": 3288 }, { "epoch": 0.06, "learning_rate": 4.986554824656645e-06, "loss": 1.0591, "step": 3289 }, { "epoch": 0.06, "learning_rate": 4.986538997740038e-06, "loss": 0.8485, "step": 3290 }, { "epoch": 0.06, "learning_rate": 4.98652316153877e-06, "loss": 0.9046, "step": 3291 }, { "epoch": 0.06, "learning_rate": 4.986507316052901e-06, "loss": 1.0261, "step": 3292 }, { "epoch": 0.06, "learning_rate": 4.98649146128249e-06, "loss": 1.0469, "step": 3293 }, { "epoch": 0.06, "learning_rate": 4.986475597227596e-06, "loss": 1.3395, "step": 3294 }, { "epoch": 0.06, "learning_rate": 4.986459723888278e-06, "loss": 0.6858, "step": 3295 }, { "epoch": 0.06, "learning_rate": 4.986443841264596e-06, "loss": 0.8892, "step": 3296 }, { "epoch": 0.06, "learning_rate": 4.986427949356609e-06, "loss": 1.0475, "step": 3297 }, { "epoch": 0.06, "learning_rate": 4.986412048164376e-06, "loss": 1.101, "step": 3298 }, { "epoch": 0.06, "learning_rate": 4.986396137687957e-06, "loss": 0.8019, "step": 3299 }, { "epoch": 0.06, "learning_rate": 4.986380217927411e-06, "loss": 1.2884, "step": 3300 }, { "epoch": 0.06, "learning_rate": 4.9863642888827975e-06, "loss": 0.901, "step": 3301 }, { "epoch": 0.06, "learning_rate": 4.986348350554176e-06, "loss": 0.9324, "step": 3302 }, { "epoch": 0.06, "learning_rate": 4.9863324029416055e-06, "loss": 1.0622, "step": 3303 }, { "epoch": 0.06, "learning_rate": 4.986316446045147e-06, "loss": 0.8926, "step": 3304 }, { "epoch": 0.06, "learning_rate": 4.986300479864858e-06, "loss": 0.9856, "step": 3305 }, { "epoch": 0.06, "learning_rate": 4.9862845044008005e-06, "loss": 1.2387, "step": 3306 }, { "epoch": 0.06, "learning_rate": 4.986268519653032e-06, "loss": 0.886, "step": 3307 }, { "epoch": 0.06, "learning_rate": 4.9862525256216126e-06, "loss": 0.7635, "step": 3308 }, { "epoch": 0.06, "learning_rate": 4.986236522306603e-06, "loss": 0.9803, "step": 3309 }, { "epoch": 0.06, "learning_rate": 4.986220509708063e-06, "loss": 0.9197, "step": 3310 }, { "epoch": 0.06, "learning_rate": 4.986204487826052e-06, "loss": 0.9761, "step": 3311 }, { "epoch": 0.06, "learning_rate": 4.986188456660628e-06, "loss": 1.1687, "step": 3312 }, { "epoch": 0.06, "learning_rate": 4.9861724162118545e-06, "loss": 1.0812, "step": 3313 }, { "epoch": 0.06, "learning_rate": 4.986156366479788e-06, "loss": 0.8012, "step": 3314 }, { "epoch": 0.06, "learning_rate": 4.986140307464491e-06, "loss": 0.7918, "step": 3315 }, { "epoch": 0.06, "learning_rate": 4.986124239166022e-06, "loss": 0.8142, "step": 3316 }, { "epoch": 0.06, "learning_rate": 4.986108161584441e-06, "loss": 0.8393, "step": 3317 }, { "epoch": 0.06, "learning_rate": 4.986092074719808e-06, "loss": 0.9592, "step": 3318 }, { "epoch": 0.06, "learning_rate": 4.986075978572184e-06, "loss": 1.2522, "step": 3319 }, { "epoch": 0.06, "learning_rate": 4.986059873141628e-06, "loss": 0.8287, "step": 3320 }, { "epoch": 0.06, "learning_rate": 4.986043758428201e-06, "loss": 0.9483, "step": 3321 }, { "epoch": 0.06, "learning_rate": 4.986027634431963e-06, "loss": 0.9608, "step": 3322 }, { "epoch": 0.06, "learning_rate": 4.9860115011529745e-06, "loss": 0.7852, "step": 3323 }, { "epoch": 0.06, "learning_rate": 4.985995358591294e-06, "loss": 0.9073, "step": 3324 }, { "epoch": 0.06, "learning_rate": 4.9859792067469835e-06, "loss": 1.2498, "step": 3325 }, { "epoch": 0.06, "learning_rate": 4.985963045620103e-06, "loss": 0.9654, "step": 3326 }, { "epoch": 0.06, "learning_rate": 4.985946875210713e-06, "loss": 1.0272, "step": 3327 }, { "epoch": 0.06, "learning_rate": 4.985930695518874e-06, "loss": 1.0158, "step": 3328 }, { "epoch": 0.06, "learning_rate": 4.985914506544645e-06, "loss": 0.9723, "step": 3329 }, { "epoch": 0.06, "learning_rate": 4.985898308288087e-06, "loss": 0.9924, "step": 3330 }, { "epoch": 0.06, "learning_rate": 4.985882100749262e-06, "loss": 1.1497, "step": 3331 }, { "epoch": 0.06, "learning_rate": 4.9858658839282295e-06, "loss": 1.1221, "step": 3332 }, { "epoch": 0.06, "learning_rate": 4.9858496578250505e-06, "loss": 0.7697, "step": 3333 }, { "epoch": 0.06, "learning_rate": 4.985833422439784e-06, "loss": 0.9643, "step": 3334 }, { "epoch": 0.06, "learning_rate": 4.985817177772492e-06, "loss": 0.8783, "step": 3335 }, { "epoch": 0.06, "learning_rate": 4.985800923823235e-06, "loss": 1.1376, "step": 3336 }, { "epoch": 0.06, "learning_rate": 4.985784660592073e-06, "loss": 1.1425, "step": 3337 }, { "epoch": 0.06, "learning_rate": 4.985768388079068e-06, "loss": 1.0952, "step": 3338 }, { "epoch": 0.06, "learning_rate": 4.98575210628428e-06, "loss": 0.9715, "step": 3339 }, { "epoch": 0.06, "learning_rate": 4.985735815207769e-06, "loss": 0.8719, "step": 3340 }, { "epoch": 0.06, "learning_rate": 4.985719514849598e-06, "loss": 0.834, "step": 3341 }, { "epoch": 0.06, "learning_rate": 4.985703205209826e-06, "loss": 1.0515, "step": 3342 }, { "epoch": 0.06, "learning_rate": 4.985686886288514e-06, "loss": 1.0801, "step": 3343 }, { "epoch": 0.06, "learning_rate": 4.985670558085724e-06, "loss": 0.8957, "step": 3344 }, { "epoch": 0.06, "learning_rate": 4.985654220601516e-06, "loss": 1.0396, "step": 3345 }, { "epoch": 0.06, "learning_rate": 4.985637873835951e-06, "loss": 0.7057, "step": 3346 }, { "epoch": 0.06, "learning_rate": 4.985621517789091e-06, "loss": 0.9119, "step": 3347 }, { "epoch": 0.06, "learning_rate": 4.985605152460996e-06, "loss": 1.0679, "step": 3348 }, { "epoch": 0.06, "learning_rate": 4.9855887778517285e-06, "loss": 1.0089, "step": 3349 }, { "epoch": 0.06, "learning_rate": 4.985572393961348e-06, "loss": 0.8199, "step": 3350 }, { "epoch": 0.06, "learning_rate": 4.9855560007899165e-06, "loss": 1.1477, "step": 3351 }, { "epoch": 0.06, "learning_rate": 4.985539598337496e-06, "loss": 0.9941, "step": 3352 }, { "epoch": 0.06, "learning_rate": 4.985523186604145e-06, "loss": 0.9819, "step": 3353 }, { "epoch": 0.06, "learning_rate": 4.985506765589928e-06, "loss": 0.8709, "step": 3354 }, { "epoch": 0.06, "learning_rate": 4.985490335294904e-06, "loss": 0.9753, "step": 3355 }, { "epoch": 0.06, "learning_rate": 4.985473895719136e-06, "loss": 1.2631, "step": 3356 }, { "epoch": 0.06, "learning_rate": 4.985457446862684e-06, "loss": 0.9479, "step": 3357 }, { "epoch": 0.06, "learning_rate": 4.9854409887256105e-06, "loss": 0.741, "step": 3358 }, { "epoch": 0.06, "learning_rate": 4.985424521307977e-06, "loss": 0.9309, "step": 3359 }, { "epoch": 0.06, "learning_rate": 4.985408044609844e-06, "loss": 0.8267, "step": 3360 }, { "epoch": 0.06, "learning_rate": 4.985391558631274e-06, "loss": 0.8033, "step": 3361 }, { "epoch": 0.06, "learning_rate": 4.985375063372327e-06, "loss": 0.9872, "step": 3362 }, { "epoch": 0.06, "learning_rate": 4.9853585588330675e-06, "loss": 0.9213, "step": 3363 }, { "epoch": 0.06, "learning_rate": 4.9853420450135545e-06, "loss": 0.9058, "step": 3364 }, { "epoch": 0.06, "learning_rate": 4.98532552191385e-06, "loss": 0.9578, "step": 3365 }, { "epoch": 0.06, "learning_rate": 4.985308989534017e-06, "loss": 1.0745, "step": 3366 }, { "epoch": 0.06, "learning_rate": 4.985292447874116e-06, "loss": 0.8031, "step": 3367 }, { "epoch": 0.06, "learning_rate": 4.985275896934209e-06, "loss": 1.1948, "step": 3368 }, { "epoch": 0.06, "learning_rate": 4.985259336714359e-06, "loss": 1.1099, "step": 3369 }, { "epoch": 0.06, "learning_rate": 4.985242767214625e-06, "loss": 0.9993, "step": 3370 }, { "epoch": 0.06, "learning_rate": 4.985226188435072e-06, "loss": 0.9001, "step": 3371 }, { "epoch": 0.06, "learning_rate": 4.98520960037576e-06, "loss": 0.9054, "step": 3372 }, { "epoch": 0.06, "learning_rate": 4.985193003036752e-06, "loss": 1.0052, "step": 3373 }, { "epoch": 0.06, "learning_rate": 4.9851763964181095e-06, "loss": 1.0768, "step": 3374 }, { "epoch": 0.06, "learning_rate": 4.985159780519895e-06, "loss": 1.1218, "step": 3375 }, { "epoch": 0.06, "learning_rate": 4.98514315534217e-06, "loss": 0.9449, "step": 3376 }, { "epoch": 0.06, "learning_rate": 4.985126520884996e-06, "loss": 1.0088, "step": 3377 }, { "epoch": 0.06, "learning_rate": 4.985109877148437e-06, "loss": 0.9756, "step": 3378 }, { "epoch": 0.06, "learning_rate": 4.985093224132552e-06, "loss": 0.9083, "step": 3379 }, { "epoch": 0.06, "learning_rate": 4.9850765618374055e-06, "loss": 1.1695, "step": 3380 }, { "epoch": 0.06, "learning_rate": 4.98505989026306e-06, "loss": 0.9372, "step": 3381 }, { "epoch": 0.06, "learning_rate": 4.985043209409577e-06, "loss": 1.037, "step": 3382 }, { "epoch": 0.06, "learning_rate": 4.985026519277019e-06, "loss": 0.8373, "step": 3383 }, { "epoch": 0.06, "learning_rate": 4.985009819865448e-06, "loss": 0.922, "step": 3384 }, { "epoch": 0.06, "learning_rate": 4.9849931111749265e-06, "loss": 0.9286, "step": 3385 }, { "epoch": 0.06, "learning_rate": 4.984976393205516e-06, "loss": 0.8646, "step": 3386 }, { "epoch": 0.06, "learning_rate": 4.984959665957281e-06, "loss": 1.1438, "step": 3387 }, { "epoch": 0.06, "learning_rate": 4.984942929430283e-06, "loss": 1.1383, "step": 3388 }, { "epoch": 0.06, "learning_rate": 4.984926183624584e-06, "loss": 0.9304, "step": 3389 }, { "epoch": 0.06, "learning_rate": 4.984909428540246e-06, "loss": 0.8123, "step": 3390 }, { "epoch": 0.06, "learning_rate": 4.984892664177333e-06, "loss": 1.0558, "step": 3391 }, { "epoch": 0.06, "learning_rate": 4.9848758905359075e-06, "loss": 0.9451, "step": 3392 }, { "epoch": 0.06, "learning_rate": 4.9848591076160305e-06, "loss": 1.1002, "step": 3393 }, { "epoch": 0.06, "learning_rate": 4.984842315417766e-06, "loss": 0.89, "step": 3394 }, { "epoch": 0.06, "learning_rate": 4.984825513941177e-06, "loss": 0.9983, "step": 3395 }, { "epoch": 0.06, "learning_rate": 4.984808703186326e-06, "loss": 0.7284, "step": 3396 }, { "epoch": 0.06, "learning_rate": 4.984791883153275e-06, "loss": 0.92, "step": 3397 }, { "epoch": 0.06, "learning_rate": 4.984775053842087e-06, "loss": 0.9078, "step": 3398 }, { "epoch": 0.06, "learning_rate": 4.9847582152528265e-06, "loss": 1.0881, "step": 3399 }, { "epoch": 0.06, "learning_rate": 4.984741367385553e-06, "loss": 1.201, "step": 3400 }, { "epoch": 0.06, "learning_rate": 4.984724510240333e-06, "loss": 0.9286, "step": 3401 }, { "epoch": 0.06, "learning_rate": 4.984707643817227e-06, "loss": 0.8136, "step": 3402 }, { "epoch": 0.06, "learning_rate": 4.9846907681163e-06, "loss": 0.886, "step": 3403 }, { "epoch": 0.06, "learning_rate": 4.984673883137612e-06, "loss": 0.9653, "step": 3404 }, { "epoch": 0.06, "learning_rate": 4.984656988881229e-06, "loss": 0.9803, "step": 3405 }, { "epoch": 0.06, "learning_rate": 4.9846400853472125e-06, "loss": 1.1031, "step": 3406 }, { "epoch": 0.06, "learning_rate": 4.984623172535627e-06, "loss": 0.9873, "step": 3407 }, { "epoch": 0.06, "learning_rate": 4.984606250446534e-06, "loss": 1.0143, "step": 3408 }, { "epoch": 0.06, "learning_rate": 4.984589319079998e-06, "loss": 0.892, "step": 3409 }, { "epoch": 0.06, "learning_rate": 4.984572378436081e-06, "loss": 0.9776, "step": 3410 }, { "epoch": 0.06, "learning_rate": 4.984555428514847e-06, "loss": 1.1361, "step": 3411 }, { "epoch": 0.06, "learning_rate": 4.984538469316359e-06, "loss": 0.9258, "step": 3412 }, { "epoch": 0.06, "learning_rate": 4.984521500840681e-06, "loss": 1.0599, "step": 3413 }, { "epoch": 0.06, "learning_rate": 4.984504523087876e-06, "loss": 1.073, "step": 3414 }, { "epoch": 0.06, "learning_rate": 4.984487536058007e-06, "loss": 0.962, "step": 3415 }, { "epoch": 0.06, "learning_rate": 4.984470539751138e-06, "loss": 0.9725, "step": 3416 }, { "epoch": 0.06, "learning_rate": 4.984453534167332e-06, "loss": 0.9012, "step": 3417 }, { "epoch": 0.06, "learning_rate": 4.984436519306653e-06, "loss": 1.4097, "step": 3418 }, { "epoch": 0.06, "learning_rate": 4.984419495169164e-06, "loss": 1.041, "step": 3419 }, { "epoch": 0.06, "learning_rate": 4.984402461754929e-06, "loss": 1.1088, "step": 3420 }, { "epoch": 0.06, "learning_rate": 4.984385419064011e-06, "loss": 0.7985, "step": 3421 }, { "epoch": 0.06, "learning_rate": 4.984368367096474e-06, "loss": 0.9913, "step": 3422 }, { "epoch": 0.06, "learning_rate": 4.984351305852382e-06, "loss": 1.1429, "step": 3423 }, { "epoch": 0.06, "learning_rate": 4.984334235331798e-06, "loss": 1.1038, "step": 3424 }, { "epoch": 0.06, "learning_rate": 4.9843171555347865e-06, "loss": 1.2264, "step": 3425 }, { "epoch": 0.06, "learning_rate": 4.984300066461411e-06, "loss": 1.0391, "step": 3426 }, { "epoch": 0.06, "learning_rate": 4.9842829681117346e-06, "loss": 0.9355, "step": 3427 }, { "epoch": 0.06, "learning_rate": 4.984265860485822e-06, "loss": 0.8754, "step": 3428 }, { "epoch": 0.06, "learning_rate": 4.984248743583737e-06, "loss": 0.954, "step": 3429 }, { "epoch": 0.06, "learning_rate": 4.984231617405544e-06, "loss": 1.0671, "step": 3430 }, { "epoch": 0.06, "learning_rate": 4.984214481951305e-06, "loss": 1.1972, "step": 3431 }, { "epoch": 0.06, "learning_rate": 4.984197337221086e-06, "loss": 0.6765, "step": 3432 }, { "epoch": 0.06, "learning_rate": 4.98418018321495e-06, "loss": 0.9624, "step": 3433 }, { "epoch": 0.06, "learning_rate": 4.984163019932961e-06, "loss": 0.9665, "step": 3434 }, { "epoch": 0.06, "learning_rate": 4.984145847375185e-06, "loss": 1.012, "step": 3435 }, { "epoch": 0.06, "learning_rate": 4.984128665541683e-06, "loss": 1.0443, "step": 3436 }, { "epoch": 0.06, "learning_rate": 4.9841114744325215e-06, "loss": 1.1357, "step": 3437 }, { "epoch": 0.06, "learning_rate": 4.984094274047764e-06, "loss": 1.1496, "step": 3438 }, { "epoch": 0.06, "learning_rate": 4.9840770643874745e-06, "loss": 0.7585, "step": 3439 }, { "epoch": 0.06, "learning_rate": 4.984059845451718e-06, "loss": 0.9147, "step": 3440 }, { "epoch": 0.06, "learning_rate": 4.9840426172405565e-06, "loss": 1.0243, "step": 3441 }, { "epoch": 0.06, "learning_rate": 4.9840253797540574e-06, "loss": 0.95, "step": 3442 }, { "epoch": 0.06, "learning_rate": 4.984008132992283e-06, "loss": 1.0657, "step": 3443 }, { "epoch": 0.06, "learning_rate": 4.983990876955299e-06, "loss": 1.2659, "step": 3444 }, { "epoch": 0.06, "learning_rate": 4.983973611643169e-06, "loss": 0.9196, "step": 3445 }, { "epoch": 0.07, "learning_rate": 4.983956337055957e-06, "loss": 0.8163, "step": 3446 }, { "epoch": 0.07, "learning_rate": 4.983939053193729e-06, "loss": 0.9787, "step": 3447 }, { "epoch": 0.07, "learning_rate": 4.98392176005655e-06, "loss": 1.1091, "step": 3448 }, { "epoch": 0.07, "learning_rate": 4.983904457644481e-06, "loss": 1.1213, "step": 3449 }, { "epoch": 0.07, "learning_rate": 4.98388714595759e-06, "loss": 1.2307, "step": 3450 }, { "epoch": 0.07, "learning_rate": 4.98386982499594e-06, "loss": 1.0691, "step": 3451 }, { "epoch": 0.07, "learning_rate": 4.983852494759597e-06, "loss": 0.8289, "step": 3452 }, { "epoch": 0.07, "learning_rate": 4.983835155248624e-06, "loss": 1.1523, "step": 3453 }, { "epoch": 0.07, "learning_rate": 4.983817806463087e-06, "loss": 0.922, "step": 3454 }, { "epoch": 0.07, "learning_rate": 4.983800448403051e-06, "loss": 0.7886, "step": 3455 }, { "epoch": 0.07, "learning_rate": 4.98378308106858e-06, "loss": 1.0953, "step": 3456 }, { "epoch": 0.07, "learning_rate": 4.9837657044597396e-06, "loss": 1.0296, "step": 3457 }, { "epoch": 0.07, "learning_rate": 4.9837483185765935e-06, "loss": 0.9193, "step": 3458 }, { "epoch": 0.07, "learning_rate": 4.9837309234192075e-06, "loss": 1.0933, "step": 3459 }, { "epoch": 0.07, "learning_rate": 4.983713518987646e-06, "loss": 0.9803, "step": 3460 }, { "epoch": 0.07, "learning_rate": 4.9836961052819756e-06, "loss": 1.0379, "step": 3461 }, { "epoch": 0.07, "learning_rate": 4.983678682302258e-06, "loss": 1.0993, "step": 3462 }, { "epoch": 0.07, "learning_rate": 4.983661250048563e-06, "loss": 1.0132, "step": 3463 }, { "epoch": 0.07, "learning_rate": 4.983643808520951e-06, "loss": 0.9798, "step": 3464 }, { "epoch": 0.07, "learning_rate": 4.98362635771949e-06, "loss": 0.9752, "step": 3465 }, { "epoch": 0.07, "learning_rate": 4.983608897644244e-06, "loss": 0.9523, "step": 3466 }, { "epoch": 0.07, "learning_rate": 4.983591428295279e-06, "loss": 1.1161, "step": 3467 }, { "epoch": 0.07, "learning_rate": 4.98357394967266e-06, "loss": 1.1685, "step": 3468 }, { "epoch": 0.07, "learning_rate": 4.983556461776451e-06, "loss": 0.9863, "step": 3469 }, { "epoch": 0.07, "learning_rate": 4.983538964606719e-06, "loss": 1.0465, "step": 3470 }, { "epoch": 0.07, "learning_rate": 4.9835214581635285e-06, "loss": 0.9827, "step": 3471 }, { "epoch": 0.07, "learning_rate": 4.983503942446945e-06, "loss": 0.9097, "step": 3472 }, { "epoch": 0.07, "learning_rate": 4.983486417457034e-06, "loss": 0.8707, "step": 3473 }, { "epoch": 0.07, "learning_rate": 4.98346888319386e-06, "loss": 1.2969, "step": 3474 }, { "epoch": 0.07, "learning_rate": 4.983451339657491e-06, "loss": 0.9245, "step": 3475 }, { "epoch": 0.07, "learning_rate": 4.98343378684799e-06, "loss": 1.1124, "step": 3476 }, { "epoch": 0.07, "learning_rate": 4.983416224765423e-06, "loss": 0.8481, "step": 3477 }, { "epoch": 0.07, "learning_rate": 4.983398653409857e-06, "loss": 0.8283, "step": 3478 }, { "epoch": 0.07, "learning_rate": 4.983381072781355e-06, "loss": 0.9929, "step": 3479 }, { "epoch": 0.07, "learning_rate": 4.983363482879986e-06, "loss": 1.0548, "step": 3480 }, { "epoch": 0.07, "learning_rate": 4.983345883705812e-06, "loss": 1.3278, "step": 3481 }, { "epoch": 0.07, "learning_rate": 4.983328275258902e-06, "loss": 0.883, "step": 3482 }, { "epoch": 0.07, "learning_rate": 4.98331065753932e-06, "loss": 0.7419, "step": 3483 }, { "epoch": 0.07, "learning_rate": 4.983293030547131e-06, "loss": 1.0169, "step": 3484 }, { "epoch": 0.07, "learning_rate": 4.983275394282404e-06, "loss": 0.7661, "step": 3485 }, { "epoch": 0.07, "learning_rate": 4.983257748745202e-06, "loss": 0.9375, "step": 3486 }, { "epoch": 0.07, "learning_rate": 4.9832400939355916e-06, "loss": 1.1981, "step": 3487 }, { "epoch": 0.07, "learning_rate": 4.983222429853639e-06, "loss": 1.1357, "step": 3488 }, { "epoch": 0.07, "learning_rate": 4.983204756499409e-06, "loss": 0.9289, "step": 3489 }, { "epoch": 0.07, "learning_rate": 4.98318707387297e-06, "loss": 0.9131, "step": 3490 }, { "epoch": 0.07, "learning_rate": 4.983169381974385e-06, "loss": 0.9901, "step": 3491 }, { "epoch": 0.07, "learning_rate": 4.983151680803723e-06, "loss": 0.903, "step": 3492 }, { "epoch": 0.07, "learning_rate": 4.983133970361049e-06, "loss": 1.1494, "step": 3493 }, { "epoch": 0.07, "learning_rate": 4.9831162506464285e-06, "loss": 1.1173, "step": 3494 }, { "epoch": 0.07, "learning_rate": 4.983098521659927e-06, "loss": 1.1018, "step": 3495 }, { "epoch": 0.07, "learning_rate": 4.983080783401612e-06, "loss": 1.0258, "step": 3496 }, { "epoch": 0.07, "learning_rate": 4.983063035871552e-06, "loss": 0.8746, "step": 3497 }, { "epoch": 0.07, "learning_rate": 4.983045279069808e-06, "loss": 1.0488, "step": 3498 }, { "epoch": 0.07, "learning_rate": 4.98302751299645e-06, "loss": 1.1529, "step": 3499 }, { "epoch": 0.07, "learning_rate": 4.983009737651543e-06, "loss": 1.0449, "step": 3500 }, { "epoch": 0.07, "learning_rate": 4.982991953035155e-06, "loss": 1.0703, "step": 3501 }, { "epoch": 0.07, "learning_rate": 4.982974159147349e-06, "loss": 0.8403, "step": 3502 }, { "epoch": 0.07, "learning_rate": 4.982956355988196e-06, "loss": 0.9276, "step": 3503 }, { "epoch": 0.07, "learning_rate": 4.982938543557758e-06, "loss": 0.8747, "step": 3504 }, { "epoch": 0.07, "learning_rate": 4.982920721856105e-06, "loss": 1.0419, "step": 3505 }, { "epoch": 0.07, "learning_rate": 4.9829028908833015e-06, "loss": 1.1227, "step": 3506 }, { "epoch": 0.07, "learning_rate": 4.982885050639415e-06, "loss": 1.0032, "step": 3507 }, { "epoch": 0.07, "learning_rate": 4.982867201124511e-06, "loss": 1.1064, "step": 3508 }, { "epoch": 0.07, "learning_rate": 4.982849342338658e-06, "loss": 0.99, "step": 3509 }, { "epoch": 0.07, "learning_rate": 4.982831474281922e-06, "loss": 0.9724, "step": 3510 }, { "epoch": 0.07, "learning_rate": 4.982813596954369e-06, "loss": 1.0575, "step": 3511 }, { "epoch": 0.07, "learning_rate": 4.982795710356066e-06, "loss": 1.3264, "step": 3512 }, { "epoch": 0.07, "learning_rate": 4.98277781448708e-06, "loss": 1.0287, "step": 3513 }, { "epoch": 0.07, "learning_rate": 4.982759909347478e-06, "loss": 0.8437, "step": 3514 }, { "epoch": 0.07, "learning_rate": 4.982741994937326e-06, "loss": 0.9621, "step": 3515 }, { "epoch": 0.07, "learning_rate": 4.982724071256691e-06, "loss": 1.0903, "step": 3516 }, { "epoch": 0.07, "learning_rate": 4.9827061383056415e-06, "loss": 0.8887, "step": 3517 }, { "epoch": 0.07, "learning_rate": 4.982688196084244e-06, "loss": 0.9669, "step": 3518 }, { "epoch": 0.07, "learning_rate": 4.982670244592564e-06, "loss": 0.9403, "step": 3519 }, { "epoch": 0.07, "learning_rate": 4.9826522838306695e-06, "loss": 0.892, "step": 3520 }, { "epoch": 0.07, "learning_rate": 4.982634313798627e-06, "loss": 0.9143, "step": 3521 }, { "epoch": 0.07, "learning_rate": 4.982616334496505e-06, "loss": 1.0369, "step": 3522 }, { "epoch": 0.07, "learning_rate": 4.98259834592437e-06, "loss": 1.0155, "step": 3523 }, { "epoch": 0.07, "learning_rate": 4.982580348082287e-06, "loss": 1.0428, "step": 3524 }, { "epoch": 0.07, "learning_rate": 4.982562340970328e-06, "loss": 1.1319, "step": 3525 }, { "epoch": 0.07, "learning_rate": 4.9825443245885545e-06, "loss": 0.9814, "step": 3526 }, { "epoch": 0.07, "learning_rate": 4.982526298937038e-06, "loss": 0.5773, "step": 3527 }, { "epoch": 0.07, "learning_rate": 4.982508264015844e-06, "loss": 1.1201, "step": 3528 }, { "epoch": 0.07, "learning_rate": 4.982490219825041e-06, "loss": 0.9039, "step": 3529 }, { "epoch": 0.07, "learning_rate": 4.9824721663646945e-06, "loss": 1.0887, "step": 3530 }, { "epoch": 0.07, "learning_rate": 4.982454103634874e-06, "loss": 1.077, "step": 3531 }, { "epoch": 0.07, "learning_rate": 4.982436031635646e-06, "loss": 0.9588, "step": 3532 }, { "epoch": 0.07, "learning_rate": 4.982417950367077e-06, "loss": 0.9642, "step": 3533 }, { "epoch": 0.07, "learning_rate": 4.982399859829236e-06, "loss": 0.9312, "step": 3534 }, { "epoch": 0.07, "learning_rate": 4.98238176002219e-06, "loss": 0.8981, "step": 3535 }, { "epoch": 0.07, "learning_rate": 4.982363650946007e-06, "loss": 1.0914, "step": 3536 }, { "epoch": 0.07, "learning_rate": 4.982345532600754e-06, "loss": 1.0825, "step": 3537 }, { "epoch": 0.07, "learning_rate": 4.982327404986499e-06, "loss": 0.7268, "step": 3538 }, { "epoch": 0.07, "learning_rate": 4.982309268103309e-06, "loss": 0.9141, "step": 3539 }, { "epoch": 0.07, "learning_rate": 4.982291121951254e-06, "loss": 0.7985, "step": 3540 }, { "epoch": 0.07, "learning_rate": 4.982272966530398e-06, "loss": 0.8312, "step": 3541 }, { "epoch": 0.07, "learning_rate": 4.982254801840811e-06, "loss": 0.9158, "step": 3542 }, { "epoch": 0.07, "learning_rate": 4.982236627882562e-06, "loss": 1.1357, "step": 3543 }, { "epoch": 0.07, "learning_rate": 4.982218444655716e-06, "loss": 0.9841, "step": 3544 }, { "epoch": 0.07, "learning_rate": 4.982200252160344e-06, "loss": 0.8072, "step": 3545 }, { "epoch": 0.07, "learning_rate": 4.982182050396512e-06, "loss": 0.9999, "step": 3546 }, { "epoch": 0.07, "learning_rate": 4.982163839364288e-06, "loss": 1.0732, "step": 3547 }, { "epoch": 0.07, "learning_rate": 4.98214561906374e-06, "loss": 0.8331, "step": 3548 }, { "epoch": 0.07, "learning_rate": 4.982127389494937e-06, "loss": 1.2279, "step": 3549 }, { "epoch": 0.07, "learning_rate": 4.982109150657945e-06, "loss": 1.131, "step": 3550 }, { "epoch": 0.07, "learning_rate": 4.982090902552835e-06, "loss": 0.9823, "step": 3551 }, { "epoch": 0.07, "learning_rate": 4.982072645179674e-06, "loss": 0.8272, "step": 3552 }, { "epoch": 0.07, "learning_rate": 4.982054378538529e-06, "loss": 0.8274, "step": 3553 }, { "epoch": 0.07, "learning_rate": 4.98203610262947e-06, "loss": 1.1018, "step": 3554 }, { "epoch": 0.07, "learning_rate": 4.9820178174525626e-06, "loss": 1.1415, "step": 3555 }, { "epoch": 0.07, "learning_rate": 4.981999523007877e-06, "loss": 1.0491, "step": 3556 }, { "epoch": 0.07, "learning_rate": 4.981981219295483e-06, "loss": 0.9949, "step": 3557 }, { "epoch": 0.07, "learning_rate": 4.981962906315446e-06, "loss": 0.9981, "step": 3558 }, { "epoch": 0.07, "learning_rate": 4.981944584067836e-06, "loss": 0.8421, "step": 3559 }, { "epoch": 0.07, "learning_rate": 4.981926252552721e-06, "loss": 0.8864, "step": 3560 }, { "epoch": 0.07, "learning_rate": 4.981907911770169e-06, "loss": 1.0494, "step": 3561 }, { "epoch": 0.07, "learning_rate": 4.981889561720249e-06, "loss": 1.0132, "step": 3562 }, { "epoch": 0.07, "learning_rate": 4.98187120240303e-06, "loss": 1.2029, "step": 3563 }, { "epoch": 0.07, "learning_rate": 4.98185283381858e-06, "loss": 0.8888, "step": 3564 }, { "epoch": 0.07, "learning_rate": 4.981834455966967e-06, "loss": 0.8184, "step": 3565 }, { "epoch": 0.07, "learning_rate": 4.981816068848261e-06, "loss": 1.1011, "step": 3566 }, { "epoch": 0.07, "learning_rate": 4.9817976724625295e-06, "loss": 0.9119, "step": 3567 }, { "epoch": 0.07, "learning_rate": 4.981779266809842e-06, "loss": 1.037, "step": 3568 }, { "epoch": 0.07, "learning_rate": 4.981760851890266e-06, "loss": 1.1219, "step": 3569 }, { "epoch": 0.07, "learning_rate": 4.981742427703871e-06, "loss": 1.165, "step": 3570 }, { "epoch": 0.07, "learning_rate": 4.9817239942507265e-06, "loss": 1.0653, "step": 3571 }, { "epoch": 0.07, "learning_rate": 4.9817055515309e-06, "loss": 0.8035, "step": 3572 }, { "epoch": 0.07, "learning_rate": 4.981687099544462e-06, "loss": 0.922, "step": 3573 }, { "epoch": 0.07, "learning_rate": 4.98166863829148e-06, "loss": 0.9923, "step": 3574 }, { "epoch": 0.07, "learning_rate": 4.981650167772023e-06, "loss": 0.8646, "step": 3575 }, { "epoch": 0.07, "learning_rate": 4.981631687986162e-06, "loss": 0.9171, "step": 3576 }, { "epoch": 0.07, "learning_rate": 4.981613198933962e-06, "loss": 0.752, "step": 3577 }, { "epoch": 0.07, "learning_rate": 4.981594700615496e-06, "loss": 0.9963, "step": 3578 }, { "epoch": 0.07, "learning_rate": 4.981576193030831e-06, "loss": 0.9006, "step": 3579 }, { "epoch": 0.07, "learning_rate": 4.981557676180037e-06, "loss": 1.2506, "step": 3580 }, { "epoch": 0.07, "learning_rate": 4.981539150063182e-06, "loss": 1.2732, "step": 3581 }, { "epoch": 0.07, "learning_rate": 4.981520614680336e-06, "loss": 1.1622, "step": 3582 }, { "epoch": 0.07, "learning_rate": 4.981502070031569e-06, "loss": 1.171, "step": 3583 }, { "epoch": 0.07, "learning_rate": 4.9814835161169486e-06, "loss": 1.0374, "step": 3584 }, { "epoch": 0.07, "learning_rate": 4.981464952936544e-06, "loss": 0.8188, "step": 3585 }, { "epoch": 0.07, "learning_rate": 4.9814463804904265e-06, "loss": 0.868, "step": 3586 }, { "epoch": 0.07, "learning_rate": 4.981427798778664e-06, "loss": 1.0541, "step": 3587 }, { "epoch": 0.07, "learning_rate": 4.981409207801327e-06, "loss": 1.1121, "step": 3588 }, { "epoch": 0.07, "learning_rate": 4.981390607558483e-06, "loss": 0.8928, "step": 3589 }, { "epoch": 0.07, "learning_rate": 4.9813719980502025e-06, "loss": 0.9643, "step": 3590 }, { "epoch": 0.07, "learning_rate": 4.981353379276556e-06, "loss": 0.8542, "step": 3591 }, { "epoch": 0.07, "learning_rate": 4.981334751237612e-06, "loss": 0.7961, "step": 3592 }, { "epoch": 0.07, "learning_rate": 4.98131611393344e-06, "loss": 1.1609, "step": 3593 }, { "epoch": 0.07, "learning_rate": 4.981297467364109e-06, "loss": 1.0157, "step": 3594 }, { "epoch": 0.07, "learning_rate": 4.98127881152969e-06, "loss": 0.8755, "step": 3595 }, { "epoch": 0.07, "learning_rate": 4.981260146430251e-06, "loss": 0.8318, "step": 3596 }, { "epoch": 0.07, "learning_rate": 4.981241472065864e-06, "loss": 0.9958, "step": 3597 }, { "epoch": 0.07, "learning_rate": 4.981222788436596e-06, "loss": 0.8707, "step": 3598 }, { "epoch": 0.07, "learning_rate": 4.981204095542519e-06, "loss": 0.9767, "step": 3599 }, { "epoch": 0.07, "learning_rate": 4.981185393383702e-06, "loss": 1.0353, "step": 3600 }, { "epoch": 0.07, "learning_rate": 4.981166681960215e-06, "loss": 0.9965, "step": 3601 }, { "epoch": 0.07, "learning_rate": 4.981147961272127e-06, "loss": 1.0183, "step": 3602 }, { "epoch": 0.07, "learning_rate": 4.98112923131951e-06, "loss": 0.956, "step": 3603 }, { "epoch": 0.07, "learning_rate": 4.981110492102431e-06, "loss": 1.0024, "step": 3604 }, { "epoch": 0.07, "learning_rate": 4.981091743620962e-06, "loss": 0.9692, "step": 3605 }, { "epoch": 0.07, "learning_rate": 4.9810729858751724e-06, "loss": 1.0798, "step": 3606 }, { "epoch": 0.07, "learning_rate": 4.9810542188651326e-06, "loss": 0.9623, "step": 3607 }, { "epoch": 0.07, "learning_rate": 4.981035442590912e-06, "loss": 0.9279, "step": 3608 }, { "epoch": 0.07, "learning_rate": 4.981016657052582e-06, "loss": 0.9354, "step": 3609 }, { "epoch": 0.07, "learning_rate": 4.980997862250211e-06, "loss": 0.9401, "step": 3610 }, { "epoch": 0.07, "learning_rate": 4.980979058183871e-06, "loss": 0.8644, "step": 3611 }, { "epoch": 0.07, "learning_rate": 4.98096024485363e-06, "loss": 1.2329, "step": 3612 }, { "epoch": 0.07, "learning_rate": 4.980941422259561e-06, "loss": 0.9398, "step": 3613 }, { "epoch": 0.07, "learning_rate": 4.980922590401732e-06, "loss": 0.9586, "step": 3614 }, { "epoch": 0.07, "learning_rate": 4.980903749280214e-06, "loss": 1.0322, "step": 3615 }, { "epoch": 0.07, "learning_rate": 4.980884898895078e-06, "loss": 0.8812, "step": 3616 }, { "epoch": 0.07, "learning_rate": 4.980866039246393e-06, "loss": 0.9194, "step": 3617 }, { "epoch": 0.07, "learning_rate": 4.98084717033423e-06, "loss": 1.2552, "step": 3618 }, { "epoch": 0.07, "learning_rate": 4.980828292158661e-06, "loss": 1.0254, "step": 3619 }, { "epoch": 0.07, "learning_rate": 4.980809404719754e-06, "loss": 0.9337, "step": 3620 }, { "epoch": 0.07, "learning_rate": 4.9807905080175815e-06, "loss": 0.9212, "step": 3621 }, { "epoch": 0.07, "learning_rate": 4.980771602052214e-06, "loss": 0.8814, "step": 3622 }, { "epoch": 0.07, "learning_rate": 4.9807526868237196e-06, "loss": 0.8646, "step": 3623 }, { "epoch": 0.07, "learning_rate": 4.9807337623321715e-06, "loss": 1.0438, "step": 3624 }, { "epoch": 0.07, "learning_rate": 4.9807148285776405e-06, "loss": 1.2162, "step": 3625 }, { "epoch": 0.07, "learning_rate": 4.980695885560195e-06, "loss": 0.8445, "step": 3626 }, { "epoch": 0.07, "learning_rate": 4.9806769332799085e-06, "loss": 0.812, "step": 3627 }, { "epoch": 0.07, "learning_rate": 4.98065797173685e-06, "loss": 0.8084, "step": 3628 }, { "epoch": 0.07, "learning_rate": 4.98063900093109e-06, "loss": 0.9166, "step": 3629 }, { "epoch": 0.07, "learning_rate": 4.9806200208627e-06, "loss": 1.0562, "step": 3630 }, { "epoch": 0.07, "learning_rate": 4.9806010315317514e-06, "loss": 1.1666, "step": 3631 }, { "epoch": 0.07, "learning_rate": 4.9805820329383146e-06, "loss": 1.0232, "step": 3632 }, { "epoch": 0.07, "learning_rate": 4.980563025082461e-06, "loss": 0.8986, "step": 3633 }, { "epoch": 0.07, "learning_rate": 4.980544007964261e-06, "loss": 0.9328, "step": 3634 }, { "epoch": 0.07, "learning_rate": 4.980524981583784e-06, "loss": 0.9825, "step": 3635 }, { "epoch": 0.07, "learning_rate": 4.980505945941104e-06, "loss": 1.1586, "step": 3636 }, { "epoch": 0.07, "learning_rate": 4.980486901036292e-06, "loss": 1.196, "step": 3637 }, { "epoch": 0.07, "learning_rate": 4.980467846869417e-06, "loss": 0.9147, "step": 3638 }, { "epoch": 0.07, "learning_rate": 4.9804487834405505e-06, "loss": 1.0403, "step": 3639 }, { "epoch": 0.07, "learning_rate": 4.980429710749765e-06, "loss": 1.0285, "step": 3640 }, { "epoch": 0.07, "learning_rate": 4.980410628797131e-06, "loss": 0.9153, "step": 3641 }, { "epoch": 0.07, "learning_rate": 4.98039153758272e-06, "loss": 1.0002, "step": 3642 }, { "epoch": 0.07, "learning_rate": 4.980372437106602e-06, "loss": 1.1181, "step": 3643 }, { "epoch": 0.07, "learning_rate": 4.980353327368849e-06, "loss": 1.0051, "step": 3644 }, { "epoch": 0.07, "learning_rate": 4.980334208369535e-06, "loss": 0.9365, "step": 3645 }, { "epoch": 0.07, "learning_rate": 4.980315080108728e-06, "loss": 1.0734, "step": 3646 }, { "epoch": 0.07, "learning_rate": 4.9802959425864995e-06, "loss": 1.0977, "step": 3647 }, { "epoch": 0.07, "learning_rate": 4.980276795802923e-06, "loss": 0.7298, "step": 3648 }, { "epoch": 0.07, "learning_rate": 4.98025763975807e-06, "loss": 1.0435, "step": 3649 }, { "epoch": 0.07, "learning_rate": 4.98023847445201e-06, "loss": 1.2069, "step": 3650 }, { "epoch": 0.07, "learning_rate": 4.980219299884814e-06, "loss": 1.0683, "step": 3651 }, { "epoch": 0.07, "learning_rate": 4.9802001160565574e-06, "loss": 0.9041, "step": 3652 }, { "epoch": 0.07, "learning_rate": 4.9801809229673085e-06, "loss": 1.0063, "step": 3653 }, { "epoch": 0.07, "learning_rate": 4.980161720617141e-06, "loss": 0.8745, "step": 3654 }, { "epoch": 0.07, "learning_rate": 4.980142509006125e-06, "loss": 0.9386, "step": 3655 }, { "epoch": 0.07, "learning_rate": 4.980123288134332e-06, "loss": 1.0516, "step": 3656 }, { "epoch": 0.07, "learning_rate": 4.9801040580018364e-06, "loss": 0.9588, "step": 3657 }, { "epoch": 0.07, "learning_rate": 4.980084818608707e-06, "loss": 1.0179, "step": 3658 }, { "epoch": 0.07, "learning_rate": 4.9800655699550185e-06, "loss": 0.8201, "step": 3659 }, { "epoch": 0.07, "learning_rate": 4.98004631204084e-06, "loss": 0.8953, "step": 3660 }, { "epoch": 0.07, "learning_rate": 4.9800270448662445e-06, "loss": 1.1324, "step": 3661 }, { "epoch": 0.07, "learning_rate": 4.980007768431305e-06, "loss": 1.0825, "step": 3662 }, { "epoch": 0.07, "learning_rate": 4.979988482736092e-06, "loss": 0.9499, "step": 3663 }, { "epoch": 0.07, "learning_rate": 4.979969187780678e-06, "loss": 0.9874, "step": 3664 }, { "epoch": 0.07, "learning_rate": 4.979949883565135e-06, "loss": 0.8542, "step": 3665 }, { "epoch": 0.07, "learning_rate": 4.979930570089535e-06, "loss": 0.7964, "step": 3666 }, { "epoch": 0.07, "learning_rate": 4.97991124735395e-06, "loss": 1.0209, "step": 3667 }, { "epoch": 0.07, "learning_rate": 4.979891915358453e-06, "loss": 1.101, "step": 3668 }, { "epoch": 0.07, "learning_rate": 4.979872574103116e-06, "loss": 1.0065, "step": 3669 }, { "epoch": 0.07, "learning_rate": 4.97985322358801e-06, "loss": 0.8552, "step": 3670 }, { "epoch": 0.07, "learning_rate": 4.979833863813209e-06, "loss": 0.913, "step": 3671 }, { "epoch": 0.07, "learning_rate": 4.979814494778784e-06, "loss": 0.9487, "step": 3672 }, { "epoch": 0.07, "learning_rate": 4.979795116484808e-06, "loss": 0.9656, "step": 3673 }, { "epoch": 0.07, "learning_rate": 4.979775728931352e-06, "loss": 1.1848, "step": 3674 }, { "epoch": 0.07, "learning_rate": 4.97975633211849e-06, "loss": 1.344, "step": 3675 }, { "epoch": 0.07, "learning_rate": 4.979736926046295e-06, "loss": 0.9601, "step": 3676 }, { "epoch": 0.07, "learning_rate": 4.979717510714837e-06, "loss": 0.9229, "step": 3677 }, { "epoch": 0.07, "learning_rate": 4.97969808612419e-06, "loss": 1.0349, "step": 3678 }, { "epoch": 0.07, "learning_rate": 4.979678652274427e-06, "loss": 0.8598, "step": 3679 }, { "epoch": 0.07, "learning_rate": 4.979659209165619e-06, "loss": 0.9028, "step": 3680 }, { "epoch": 0.07, "learning_rate": 4.97963975679784e-06, "loss": 1.1285, "step": 3681 }, { "epoch": 0.07, "learning_rate": 4.979620295171163e-06, "loss": 1.2078, "step": 3682 }, { "epoch": 0.07, "learning_rate": 4.979600824285659e-06, "loss": 0.8224, "step": 3683 }, { "epoch": 0.07, "learning_rate": 4.979581344141401e-06, "loss": 0.7488, "step": 3684 }, { "epoch": 0.07, "learning_rate": 4.979561854738463e-06, "loss": 0.8998, "step": 3685 }, { "epoch": 0.07, "learning_rate": 4.979542356076918e-06, "loss": 1.068, "step": 3686 }, { "epoch": 0.07, "learning_rate": 4.979522848156836e-06, "loss": 1.1832, "step": 3687 }, { "epoch": 0.07, "learning_rate": 4.979503330978293e-06, "loss": 0.9995, "step": 3688 }, { "epoch": 0.07, "learning_rate": 4.9794838045413596e-06, "loss": 0.8135, "step": 3689 }, { "epoch": 0.07, "learning_rate": 4.9794642688461104e-06, "loss": 0.862, "step": 3690 }, { "epoch": 0.07, "learning_rate": 4.979444723892618e-06, "loss": 1.0151, "step": 3691 }, { "epoch": 0.07, "learning_rate": 4.979425169680955e-06, "loss": 0.9325, "step": 3692 }, { "epoch": 0.07, "learning_rate": 4.979405606211193e-06, "loss": 1.0247, "step": 3693 }, { "epoch": 0.07, "learning_rate": 4.979386033483407e-06, "loss": 1.1231, "step": 3694 }, { "epoch": 0.07, "learning_rate": 4.9793664514976705e-06, "loss": 0.9477, "step": 3695 }, { "epoch": 0.07, "learning_rate": 4.979346860254055e-06, "loss": 0.9156, "step": 3696 }, { "epoch": 0.07, "learning_rate": 4.979327259752635e-06, "loss": 0.8607, "step": 3697 }, { "epoch": 0.07, "learning_rate": 4.9793076499934824e-06, "loss": 0.8752, "step": 3698 }, { "epoch": 0.07, "learning_rate": 4.979288030976671e-06, "loss": 1.103, "step": 3699 }, { "epoch": 0.07, "learning_rate": 4.9792684027022744e-06, "loss": 1.0961, "step": 3700 }, { "epoch": 0.07, "learning_rate": 4.979248765170366e-06, "loss": 1.0062, "step": 3701 }, { "epoch": 0.07, "learning_rate": 4.979229118381018e-06, "loss": 0.844, "step": 3702 }, { "epoch": 0.07, "learning_rate": 4.979209462334305e-06, "loss": 0.9437, "step": 3703 }, { "epoch": 0.07, "learning_rate": 4.979189797030299e-06, "loss": 0.9199, "step": 3704 }, { "epoch": 0.07, "learning_rate": 4.979170122469075e-06, "loss": 1.0142, "step": 3705 }, { "epoch": 0.07, "learning_rate": 4.9791504386507065e-06, "loss": 1.2106, "step": 3706 }, { "epoch": 0.07, "learning_rate": 4.979130745575265e-06, "loss": 0.9476, "step": 3707 }, { "epoch": 0.07, "learning_rate": 4.9791110432428255e-06, "loss": 0.9694, "step": 3708 }, { "epoch": 0.07, "learning_rate": 4.979091331653462e-06, "loss": 0.9162, "step": 3709 }, { "epoch": 0.07, "learning_rate": 4.9790716108072474e-06, "loss": 0.8182, "step": 3710 }, { "epoch": 0.07, "learning_rate": 4.979051880704256e-06, "loss": 1.107, "step": 3711 }, { "epoch": 0.07, "learning_rate": 4.979032141344559e-06, "loss": 1.1675, "step": 3712 }, { "epoch": 0.07, "learning_rate": 4.979012392728233e-06, "loss": 1.0885, "step": 3713 }, { "epoch": 0.07, "learning_rate": 4.978992634855351e-06, "loss": 1.1115, "step": 3714 }, { "epoch": 0.07, "learning_rate": 4.978972867725986e-06, "loss": 0.8426, "step": 3715 }, { "epoch": 0.07, "learning_rate": 4.978953091340213e-06, "loss": 0.8027, "step": 3716 }, { "epoch": 0.07, "learning_rate": 4.978933305698105e-06, "loss": 1.0245, "step": 3717 }, { "epoch": 0.07, "learning_rate": 4.9789135107997354e-06, "loss": 1.0195, "step": 3718 }, { "epoch": 0.07, "learning_rate": 4.97889370664518e-06, "loss": 1.0836, "step": 3719 }, { "epoch": 0.07, "learning_rate": 4.9788738932345095e-06, "loss": 1.0291, "step": 3720 }, { "epoch": 0.07, "learning_rate": 4.978854070567801e-06, "loss": 0.9451, "step": 3721 }, { "epoch": 0.07, "learning_rate": 4.978834238645129e-06, "loss": 0.8564, "step": 3722 }, { "epoch": 0.07, "learning_rate": 4.978814397466564e-06, "loss": 0.8019, "step": 3723 }, { "epoch": 0.07, "learning_rate": 4.978794547032182e-06, "loss": 0.8813, "step": 3724 }, { "epoch": 0.07, "learning_rate": 4.978774687342057e-06, "loss": 1.1394, "step": 3725 }, { "epoch": 0.07, "learning_rate": 4.978754818396264e-06, "loss": 0.7776, "step": 3726 }, { "epoch": 0.07, "learning_rate": 4.978734940194877e-06, "loss": 0.8604, "step": 3727 }, { "epoch": 0.07, "learning_rate": 4.978715052737969e-06, "loss": 1.1328, "step": 3728 }, { "epoch": 0.07, "learning_rate": 4.978695156025615e-06, "loss": 1.0308, "step": 3729 }, { "epoch": 0.07, "learning_rate": 4.97867525005789e-06, "loss": 0.9891, "step": 3730 }, { "epoch": 0.07, "learning_rate": 4.9786553348348664e-06, "loss": 1.1271, "step": 3731 }, { "epoch": 0.07, "learning_rate": 4.978635410356621e-06, "loss": 0.9789, "step": 3732 }, { "epoch": 0.07, "learning_rate": 4.978615476623226e-06, "loss": 0.9322, "step": 3733 }, { "epoch": 0.07, "learning_rate": 4.978595533634758e-06, "loss": 0.9089, "step": 3734 }, { "epoch": 0.07, "learning_rate": 4.97857558139129e-06, "loss": 1.0579, "step": 3735 }, { "epoch": 0.07, "learning_rate": 4.978555619892896e-06, "loss": 0.9351, "step": 3736 }, { "epoch": 0.07, "learning_rate": 4.978535649139651e-06, "loss": 0.8878, "step": 3737 }, { "epoch": 0.07, "learning_rate": 4.9785156691316304e-06, "loss": 1.0033, "step": 3738 }, { "epoch": 0.07, "learning_rate": 4.978495679868909e-06, "loss": 0.9702, "step": 3739 }, { "epoch": 0.07, "learning_rate": 4.97847568135156e-06, "loss": 0.9442, "step": 3740 }, { "epoch": 0.07, "learning_rate": 4.978455673579659e-06, "loss": 0.9145, "step": 3741 }, { "epoch": 0.07, "learning_rate": 4.97843565655328e-06, "loss": 1.0471, "step": 3742 }, { "epoch": 0.07, "learning_rate": 4.978415630272499e-06, "loss": 0.9273, "step": 3743 }, { "epoch": 0.07, "learning_rate": 4.978395594737389e-06, "loss": 1.0178, "step": 3744 }, { "epoch": 0.07, "learning_rate": 4.978375549948027e-06, "loss": 1.0748, "step": 3745 }, { "epoch": 0.07, "learning_rate": 4.978355495904485e-06, "loss": 0.9439, "step": 3746 }, { "epoch": 0.07, "learning_rate": 4.9783354326068415e-06, "loss": 1.199, "step": 3747 }, { "epoch": 0.07, "learning_rate": 4.978315360055169e-06, "loss": 0.8748, "step": 3748 }, { "epoch": 0.07, "learning_rate": 4.978295278249542e-06, "loss": 1.1298, "step": 3749 }, { "epoch": 0.07, "learning_rate": 4.978275187190038e-06, "loss": 0.9539, "step": 3750 }, { "epoch": 0.07, "learning_rate": 4.978255086876729e-06, "loss": 0.9055, "step": 3751 }, { "epoch": 0.07, "learning_rate": 4.978234977309692e-06, "loss": 0.7688, "step": 3752 }, { "epoch": 0.07, "learning_rate": 4.978214858489002e-06, "loss": 1.0659, "step": 3753 }, { "epoch": 0.07, "learning_rate": 4.978194730414733e-06, "loss": 0.8212, "step": 3754 }, { "epoch": 0.07, "learning_rate": 4.978174593086961e-06, "loss": 0.908, "step": 3755 }, { "epoch": 0.07, "learning_rate": 4.978154446505762e-06, "loss": 1.0976, "step": 3756 }, { "epoch": 0.07, "learning_rate": 4.9781342906712096e-06, "loss": 1.0159, "step": 3757 }, { "epoch": 0.07, "learning_rate": 4.978114125583379e-06, "loss": 0.8536, "step": 3758 }, { "epoch": 0.07, "learning_rate": 4.978093951242347e-06, "loss": 0.8913, "step": 3759 }, { "epoch": 0.07, "learning_rate": 4.978073767648189e-06, "loss": 0.8714, "step": 3760 }, { "epoch": 0.07, "learning_rate": 4.978053574800977e-06, "loss": 1.0112, "step": 3761 }, { "epoch": 0.07, "learning_rate": 4.978033372700791e-06, "loss": 0.9559, "step": 3762 }, { "epoch": 0.07, "learning_rate": 4.978013161347703e-06, "loss": 1.1418, "step": 3763 }, { "epoch": 0.07, "learning_rate": 4.9779929407417915e-06, "loss": 0.7731, "step": 3764 }, { "epoch": 0.07, "learning_rate": 4.977972710883129e-06, "loss": 0.8939, "step": 3765 }, { "epoch": 0.07, "learning_rate": 4.977952471771793e-06, "loss": 0.884, "step": 3766 }, { "epoch": 0.07, "learning_rate": 4.977932223407859e-06, "loss": 1.0027, "step": 3767 }, { "epoch": 0.07, "learning_rate": 4.977911965791401e-06, "loss": 1.2309, "step": 3768 }, { "epoch": 0.07, "learning_rate": 4.977891698922496e-06, "loss": 0.9195, "step": 3769 }, { "epoch": 0.07, "learning_rate": 4.97787142280122e-06, "loss": 0.9739, "step": 3770 }, { "epoch": 0.07, "learning_rate": 4.977851137427647e-06, "loss": 0.8149, "step": 3771 }, { "epoch": 0.07, "learning_rate": 4.977830842801855e-06, "loss": 0.9088, "step": 3772 }, { "epoch": 0.07, "learning_rate": 4.977810538923917e-06, "loss": 0.9686, "step": 3773 }, { "epoch": 0.07, "learning_rate": 4.977790225793912e-06, "loss": 1.079, "step": 3774 }, { "epoch": 0.07, "learning_rate": 4.977769903411914e-06, "loss": 1.3582, "step": 3775 }, { "epoch": 0.07, "learning_rate": 4.977749571777998e-06, "loss": 1.061, "step": 3776 }, { "epoch": 0.07, "learning_rate": 4.977729230892242e-06, "loss": 0.8937, "step": 3777 }, { "epoch": 0.07, "learning_rate": 4.977708880754721e-06, "loss": 0.8828, "step": 3778 }, { "epoch": 0.07, "learning_rate": 4.977688521365512e-06, "loss": 0.8947, "step": 3779 }, { "epoch": 0.07, "learning_rate": 4.977668152724689e-06, "loss": 0.9257, "step": 3780 }, { "epoch": 0.07, "learning_rate": 4.977647774832328e-06, "loss": 1.2372, "step": 3781 }, { "epoch": 0.07, "learning_rate": 4.977627387688507e-06, "loss": 1.1165, "step": 3782 }, { "epoch": 0.07, "learning_rate": 4.977606991293301e-06, "loss": 0.6917, "step": 3783 }, { "epoch": 0.07, "learning_rate": 4.977586585646788e-06, "loss": 1.0601, "step": 3784 }, { "epoch": 0.07, "learning_rate": 4.977566170749042e-06, "loss": 1.0621, "step": 3785 }, { "epoch": 0.07, "learning_rate": 4.977545746600139e-06, "loss": 1.0172, "step": 3786 }, { "epoch": 0.07, "learning_rate": 4.9775253132001564e-06, "loss": 1.2426, "step": 3787 }, { "epoch": 0.07, "learning_rate": 4.97750487054917e-06, "loss": 1.1674, "step": 3788 }, { "epoch": 0.07, "learning_rate": 4.977484418647257e-06, "loss": 0.8859, "step": 3789 }, { "epoch": 0.07, "learning_rate": 4.977463957494493e-06, "loss": 0.7819, "step": 3790 }, { "epoch": 0.07, "learning_rate": 4.977443487090955e-06, "loss": 0.8658, "step": 3791 }, { "epoch": 0.07, "learning_rate": 4.9774230074367184e-06, "loss": 0.832, "step": 3792 }, { "epoch": 0.07, "learning_rate": 4.9774025185318605e-06, "loss": 0.973, "step": 3793 }, { "epoch": 0.07, "learning_rate": 4.977382020376457e-06, "loss": 0.9369, "step": 3794 }, { "epoch": 0.07, "learning_rate": 4.9773615129705855e-06, "loss": 1.0889, "step": 3795 }, { "epoch": 0.07, "learning_rate": 4.977340996314323e-06, "loss": 0.8191, "step": 3796 }, { "epoch": 0.07, "learning_rate": 4.9773204704077436e-06, "loss": 0.9746, "step": 3797 }, { "epoch": 0.07, "learning_rate": 4.977299935250926e-06, "loss": 0.9837, "step": 3798 }, { "epoch": 0.07, "learning_rate": 4.977279390843946e-06, "loss": 1.1594, "step": 3799 }, { "epoch": 0.07, "learning_rate": 4.977258837186881e-06, "loss": 1.3561, "step": 3800 }, { "epoch": 0.07, "learning_rate": 4.977238274279808e-06, "loss": 0.9386, "step": 3801 }, { "epoch": 0.07, "learning_rate": 4.977217702122803e-06, "loss": 0.7007, "step": 3802 }, { "epoch": 0.07, "learning_rate": 4.977197120715943e-06, "loss": 1.0199, "step": 3803 }, { "epoch": 0.07, "learning_rate": 4.977176530059305e-06, "loss": 0.9286, "step": 3804 }, { "epoch": 0.07, "learning_rate": 4.977155930152965e-06, "loss": 1.1139, "step": 3805 }, { "epoch": 0.07, "learning_rate": 4.977135320997002e-06, "loss": 1.0304, "step": 3806 }, { "epoch": 0.07, "learning_rate": 4.977114702591491e-06, "loss": 1.0961, "step": 3807 }, { "epoch": 0.07, "learning_rate": 4.977094074936509e-06, "loss": 1.1013, "step": 3808 }, { "epoch": 0.07, "learning_rate": 4.977073438032135e-06, "loss": 0.8455, "step": 3809 }, { "epoch": 0.07, "learning_rate": 4.977052791878444e-06, "loss": 1.0335, "step": 3810 }, { "epoch": 0.07, "learning_rate": 4.977032136475514e-06, "loss": 0.8773, "step": 3811 }, { "epoch": 0.07, "learning_rate": 4.977011471823422e-06, "loss": 1.0486, "step": 3812 }, { "epoch": 0.07, "learning_rate": 4.976990797922244e-06, "loss": 1.1914, "step": 3813 }, { "epoch": 0.07, "learning_rate": 4.976970114772059e-06, "loss": 0.9557, "step": 3814 }, { "epoch": 0.07, "learning_rate": 4.976949422372944e-06, "loss": 0.8121, "step": 3815 }, { "epoch": 0.07, "learning_rate": 4.976928720724976e-06, "loss": 0.8326, "step": 3816 }, { "epoch": 0.07, "learning_rate": 4.976908009828232e-06, "loss": 0.8237, "step": 3817 }, { "epoch": 0.07, "learning_rate": 4.976887289682789e-06, "loss": 1.0934, "step": 3818 }, { "epoch": 0.07, "learning_rate": 4.976866560288724e-06, "loss": 1.1943, "step": 3819 }, { "epoch": 0.07, "learning_rate": 4.976845821646117e-06, "loss": 0.9642, "step": 3820 }, { "epoch": 0.07, "learning_rate": 4.976825073755043e-06, "loss": 0.9846, "step": 3821 }, { "epoch": 0.07, "learning_rate": 4.97680431661558e-06, "loss": 0.8671, "step": 3822 }, { "epoch": 0.07, "learning_rate": 4.976783550227805e-06, "loss": 0.9437, "step": 3823 }, { "epoch": 0.07, "learning_rate": 4.976762774591797e-06, "loss": 1.1081, "step": 3824 }, { "epoch": 0.07, "learning_rate": 4.9767419897076315e-06, "loss": 1.114, "step": 3825 }, { "epoch": 0.07, "learning_rate": 4.9767211955753895e-06, "loss": 1.0949, "step": 3826 }, { "epoch": 0.07, "learning_rate": 4.976700392195145e-06, "loss": 0.7855, "step": 3827 }, { "epoch": 0.07, "learning_rate": 4.9766795795669775e-06, "loss": 0.9514, "step": 3828 }, { "epoch": 0.07, "learning_rate": 4.976658757690964e-06, "loss": 0.8779, "step": 3829 }, { "epoch": 0.07, "learning_rate": 4.976637926567183e-06, "loss": 1.0879, "step": 3830 }, { "epoch": 0.07, "learning_rate": 4.976617086195712e-06, "loss": 0.9839, "step": 3831 }, { "epoch": 0.07, "learning_rate": 4.976596236576628e-06, "loss": 1.2102, "step": 3832 }, { "epoch": 0.07, "learning_rate": 4.976575377710011e-06, "loss": 0.8121, "step": 3833 }, { "epoch": 0.07, "learning_rate": 4.976554509595937e-06, "loss": 1.0455, "step": 3834 }, { "epoch": 0.07, "learning_rate": 4.976533632234484e-06, "loss": 0.8283, "step": 3835 }, { "epoch": 0.07, "learning_rate": 4.97651274562573e-06, "loss": 1.0037, "step": 3836 }, { "epoch": 0.07, "learning_rate": 4.976491849769753e-06, "loss": 0.7627, "step": 3837 }, { "epoch": 0.07, "learning_rate": 4.976470944666633e-06, "loss": 1.0099, "step": 3838 }, { "epoch": 0.07, "learning_rate": 4.9764500303164455e-06, "loss": 0.9846, "step": 3839 }, { "epoch": 0.07, "learning_rate": 4.97642910671927e-06, "loss": 0.8997, "step": 3840 }, { "epoch": 0.07, "learning_rate": 4.976408173875183e-06, "loss": 0.7609, "step": 3841 }, { "epoch": 0.07, "learning_rate": 4.976387231784265e-06, "loss": 0.9171, "step": 3842 }, { "epoch": 0.07, "learning_rate": 4.976366280446592e-06, "loss": 0.9107, "step": 3843 }, { "epoch": 0.07, "learning_rate": 4.976345319862244e-06, "loss": 1.0169, "step": 3844 }, { "epoch": 0.07, "learning_rate": 4.976324350031298e-06, "loss": 1.0068, "step": 3845 }, { "epoch": 0.07, "learning_rate": 4.976303370953833e-06, "loss": 0.7914, "step": 3846 }, { "epoch": 0.07, "learning_rate": 4.976282382629927e-06, "loss": 0.8511, "step": 3847 }, { "epoch": 0.07, "learning_rate": 4.976261385059658e-06, "loss": 0.8972, "step": 3848 }, { "epoch": 0.07, "learning_rate": 4.9762403782431065e-06, "loss": 1.1442, "step": 3849 }, { "epoch": 0.07, "learning_rate": 4.976219362180348e-06, "loss": 1.1052, "step": 3850 }, { "epoch": 0.07, "learning_rate": 4.976198336871463e-06, "loss": 1.0191, "step": 3851 }, { "epoch": 0.07, "learning_rate": 4.976177302316529e-06, "loss": 1.0275, "step": 3852 }, { "epoch": 0.07, "learning_rate": 4.976156258515626e-06, "loss": 1.0981, "step": 3853 }, { "epoch": 0.07, "learning_rate": 4.9761352054688296e-06, "loss": 0.9512, "step": 3854 }, { "epoch": 0.07, "learning_rate": 4.976114143176221e-06, "loss": 0.9174, "step": 3855 }, { "epoch": 0.07, "learning_rate": 4.976093071637879e-06, "loss": 0.9856, "step": 3856 }, { "epoch": 0.07, "learning_rate": 4.97607199085388e-06, "loss": 1.0963, "step": 3857 }, { "epoch": 0.07, "learning_rate": 4.976050900824304e-06, "loss": 1.0305, "step": 3858 }, { "epoch": 0.07, "learning_rate": 4.976029801549232e-06, "loss": 0.8409, "step": 3859 }, { "epoch": 0.07, "learning_rate": 4.9760086930287385e-06, "loss": 0.9193, "step": 3860 }, { "epoch": 0.07, "learning_rate": 4.975987575262905e-06, "loss": 0.9218, "step": 3861 }, { "epoch": 0.07, "learning_rate": 4.97596644825181e-06, "loss": 1.1969, "step": 3862 }, { "epoch": 0.07, "learning_rate": 4.975945311995533e-06, "loss": 1.0385, "step": 3863 }, { "epoch": 0.07, "learning_rate": 4.97592416649415e-06, "loss": 0.9554, "step": 3864 }, { "epoch": 0.07, "learning_rate": 4.975903011747744e-06, "loss": 0.9333, "step": 3865 }, { "epoch": 0.07, "learning_rate": 4.975881847756391e-06, "loss": 1.0499, "step": 3866 }, { "epoch": 0.07, "learning_rate": 4.975860674520172e-06, "loss": 0.9231, "step": 3867 }, { "epoch": 0.07, "learning_rate": 4.975839492039165e-06, "loss": 1.2477, "step": 3868 }, { "epoch": 0.07, "learning_rate": 4.9758183003134485e-06, "loss": 1.0789, "step": 3869 }, { "epoch": 0.07, "learning_rate": 4.975797099343103e-06, "loss": 1.0739, "step": 3870 }, { "epoch": 0.07, "learning_rate": 4.975775889128207e-06, "loss": 1.0067, "step": 3871 }, { "epoch": 0.07, "learning_rate": 4.975754669668839e-06, "loss": 0.8505, "step": 3872 }, { "epoch": 0.07, "learning_rate": 4.9757334409650795e-06, "loss": 0.8099, "step": 3873 }, { "epoch": 0.07, "learning_rate": 4.975712203017007e-06, "loss": 1.2428, "step": 3874 }, { "epoch": 0.07, "learning_rate": 4.975690955824701e-06, "loss": 1.1491, "step": 3875 }, { "epoch": 0.07, "learning_rate": 4.975669699388242e-06, "loss": 0.9119, "step": 3876 }, { "epoch": 0.07, "learning_rate": 4.975648433707707e-06, "loss": 0.8892, "step": 3877 }, { "epoch": 0.07, "learning_rate": 4.9756271587831776e-06, "loss": 0.9938, "step": 3878 }, { "epoch": 0.07, "learning_rate": 4.975605874614732e-06, "loss": 0.9202, "step": 3879 }, { "epoch": 0.07, "learning_rate": 4.9755845812024495e-06, "loss": 1.2784, "step": 3880 }, { "epoch": 0.07, "learning_rate": 4.97556327854641e-06, "loss": 1.1349, "step": 3881 }, { "epoch": 0.07, "learning_rate": 4.975541966646694e-06, "loss": 1.2244, "step": 3882 }, { "epoch": 0.07, "learning_rate": 4.975520645503379e-06, "loss": 0.7502, "step": 3883 }, { "epoch": 0.07, "learning_rate": 4.975499315116547e-06, "loss": 0.8, "step": 3884 }, { "epoch": 0.07, "learning_rate": 4.975477975486276e-06, "loss": 0.8865, "step": 3885 }, { "epoch": 0.07, "learning_rate": 4.9754566266126454e-06, "loss": 1.0075, "step": 3886 }, { "epoch": 0.07, "learning_rate": 4.9754352684957365e-06, "loss": 1.1052, "step": 3887 }, { "epoch": 0.07, "learning_rate": 4.975413901135629e-06, "loss": 0.9263, "step": 3888 }, { "epoch": 0.07, "learning_rate": 4.975392524532399e-06, "loss": 1.0759, "step": 3889 }, { "epoch": 0.07, "learning_rate": 4.975371138686132e-06, "loss": 0.7293, "step": 3890 }, { "epoch": 0.07, "learning_rate": 4.975349743596904e-06, "loss": 1.1114, "step": 3891 }, { "epoch": 0.07, "learning_rate": 4.975328339264797e-06, "loss": 0.9938, "step": 3892 }, { "epoch": 0.07, "learning_rate": 4.975306925689888e-06, "loss": 1.0812, "step": 3893 }, { "epoch": 0.07, "learning_rate": 4.97528550287226e-06, "loss": 1.2065, "step": 3894 }, { "epoch": 0.07, "learning_rate": 4.975264070811992e-06, "loss": 0.9875, "step": 3895 }, { "epoch": 0.07, "learning_rate": 4.975242629509164e-06, "loss": 0.7175, "step": 3896 }, { "epoch": 0.07, "learning_rate": 4.975221178963855e-06, "loss": 0.7041, "step": 3897 }, { "epoch": 0.07, "learning_rate": 4.975199719176146e-06, "loss": 0.8685, "step": 3898 }, { "epoch": 0.07, "learning_rate": 4.975178250146117e-06, "loss": 0.8256, "step": 3899 }, { "epoch": 0.07, "learning_rate": 4.97515677187385e-06, "loss": 1.2334, "step": 3900 }, { "epoch": 0.07, "learning_rate": 4.975135284359423e-06, "loss": 0.9751, "step": 3901 }, { "epoch": 0.07, "learning_rate": 4.975113787602916e-06, "loss": 0.9695, "step": 3902 }, { "epoch": 0.07, "learning_rate": 4.97509228160441e-06, "loss": 1.122, "step": 3903 }, { "epoch": 0.07, "learning_rate": 4.975070766363985e-06, "loss": 0.7853, "step": 3904 }, { "epoch": 0.07, "learning_rate": 4.975049241881722e-06, "loss": 1.1747, "step": 3905 }, { "epoch": 0.07, "learning_rate": 4.975027708157701e-06, "loss": 1.1812, "step": 3906 }, { "epoch": 0.07, "learning_rate": 4.975006165192003e-06, "loss": 0.8913, "step": 3907 }, { "epoch": 0.07, "learning_rate": 4.9749846129847075e-06, "loss": 0.7385, "step": 3908 }, { "epoch": 0.07, "learning_rate": 4.974963051535895e-06, "loss": 1.1142, "step": 3909 }, { "epoch": 0.07, "learning_rate": 4.9749414808456465e-06, "loss": 0.9731, "step": 3910 }, { "epoch": 0.07, "learning_rate": 4.974919900914043e-06, "loss": 1.0775, "step": 3911 }, { "epoch": 0.07, "learning_rate": 4.974898311741164e-06, "loss": 1.275, "step": 3912 }, { "epoch": 0.07, "learning_rate": 4.97487671332709e-06, "loss": 0.9505, "step": 3913 }, { "epoch": 0.07, "learning_rate": 4.974855105671903e-06, "loss": 1.0584, "step": 3914 }, { "epoch": 0.07, "learning_rate": 4.974833488775682e-06, "loss": 0.8509, "step": 3915 }, { "epoch": 0.07, "learning_rate": 4.97481186263851e-06, "loss": 0.7829, "step": 3916 }, { "epoch": 0.07, "learning_rate": 4.974790227260466e-06, "loss": 1.0163, "step": 3917 }, { "epoch": 0.07, "learning_rate": 4.97476858264163e-06, "loss": 1.1557, "step": 3918 }, { "epoch": 0.07, "learning_rate": 4.974746928782086e-06, "loss": 1.0769, "step": 3919 }, { "epoch": 0.07, "learning_rate": 4.974725265681911e-06, "loss": 1.0295, "step": 3920 }, { "epoch": 0.07, "learning_rate": 4.974703593341189e-06, "loss": 1.0438, "step": 3921 }, { "epoch": 0.07, "learning_rate": 4.974681911759999e-06, "loss": 1.0585, "step": 3922 }, { "epoch": 0.07, "learning_rate": 4.974660220938422e-06, "loss": 0.846, "step": 3923 }, { "epoch": 0.07, "learning_rate": 4.974638520876541e-06, "loss": 0.8881, "step": 3924 }, { "epoch": 0.07, "learning_rate": 4.974616811574435e-06, "loss": 0.9895, "step": 3925 }, { "epoch": 0.07, "learning_rate": 4.974595093032185e-06, "loss": 0.7957, "step": 3926 }, { "epoch": 0.07, "learning_rate": 4.974573365249874e-06, "loss": 0.9982, "step": 3927 }, { "epoch": 0.07, "learning_rate": 4.974551628227582e-06, "loss": 1.1215, "step": 3928 }, { "epoch": 0.07, "learning_rate": 4.974529881965389e-06, "loss": 0.9199, "step": 3929 }, { "epoch": 0.07, "learning_rate": 4.9745081264633774e-06, "loss": 0.938, "step": 3930 }, { "epoch": 0.07, "learning_rate": 4.974486361721628e-06, "loss": 1.3779, "step": 3931 }, { "epoch": 0.07, "learning_rate": 4.974464587740225e-06, "loss": 0.802, "step": 3932 }, { "epoch": 0.07, "learning_rate": 4.974442804519244e-06, "loss": 0.8661, "step": 3933 }, { "epoch": 0.07, "learning_rate": 4.974421012058771e-06, "loss": 1.0377, "step": 3934 }, { "epoch": 0.07, "learning_rate": 4.974399210358886e-06, "loss": 0.8987, "step": 3935 }, { "epoch": 0.07, "learning_rate": 4.9743773994196684e-06, "loss": 1.0711, "step": 3936 }, { "epoch": 0.07, "learning_rate": 4.974355579241204e-06, "loss": 1.1873, "step": 3937 }, { "epoch": 0.07, "learning_rate": 4.97433374982357e-06, "loss": 1.0342, "step": 3938 }, { "epoch": 0.07, "learning_rate": 4.97431191116685e-06, "loss": 0.9335, "step": 3939 }, { "epoch": 0.07, "learning_rate": 4.974290063271125e-06, "loss": 0.949, "step": 3940 }, { "epoch": 0.07, "learning_rate": 4.974268206136477e-06, "loss": 0.9611, "step": 3941 }, { "epoch": 0.07, "learning_rate": 4.974246339762987e-06, "loss": 1.0013, "step": 3942 }, { "epoch": 0.07, "learning_rate": 4.974224464150738e-06, "loss": 1.1625, "step": 3943 }, { "epoch": 0.07, "learning_rate": 4.974202579299811e-06, "loss": 1.002, "step": 3944 }, { "epoch": 0.07, "learning_rate": 4.974180685210286e-06, "loss": 0.8806, "step": 3945 }, { "epoch": 0.07, "learning_rate": 4.974158781882247e-06, "loss": 0.965, "step": 3946 }, { "epoch": 0.07, "learning_rate": 4.974136869315774e-06, "loss": 0.989, "step": 3947 }, { "epoch": 0.07, "learning_rate": 4.974114947510951e-06, "loss": 0.7887, "step": 3948 }, { "epoch": 0.07, "learning_rate": 4.974093016467858e-06, "loss": 0.9343, "step": 3949 }, { "epoch": 0.07, "learning_rate": 4.974071076186578e-06, "loss": 1.0756, "step": 3950 }, { "epoch": 0.07, "learning_rate": 4.974049126667192e-06, "loss": 0.9724, "step": 3951 }, { "epoch": 0.07, "learning_rate": 4.974027167909782e-06, "loss": 0.8852, "step": 3952 }, { "epoch": 0.07, "learning_rate": 4.974005199914431e-06, "loss": 0.991, "step": 3953 }, { "epoch": 0.07, "learning_rate": 4.973983222681222e-06, "loss": 0.9803, "step": 3954 }, { "epoch": 0.07, "learning_rate": 4.973961236210233e-06, "loss": 0.9916, "step": 3955 }, { "epoch": 0.07, "learning_rate": 4.973939240501549e-06, "loss": 0.965, "step": 3956 }, { "epoch": 0.07, "learning_rate": 4.973917235555252e-06, "loss": 0.9819, "step": 3957 }, { "epoch": 0.07, "learning_rate": 4.973895221371425e-06, "loss": 0.8902, "step": 3958 }, { "epoch": 0.07, "learning_rate": 4.973873197950148e-06, "loss": 0.9692, "step": 3959 }, { "epoch": 0.07, "learning_rate": 4.973851165291504e-06, "loss": 0.9435, "step": 3960 }, { "epoch": 0.07, "learning_rate": 4.9738291233955775e-06, "loss": 0.8471, "step": 3961 }, { "epoch": 0.07, "learning_rate": 4.973807072262446e-06, "loss": 1.0884, "step": 3962 }, { "epoch": 0.07, "learning_rate": 4.973785011892197e-06, "loss": 1.1969, "step": 3963 }, { "epoch": 0.07, "learning_rate": 4.97376294228491e-06, "loss": 1.0203, "step": 3964 }, { "epoch": 0.07, "learning_rate": 4.973740863440668e-06, "loss": 1.0667, "step": 3965 }, { "epoch": 0.07, "learning_rate": 4.973718775359554e-06, "loss": 1.1339, "step": 3966 }, { "epoch": 0.07, "learning_rate": 4.973696678041649e-06, "loss": 1.1981, "step": 3967 }, { "epoch": 0.07, "learning_rate": 4.973674571487037e-06, "loss": 1.0098, "step": 3968 }, { "epoch": 0.07, "learning_rate": 4.9736524556958e-06, "loss": 1.0874, "step": 3969 }, { "epoch": 0.07, "learning_rate": 4.97363033066802e-06, "loss": 1.0778, "step": 3970 }, { "epoch": 0.07, "learning_rate": 4.97360819640378e-06, "loss": 0.9659, "step": 3971 }, { "epoch": 0.07, "learning_rate": 4.973586052903164e-06, "loss": 0.6995, "step": 3972 }, { "epoch": 0.07, "learning_rate": 4.973563900166253e-06, "loss": 0.8518, "step": 3973 }, { "epoch": 0.07, "learning_rate": 4.97354173819313e-06, "loss": 1.0796, "step": 3974 }, { "epoch": 0.07, "learning_rate": 4.973519566983878e-06, "loss": 1.0592, "step": 3975 }, { "epoch": 0.08, "learning_rate": 4.97349738653858e-06, "loss": 0.9473, "step": 3976 }, { "epoch": 0.08, "learning_rate": 4.973475196857319e-06, "loss": 0.9872, "step": 3977 }, { "epoch": 0.08, "learning_rate": 4.9734529979401765e-06, "loss": 0.9114, "step": 3978 }, { "epoch": 0.08, "learning_rate": 4.973430789787237e-06, "loss": 0.8654, "step": 3979 }, { "epoch": 0.08, "learning_rate": 4.973408572398582e-06, "loss": 1.1313, "step": 3980 }, { "epoch": 0.08, "learning_rate": 4.973386345774296e-06, "loss": 0.9998, "step": 3981 }, { "epoch": 0.08, "learning_rate": 4.973364109914462e-06, "loss": 1.0906, "step": 3982 }, { "epoch": 0.08, "learning_rate": 4.97334186481916e-06, "loss": 1.0518, "step": 3983 }, { "epoch": 0.08, "learning_rate": 4.973319610488477e-06, "loss": 1.0513, "step": 3984 }, { "epoch": 0.08, "learning_rate": 4.973297346922494e-06, "loss": 0.9551, "step": 3985 }, { "epoch": 0.08, "learning_rate": 4.973275074121295e-06, "loss": 0.9144, "step": 3986 }, { "epoch": 0.08, "learning_rate": 4.973252792084962e-06, "loss": 1.3331, "step": 3987 }, { "epoch": 0.08, "learning_rate": 4.9732305008135796e-06, "loss": 1.0516, "step": 3988 }, { "epoch": 0.08, "learning_rate": 4.973208200307229e-06, "loss": 0.7835, "step": 3989 }, { "epoch": 0.08, "learning_rate": 4.973185890565996e-06, "loss": 1.0506, "step": 3990 }, { "epoch": 0.08, "learning_rate": 4.973163571589963e-06, "loss": 0.839, "step": 3991 }, { "epoch": 0.08, "learning_rate": 4.973141243379212e-06, "loss": 1.1716, "step": 3992 }, { "epoch": 0.08, "learning_rate": 4.973118905933828e-06, "loss": 1.1033, "step": 3993 }, { "epoch": 0.08, "learning_rate": 4.973096559253894e-06, "loss": 1.1318, "step": 3994 }, { "epoch": 0.08, "learning_rate": 4.973074203339493e-06, "loss": 0.881, "step": 3995 }, { "epoch": 0.08, "learning_rate": 4.973051838190709e-06, "loss": 0.9504, "step": 3996 }, { "epoch": 0.08, "learning_rate": 4.973029463807625e-06, "loss": 0.8263, "step": 3997 }, { "epoch": 0.08, "learning_rate": 4.973007080190324e-06, "loss": 0.9774, "step": 3998 }, { "epoch": 0.08, "learning_rate": 4.972984687338892e-06, "loss": 1.123, "step": 3999 }, { "epoch": 0.08, "learning_rate": 4.97296228525341e-06, "loss": 0.9974, "step": 4000 }, { "epoch": 0.08, "learning_rate": 4.972939873933963e-06, "loss": 1.0161, "step": 4001 }, { "epoch": 0.08, "learning_rate": 4.972917453380634e-06, "loss": 1.0013, "step": 4002 }, { "epoch": 0.08, "learning_rate": 4.972895023593507e-06, "loss": 0.9112, "step": 4003 }, { "epoch": 0.08, "learning_rate": 4.972872584572666e-06, "loss": 0.8322, "step": 4004 }, { "epoch": 0.08, "learning_rate": 4.9728501363181945e-06, "loss": 1.0377, "step": 4005 }, { "epoch": 0.08, "learning_rate": 4.972827678830177e-06, "loss": 1.1037, "step": 4006 }, { "epoch": 0.08, "learning_rate": 4.972805212108696e-06, "loss": 0.9789, "step": 4007 }, { "epoch": 0.08, "learning_rate": 4.9727827361538365e-06, "loss": 0.7654, "step": 4008 }, { "epoch": 0.08, "learning_rate": 4.9727602509656824e-06, "loss": 0.9598, "step": 4009 }, { "epoch": 0.08, "learning_rate": 4.972737756544317e-06, "loss": 0.7646, "step": 4010 }, { "epoch": 0.08, "learning_rate": 4.972715252889824e-06, "loss": 0.81, "step": 4011 }, { "epoch": 0.08, "learning_rate": 4.972692740002289e-06, "loss": 1.224, "step": 4012 }, { "epoch": 0.08, "learning_rate": 4.972670217881795e-06, "loss": 0.8992, "step": 4013 }, { "epoch": 0.08, "learning_rate": 4.972647686528426e-06, "loss": 0.866, "step": 4014 }, { "epoch": 0.08, "learning_rate": 4.972625145942266e-06, "loss": 0.8111, "step": 4015 }, { "epoch": 0.08, "learning_rate": 4.9726025961234e-06, "loss": 0.9653, "step": 4016 }, { "epoch": 0.08, "learning_rate": 4.972580037071912e-06, "loss": 0.8862, "step": 4017 }, { "epoch": 0.08, "learning_rate": 4.972557468787885e-06, "loss": 1.0807, "step": 4018 }, { "epoch": 0.08, "learning_rate": 4.972534891271405e-06, "loss": 0.9989, "step": 4019 }, { "epoch": 0.08, "learning_rate": 4.972512304522556e-06, "loss": 1.0668, "step": 4020 }, { "epoch": 0.08, "learning_rate": 4.972489708541421e-06, "loss": 1.0374, "step": 4021 }, { "epoch": 0.08, "learning_rate": 4.972467103328085e-06, "loss": 1.0063, "step": 4022 }, { "epoch": 0.08, "learning_rate": 4.9724444888826325e-06, "loss": 0.8506, "step": 4023 }, { "epoch": 0.08, "learning_rate": 4.972421865205149e-06, "loss": 1.0149, "step": 4024 }, { "epoch": 0.08, "learning_rate": 4.9723992322957185e-06, "loss": 1.1061, "step": 4025 }, { "epoch": 0.08, "learning_rate": 4.972376590154424e-06, "loss": 0.7591, "step": 4026 }, { "epoch": 0.08, "learning_rate": 4.972353938781351e-06, "loss": 0.9596, "step": 4027 }, { "epoch": 0.08, "learning_rate": 4.972331278176585e-06, "loss": 0.948, "step": 4028 }, { "epoch": 0.08, "learning_rate": 4.97230860834021e-06, "loss": 0.8984, "step": 4029 }, { "epoch": 0.08, "learning_rate": 4.972285929272309e-06, "loss": 0.8568, "step": 4030 }, { "epoch": 0.08, "learning_rate": 4.972263240972968e-06, "loss": 1.1038, "step": 4031 }, { "epoch": 0.08, "learning_rate": 4.972240543442274e-06, "loss": 1.0721, "step": 4032 }, { "epoch": 0.08, "learning_rate": 4.972217836680308e-06, "loss": 1.1136, "step": 4033 }, { "epoch": 0.08, "learning_rate": 4.972195120687157e-06, "loss": 0.9102, "step": 4034 }, { "epoch": 0.08, "learning_rate": 4.9721723954629056e-06, "loss": 1.0699, "step": 4035 }, { "epoch": 0.08, "learning_rate": 4.9721496610076375e-06, "loss": 0.9326, "step": 4036 }, { "epoch": 0.08, "learning_rate": 4.972126917321438e-06, "loss": 0.8661, "step": 4037 }, { "epoch": 0.08, "learning_rate": 4.9721041644043935e-06, "loss": 0.9681, "step": 4038 }, { "epoch": 0.08, "learning_rate": 4.972081402256588e-06, "loss": 0.9625, "step": 4039 }, { "epoch": 0.08, "learning_rate": 4.972058630878105e-06, "loss": 1.032, "step": 4040 }, { "epoch": 0.08, "learning_rate": 4.9720358502690315e-06, "loss": 0.9325, "step": 4041 }, { "epoch": 0.08, "learning_rate": 4.972013060429453e-06, "loss": 0.8094, "step": 4042 }, { "epoch": 0.08, "learning_rate": 4.971990261359452e-06, "loss": 1.0721, "step": 4043 }, { "epoch": 0.08, "learning_rate": 4.971967453059116e-06, "loss": 1.0936, "step": 4044 }, { "epoch": 0.08, "learning_rate": 4.971944635528528e-06, "loss": 1.0499, "step": 4045 }, { "epoch": 0.08, "learning_rate": 4.971921808767775e-06, "loss": 0.7694, "step": 4046 }, { "epoch": 0.08, "learning_rate": 4.9718989727769425e-06, "loss": 0.9828, "step": 4047 }, { "epoch": 0.08, "learning_rate": 4.971876127556115e-06, "loss": 1.0026, "step": 4048 }, { "epoch": 0.08, "learning_rate": 4.9718532731053785e-06, "loss": 0.9886, "step": 4049 }, { "epoch": 0.08, "learning_rate": 4.971830409424817e-06, "loss": 1.1384, "step": 4050 }, { "epoch": 0.08, "learning_rate": 4.9718075365145156e-06, "loss": 0.856, "step": 4051 }, { "epoch": 0.08, "learning_rate": 4.971784654374562e-06, "loss": 0.9657, "step": 4052 }, { "epoch": 0.08, "learning_rate": 4.97176176300504e-06, "loss": 1.0109, "step": 4053 }, { "epoch": 0.08, "learning_rate": 4.9717388624060345e-06, "loss": 0.8744, "step": 4054 }, { "epoch": 0.08, "learning_rate": 4.971715952577633e-06, "loss": 0.9203, "step": 4055 }, { "epoch": 0.08, "learning_rate": 4.971693033519919e-06, "loss": 1.0618, "step": 4056 }, { "epoch": 0.08, "learning_rate": 4.971670105232979e-06, "loss": 0.8271, "step": 4057 }, { "epoch": 0.08, "learning_rate": 4.971647167716899e-06, "loss": 1.1389, "step": 4058 }, { "epoch": 0.08, "learning_rate": 4.971624220971764e-06, "loss": 0.8531, "step": 4059 }, { "epoch": 0.08, "learning_rate": 4.97160126499766e-06, "loss": 0.9952, "step": 4060 }, { "epoch": 0.08, "learning_rate": 4.971578299794673e-06, "loss": 0.8353, "step": 4061 }, { "epoch": 0.08, "learning_rate": 4.971555325362888e-06, "loss": 1.0876, "step": 4062 }, { "epoch": 0.08, "learning_rate": 4.971532341702392e-06, "loss": 1.0522, "step": 4063 }, { "epoch": 0.08, "learning_rate": 4.9715093488132696e-06, "loss": 1.0976, "step": 4064 }, { "epoch": 0.08, "learning_rate": 4.971486346695606e-06, "loss": 0.8373, "step": 4065 }, { "epoch": 0.08, "learning_rate": 4.971463335349489e-06, "loss": 1.0663, "step": 4066 }, { "epoch": 0.08, "learning_rate": 4.971440314775004e-06, "loss": 0.862, "step": 4067 }, { "epoch": 0.08, "learning_rate": 4.971417284972236e-06, "loss": 1.0756, "step": 4068 }, { "epoch": 0.08, "learning_rate": 4.971394245941273e-06, "loss": 0.9253, "step": 4069 }, { "epoch": 0.08, "learning_rate": 4.971371197682198e-06, "loss": 1.0984, "step": 4070 }, { "epoch": 0.08, "learning_rate": 4.9713481401950995e-06, "loss": 0.9236, "step": 4071 }, { "epoch": 0.08, "learning_rate": 4.971325073480062e-06, "loss": 0.8433, "step": 4072 }, { "epoch": 0.08, "learning_rate": 4.9713019975371736e-06, "loss": 0.8807, "step": 4073 }, { "epoch": 0.08, "learning_rate": 4.971278912366519e-06, "loss": 1.0073, "step": 4074 }, { "epoch": 0.08, "learning_rate": 4.971255817968184e-06, "loss": 0.943, "step": 4075 }, { "epoch": 0.08, "learning_rate": 4.971232714342257e-06, "loss": 1.0944, "step": 4076 }, { "epoch": 0.08, "learning_rate": 4.971209601488821e-06, "loss": 0.8581, "step": 4077 }, { "epoch": 0.08, "learning_rate": 4.9711864794079655e-06, "loss": 1.0101, "step": 4078 }, { "epoch": 0.08, "learning_rate": 4.971163348099775e-06, "loss": 0.9661, "step": 4079 }, { "epoch": 0.08, "learning_rate": 4.971140207564337e-06, "loss": 1.1263, "step": 4080 }, { "epoch": 0.08, "learning_rate": 4.971117057801736e-06, "loss": 1.0644, "step": 4081 }, { "epoch": 0.08, "learning_rate": 4.971093898812061e-06, "loss": 0.8292, "step": 4082 }, { "epoch": 0.08, "learning_rate": 4.971070730595396e-06, "loss": 0.9676, "step": 4083 }, { "epoch": 0.08, "learning_rate": 4.9710475531518285e-06, "loss": 0.9421, "step": 4084 }, { "epoch": 0.08, "learning_rate": 4.971024366481446e-06, "loss": 1.0848, "step": 4085 }, { "epoch": 0.08, "learning_rate": 4.971001170584334e-06, "loss": 1.028, "step": 4086 }, { "epoch": 0.08, "learning_rate": 4.970977965460579e-06, "loss": 1.1907, "step": 4087 }, { "epoch": 0.08, "learning_rate": 4.970954751110269e-06, "loss": 1.0212, "step": 4088 }, { "epoch": 0.08, "learning_rate": 4.970931527533489e-06, "loss": 1.0057, "step": 4089 }, { "epoch": 0.08, "learning_rate": 4.970908294730327e-06, "loss": 0.8924, "step": 4090 }, { "epoch": 0.08, "learning_rate": 4.970885052700869e-06, "loss": 1.0167, "step": 4091 }, { "epoch": 0.08, "learning_rate": 4.970861801445201e-06, "loss": 0.9969, "step": 4092 }, { "epoch": 0.08, "learning_rate": 4.970838540963412e-06, "loss": 1.0027, "step": 4093 }, { "epoch": 0.08, "learning_rate": 4.970815271255587e-06, "loss": 1.1368, "step": 4094 }, { "epoch": 0.08, "learning_rate": 4.970791992321814e-06, "loss": 0.867, "step": 4095 }, { "epoch": 0.08, "learning_rate": 4.970768704162179e-06, "loss": 0.8627, "step": 4096 }, { "epoch": 0.08, "learning_rate": 4.970745406776769e-06, "loss": 1.0916, "step": 4097 }, { "epoch": 0.08, "learning_rate": 4.970722100165673e-06, "loss": 0.9756, "step": 4098 }, { "epoch": 0.08, "learning_rate": 4.970698784328974e-06, "loss": 1.0463, "step": 4099 }, { "epoch": 0.08, "learning_rate": 4.970675459266764e-06, "loss": 1.3221, "step": 4100 }, { "epoch": 0.08, "learning_rate": 4.970652124979126e-06, "loss": 0.9503, "step": 4101 }, { "epoch": 0.08, "learning_rate": 4.970628781466149e-06, "loss": 0.9835, "step": 4102 }, { "epoch": 0.08, "learning_rate": 4.970605428727921e-06, "loss": 1.0888, "step": 4103 }, { "epoch": 0.08, "learning_rate": 4.970582066764526e-06, "loss": 0.9389, "step": 4104 }, { "epoch": 0.08, "learning_rate": 4.970558695576055e-06, "loss": 1.0648, "step": 4105 }, { "epoch": 0.08, "learning_rate": 4.9705353151625935e-06, "loss": 1.04, "step": 4106 }, { "epoch": 0.08, "learning_rate": 4.970511925524229e-06, "loss": 1.0437, "step": 4107 }, { "epoch": 0.08, "learning_rate": 4.9704885266610476e-06, "loss": 0.8802, "step": 4108 }, { "epoch": 0.08, "learning_rate": 4.970465118573138e-06, "loss": 0.8209, "step": 4109 }, { "epoch": 0.08, "learning_rate": 4.970441701260588e-06, "loss": 1.0726, "step": 4110 }, { "epoch": 0.08, "learning_rate": 4.970418274723484e-06, "loss": 0.8898, "step": 4111 }, { "epoch": 0.08, "learning_rate": 4.970394838961914e-06, "loss": 1.1096, "step": 4112 }, { "epoch": 0.08, "learning_rate": 4.9703713939759655e-06, "loss": 1.0998, "step": 4113 }, { "epoch": 0.08, "learning_rate": 4.970347939765726e-06, "loss": 0.9354, "step": 4114 }, { "epoch": 0.08, "learning_rate": 4.970324476331283e-06, "loss": 1.06, "step": 4115 }, { "epoch": 0.08, "learning_rate": 4.970301003672725e-06, "loss": 0.8527, "step": 4116 }, { "epoch": 0.08, "learning_rate": 4.9702775217901375e-06, "loss": 1.0089, "step": 4117 }, { "epoch": 0.08, "learning_rate": 4.97025403068361e-06, "loss": 1.23, "step": 4118 }, { "epoch": 0.08, "learning_rate": 4.9702305303532295e-06, "loss": 0.9514, "step": 4119 }, { "epoch": 0.08, "learning_rate": 4.970207020799084e-06, "loss": 1.0002, "step": 4120 }, { "epoch": 0.08, "learning_rate": 4.970183502021261e-06, "loss": 0.801, "step": 4121 }, { "epoch": 0.08, "learning_rate": 4.9701599740198495e-06, "loss": 0.9702, "step": 4122 }, { "epoch": 0.08, "learning_rate": 4.970136436794936e-06, "loss": 0.8022, "step": 4123 }, { "epoch": 0.08, "learning_rate": 4.970112890346608e-06, "loss": 1.1125, "step": 4124 }, { "epoch": 0.08, "learning_rate": 4.9700893346749545e-06, "loss": 1.507, "step": 4125 }, { "epoch": 0.08, "learning_rate": 4.970065769780064e-06, "loss": 0.8227, "step": 4126 }, { "epoch": 0.08, "learning_rate": 4.970042195662023e-06, "loss": 0.9167, "step": 4127 }, { "epoch": 0.08, "learning_rate": 4.97001861232092e-06, "loss": 0.8606, "step": 4128 }, { "epoch": 0.08, "learning_rate": 4.969995019756843e-06, "loss": 0.955, "step": 4129 }, { "epoch": 0.08, "learning_rate": 4.969971417969881e-06, "loss": 1.2213, "step": 4130 }, { "epoch": 0.08, "learning_rate": 4.969947806960122e-06, "loss": 0.9548, "step": 4131 }, { "epoch": 0.08, "learning_rate": 4.969924186727651e-06, "loss": 1.3192, "step": 4132 }, { "epoch": 0.08, "learning_rate": 4.9699005572725615e-06, "loss": 0.8076, "step": 4133 }, { "epoch": 0.08, "learning_rate": 4.969876918594938e-06, "loss": 1.0293, "step": 4134 }, { "epoch": 0.08, "learning_rate": 4.96985327069487e-06, "loss": 0.9581, "step": 4135 }, { "epoch": 0.08, "learning_rate": 4.969829613572445e-06, "loss": 0.8762, "step": 4136 }, { "epoch": 0.08, "learning_rate": 4.9698059472277535e-06, "loss": 1.0119, "step": 4137 }, { "epoch": 0.08, "learning_rate": 4.969782271660881e-06, "loss": 1.0408, "step": 4138 }, { "epoch": 0.08, "learning_rate": 4.969758586871918e-06, "loss": 1.1572, "step": 4139 }, { "epoch": 0.08, "learning_rate": 4.969734892860951e-06, "loss": 0.8336, "step": 4140 }, { "epoch": 0.08, "learning_rate": 4.969711189628071e-06, "loss": 1.0883, "step": 4141 }, { "epoch": 0.08, "learning_rate": 4.969687477173365e-06, "loss": 1.1004, "step": 4142 }, { "epoch": 0.08, "learning_rate": 4.96966375549692e-06, "loss": 1.0253, "step": 4143 }, { "epoch": 0.08, "learning_rate": 4.969640024598829e-06, "loss": 0.8337, "step": 4144 }, { "epoch": 0.08, "learning_rate": 4.969616284479176e-06, "loss": 1.0639, "step": 4145 }, { "epoch": 0.08, "learning_rate": 4.9695925351380515e-06, "loss": 0.8378, "step": 4146 }, { "epoch": 0.08, "learning_rate": 4.9695687765755445e-06, "loss": 0.8936, "step": 4147 }, { "epoch": 0.08, "learning_rate": 4.969545008791743e-06, "loss": 1.0146, "step": 4148 }, { "epoch": 0.08, "learning_rate": 4.969521231786737e-06, "loss": 0.9464, "step": 4149 }, { "epoch": 0.08, "learning_rate": 4.969497445560614e-06, "loss": 0.975, "step": 4150 }, { "epoch": 0.08, "learning_rate": 4.969473650113463e-06, "loss": 1.0736, "step": 4151 }, { "epoch": 0.08, "learning_rate": 4.969449845445375e-06, "loss": 0.8549, "step": 4152 }, { "epoch": 0.08, "learning_rate": 4.969426031556435e-06, "loss": 0.7929, "step": 4153 }, { "epoch": 0.08, "learning_rate": 4.969402208446733e-06, "loss": 0.9011, "step": 4154 }, { "epoch": 0.08, "learning_rate": 4.969378376116361e-06, "loss": 0.9211, "step": 4155 }, { "epoch": 0.08, "learning_rate": 4.9693545345654045e-06, "loss": 1.0417, "step": 4156 }, { "epoch": 0.08, "learning_rate": 4.969330683793955e-06, "loss": 0.9911, "step": 4157 }, { "epoch": 0.08, "learning_rate": 4.969306823802099e-06, "loss": 0.9203, "step": 4158 }, { "epoch": 0.08, "learning_rate": 4.9692829545899294e-06, "loss": 0.9541, "step": 4159 }, { "epoch": 0.08, "learning_rate": 4.969259076157531e-06, "loss": 0.809, "step": 4160 }, { "epoch": 0.08, "learning_rate": 4.969235188504995e-06, "loss": 1.1033, "step": 4161 }, { "epoch": 0.08, "learning_rate": 4.969211291632411e-06, "loss": 1.0602, "step": 4162 }, { "epoch": 0.08, "learning_rate": 4.9691873855398675e-06, "loss": 1.0274, "step": 4163 }, { "epoch": 0.08, "learning_rate": 4.969163470227454e-06, "loss": 0.9225, "step": 4164 }, { "epoch": 0.08, "learning_rate": 4.96913954569526e-06, "loss": 0.8922, "step": 4165 }, { "epoch": 0.08, "learning_rate": 4.969115611943375e-06, "loss": 0.7913, "step": 4166 }, { "epoch": 0.08, "learning_rate": 4.969091668971887e-06, "loss": 0.8524, "step": 4167 }, { "epoch": 0.08, "learning_rate": 4.969067716780888e-06, "loss": 1.1008, "step": 4168 }, { "epoch": 0.08, "learning_rate": 4.969043755370464e-06, "loss": 1.0591, "step": 4169 }, { "epoch": 0.08, "learning_rate": 4.969019784740707e-06, "loss": 0.952, "step": 4170 }, { "epoch": 0.08, "learning_rate": 4.968995804891706e-06, "loss": 0.9304, "step": 4171 }, { "epoch": 0.08, "learning_rate": 4.968971815823551e-06, "loss": 0.8922, "step": 4172 }, { "epoch": 0.08, "learning_rate": 4.96894781753633e-06, "loss": 0.8516, "step": 4173 }, { "epoch": 0.08, "learning_rate": 4.968923810030134e-06, "loss": 0.9925, "step": 4174 }, { "epoch": 0.08, "learning_rate": 4.968899793305052e-06, "loss": 1.1267, "step": 4175 }, { "epoch": 0.08, "learning_rate": 4.968875767361175e-06, "loss": 1.0306, "step": 4176 }, { "epoch": 0.08, "learning_rate": 4.968851732198589e-06, "loss": 0.7695, "step": 4177 }, { "epoch": 0.08, "learning_rate": 4.968827687817388e-06, "loss": 0.8921, "step": 4178 }, { "epoch": 0.08, "learning_rate": 4.96880363421766e-06, "loss": 0.8931, "step": 4179 }, { "epoch": 0.08, "learning_rate": 4.968779571399495e-06, "loss": 1.0189, "step": 4180 }, { "epoch": 0.08, "learning_rate": 4.968755499362983e-06, "loss": 1.258, "step": 4181 }, { "epoch": 0.08, "learning_rate": 4.968731418108213e-06, "loss": 1.0096, "step": 4182 }, { "epoch": 0.08, "learning_rate": 4.968707327635276e-06, "loss": 0.7883, "step": 4183 }, { "epoch": 0.08, "learning_rate": 4.968683227944261e-06, "loss": 0.9166, "step": 4184 }, { "epoch": 0.08, "learning_rate": 4.9686591190352594e-06, "loss": 0.9524, "step": 4185 }, { "epoch": 0.08, "learning_rate": 4.96863500090836e-06, "loss": 1.0467, "step": 4186 }, { "epoch": 0.08, "learning_rate": 4.968610873563653e-06, "loss": 1.2054, "step": 4187 }, { "epoch": 0.08, "learning_rate": 4.968586737001229e-06, "loss": 1.0803, "step": 4188 }, { "epoch": 0.08, "learning_rate": 4.968562591221177e-06, "loss": 0.8968, "step": 4189 }, { "epoch": 0.08, "learning_rate": 4.968538436223589e-06, "loss": 1.1424, "step": 4190 }, { "epoch": 0.08, "learning_rate": 4.968514272008553e-06, "loss": 1.0209, "step": 4191 }, { "epoch": 0.08, "learning_rate": 4.968490098576161e-06, "loss": 0.9585, "step": 4192 }, { "epoch": 0.08, "learning_rate": 4.968465915926503e-06, "loss": 0.8975, "step": 4193 }, { "epoch": 0.08, "learning_rate": 4.968441724059669e-06, "loss": 0.9781, "step": 4194 }, { "epoch": 0.08, "learning_rate": 4.968417522975749e-06, "loss": 1.0073, "step": 4195 }, { "epoch": 0.08, "learning_rate": 4.968393312674834e-06, "loss": 0.8912, "step": 4196 }, { "epoch": 0.08, "learning_rate": 4.968369093157013e-06, "loss": 0.988, "step": 4197 }, { "epoch": 0.08, "learning_rate": 4.9683448644223785e-06, "loss": 0.9809, "step": 4198 }, { "epoch": 0.08, "learning_rate": 4.968320626471019e-06, "loss": 0.9529, "step": 4199 }, { "epoch": 0.08, "learning_rate": 4.968296379303027e-06, "loss": 1.0959, "step": 4200 }, { "epoch": 0.08, "learning_rate": 4.968272122918492e-06, "loss": 1.0205, "step": 4201 }, { "epoch": 0.08, "learning_rate": 4.968247857317504e-06, "loss": 0.9195, "step": 4202 }, { "epoch": 0.08, "learning_rate": 4.968223582500155e-06, "loss": 0.9952, "step": 4203 }, { "epoch": 0.08, "learning_rate": 4.968199298466534e-06, "loss": 0.8112, "step": 4204 }, { "epoch": 0.08, "learning_rate": 4.968175005216732e-06, "loss": 0.9819, "step": 4205 }, { "epoch": 0.08, "learning_rate": 4.968150702750842e-06, "loss": 1.2183, "step": 4206 }, { "epoch": 0.08, "learning_rate": 4.968126391068951e-06, "loss": 1.0697, "step": 4207 }, { "epoch": 0.08, "learning_rate": 4.968102070171152e-06, "loss": 0.9817, "step": 4208 }, { "epoch": 0.08, "learning_rate": 4.9680777400575365e-06, "loss": 0.99, "step": 4209 }, { "epoch": 0.08, "learning_rate": 4.9680534007281945e-06, "loss": 0.9517, "step": 4210 }, { "epoch": 0.08, "learning_rate": 4.968029052183216e-06, "loss": 0.9592, "step": 4211 }, { "epoch": 0.08, "learning_rate": 4.968004694422693e-06, "loss": 1.0787, "step": 4212 }, { "epoch": 0.08, "learning_rate": 4.967980327446716e-06, "loss": 1.0139, "step": 4213 }, { "epoch": 0.08, "learning_rate": 4.967955951255377e-06, "loss": 0.9935, "step": 4214 }, { "epoch": 0.08, "learning_rate": 4.967931565848765e-06, "loss": 0.9977, "step": 4215 }, { "epoch": 0.08, "learning_rate": 4.967907171226972e-06, "loss": 0.7963, "step": 4216 }, { "epoch": 0.08, "learning_rate": 4.96788276739009e-06, "loss": 0.8492, "step": 4217 }, { "epoch": 0.08, "learning_rate": 4.96785835433821e-06, "loss": 0.9519, "step": 4218 }, { "epoch": 0.08, "learning_rate": 4.967833932071421e-06, "loss": 1.121, "step": 4219 }, { "epoch": 0.08, "learning_rate": 4.967809500589817e-06, "loss": 1.0041, "step": 4220 }, { "epoch": 0.08, "learning_rate": 4.967785059893487e-06, "loss": 0.9341, "step": 4221 }, { "epoch": 0.08, "learning_rate": 4.967760609982524e-06, "loss": 0.9818, "step": 4222 }, { "epoch": 0.08, "learning_rate": 4.9677361508570186e-06, "loss": 0.8147, "step": 4223 }, { "epoch": 0.08, "learning_rate": 4.967711682517062e-06, "loss": 1.0451, "step": 4224 }, { "epoch": 0.08, "learning_rate": 4.967687204962746e-06, "loss": 1.2407, "step": 4225 }, { "epoch": 0.08, "learning_rate": 4.967662718194161e-06, "loss": 0.7022, "step": 4226 }, { "epoch": 0.08, "learning_rate": 4.967638222211399e-06, "loss": 0.8286, "step": 4227 }, { "epoch": 0.08, "learning_rate": 4.967613717014551e-06, "loss": 1.049, "step": 4228 }, { "epoch": 0.08, "learning_rate": 4.96758920260371e-06, "loss": 0.9619, "step": 4229 }, { "epoch": 0.08, "learning_rate": 4.9675646789789665e-06, "loss": 1.0068, "step": 4230 }, { "epoch": 0.08, "learning_rate": 4.967540146140413e-06, "loss": 0.9198, "step": 4231 }, { "epoch": 0.08, "learning_rate": 4.967515604088139e-06, "loss": 1.0753, "step": 4232 }, { "epoch": 0.08, "learning_rate": 4.967491052822237e-06, "loss": 0.9616, "step": 4233 }, { "epoch": 0.08, "learning_rate": 4.9674664923428005e-06, "loss": 0.9746, "step": 4234 }, { "epoch": 0.08, "learning_rate": 4.9674419226499185e-06, "loss": 0.9027, "step": 4235 }, { "epoch": 0.08, "learning_rate": 4.967417343743685e-06, "loss": 0.9984, "step": 4236 }, { "epoch": 0.08, "learning_rate": 4.96739275562419e-06, "loss": 1.0212, "step": 4237 }, { "epoch": 0.08, "learning_rate": 4.967368158291526e-06, "loss": 0.9611, "step": 4238 }, { "epoch": 0.08, "learning_rate": 4.967343551745785e-06, "loss": 1.0297, "step": 4239 }, { "epoch": 0.08, "learning_rate": 4.96731893598706e-06, "loss": 0.842, "step": 4240 }, { "epoch": 0.08, "learning_rate": 4.967294311015441e-06, "loss": 0.7588, "step": 4241 }, { "epoch": 0.08, "learning_rate": 4.96726967683102e-06, "loss": 1.0783, "step": 4242 }, { "epoch": 0.08, "learning_rate": 4.967245033433891e-06, "loss": 1.0441, "step": 4243 }, { "epoch": 0.08, "learning_rate": 4.967220380824144e-06, "loss": 1.1663, "step": 4244 }, { "epoch": 0.08, "learning_rate": 4.967195719001872e-06, "loss": 0.8982, "step": 4245 }, { "epoch": 0.08, "learning_rate": 4.967171047967166e-06, "loss": 0.8403, "step": 4246 }, { "epoch": 0.08, "learning_rate": 4.967146367720119e-06, "loss": 1.011, "step": 4247 }, { "epoch": 0.08, "learning_rate": 4.967121678260824e-06, "loss": 0.8901, "step": 4248 }, { "epoch": 0.08, "learning_rate": 4.967096979589372e-06, "loss": 1.1151, "step": 4249 }, { "epoch": 0.08, "learning_rate": 4.967072271705855e-06, "loss": 1.0102, "step": 4250 }, { "epoch": 0.08, "learning_rate": 4.967047554610367e-06, "loss": 0.984, "step": 4251 }, { "epoch": 0.08, "learning_rate": 4.9670228283029975e-06, "loss": 0.838, "step": 4252 }, { "epoch": 0.08, "learning_rate": 4.966998092783841e-06, "loss": 0.8079, "step": 4253 }, { "epoch": 0.08, "learning_rate": 4.96697334805299e-06, "loss": 0.946, "step": 4254 }, { "epoch": 0.08, "learning_rate": 4.966948594110536e-06, "loss": 0.987, "step": 4255 }, { "epoch": 0.08, "learning_rate": 4.966923830956571e-06, "loss": 0.9153, "step": 4256 }, { "epoch": 0.08, "learning_rate": 4.966899058591188e-06, "loss": 0.8296, "step": 4257 }, { "epoch": 0.08, "learning_rate": 4.96687427701448e-06, "loss": 0.9461, "step": 4258 }, { "epoch": 0.08, "learning_rate": 4.966849486226539e-06, "loss": 0.7975, "step": 4259 }, { "epoch": 0.08, "learning_rate": 4.9668246862274576e-06, "loss": 0.8749, "step": 4260 }, { "epoch": 0.08, "learning_rate": 4.9667998770173285e-06, "loss": 0.8776, "step": 4261 }, { "epoch": 0.08, "learning_rate": 4.966775058596244e-06, "loss": 1.1937, "step": 4262 }, { "epoch": 0.08, "learning_rate": 4.966750230964297e-06, "loss": 1.0247, "step": 4263 }, { "epoch": 0.08, "learning_rate": 4.966725394121581e-06, "loss": 0.778, "step": 4264 }, { "epoch": 0.08, "learning_rate": 4.966700548068187e-06, "loss": 0.9895, "step": 4265 }, { "epoch": 0.08, "learning_rate": 4.966675692804209e-06, "loss": 0.8882, "step": 4266 }, { "epoch": 0.08, "learning_rate": 4.966650828329741e-06, "loss": 0.933, "step": 4267 }, { "epoch": 0.08, "learning_rate": 4.966625954644872e-06, "loss": 1.19, "step": 4268 }, { "epoch": 0.08, "learning_rate": 4.966601071749699e-06, "loss": 0.9506, "step": 4269 }, { "epoch": 0.08, "learning_rate": 4.9665761796443135e-06, "loss": 1.1184, "step": 4270 }, { "epoch": 0.08, "learning_rate": 4.966551278328807e-06, "loss": 0.9505, "step": 4271 }, { "epoch": 0.08, "learning_rate": 4.966526367803275e-06, "loss": 1.1063, "step": 4272 }, { "epoch": 0.08, "learning_rate": 4.9665014480678075e-06, "loss": 0.9681, "step": 4273 }, { "epoch": 0.08, "learning_rate": 4.9664765191225e-06, "loss": 1.0861, "step": 4274 }, { "epoch": 0.08, "learning_rate": 4.966451580967445e-06, "loss": 1.0121, "step": 4275 }, { "epoch": 0.08, "learning_rate": 4.966426633602736e-06, "loss": 0.9655, "step": 4276 }, { "epoch": 0.08, "learning_rate": 4.966401677028464e-06, "loss": 1.0314, "step": 4277 }, { "epoch": 0.08, "learning_rate": 4.966376711244725e-06, "loss": 0.9151, "step": 4278 }, { "epoch": 0.08, "learning_rate": 4.966351736251611e-06, "loss": 0.9772, "step": 4279 }, { "epoch": 0.08, "learning_rate": 4.966326752049215e-06, "loss": 0.8928, "step": 4280 }, { "epoch": 0.08, "learning_rate": 4.96630175863763e-06, "loss": 0.8885, "step": 4281 }, { "epoch": 0.08, "learning_rate": 4.96627675601695e-06, "loss": 1.1854, "step": 4282 }, { "epoch": 0.08, "learning_rate": 4.9662517441872685e-06, "loss": 0.8783, "step": 4283 }, { "epoch": 0.08, "learning_rate": 4.9662267231486785e-06, "loss": 0.7327, "step": 4284 }, { "epoch": 0.08, "learning_rate": 4.966201692901274e-06, "loss": 1.0765, "step": 4285 }, { "epoch": 0.08, "learning_rate": 4.966176653445147e-06, "loss": 1.0377, "step": 4286 }, { "epoch": 0.08, "learning_rate": 4.966151604780393e-06, "loss": 1.0673, "step": 4287 }, { "epoch": 0.08, "learning_rate": 4.966126546907104e-06, "loss": 1.087, "step": 4288 }, { "epoch": 0.08, "learning_rate": 4.966101479825375e-06, "loss": 0.8813, "step": 4289 }, { "epoch": 0.08, "learning_rate": 4.966076403535297e-06, "loss": 1.0146, "step": 4290 }, { "epoch": 0.08, "learning_rate": 4.966051318036967e-06, "loss": 0.9375, "step": 4291 }, { "epoch": 0.08, "learning_rate": 4.966026223330475e-06, "loss": 0.9811, "step": 4292 }, { "epoch": 0.08, "learning_rate": 4.9660011194159185e-06, "loss": 0.9337, "step": 4293 }, { "epoch": 0.08, "learning_rate": 4.965976006293389e-06, "loss": 1.0262, "step": 4294 }, { "epoch": 0.08, "learning_rate": 4.96595088396298e-06, "loss": 0.7677, "step": 4295 }, { "epoch": 0.08, "learning_rate": 4.9659257524247874e-06, "loss": 0.955, "step": 4296 }, { "epoch": 0.08, "learning_rate": 4.965900611678902e-06, "loss": 0.9626, "step": 4297 }, { "epoch": 0.08, "learning_rate": 4.96587546172542e-06, "loss": 0.8416, "step": 4298 }, { "epoch": 0.08, "learning_rate": 4.965850302564435e-06, "loss": 0.8126, "step": 4299 }, { "epoch": 0.08, "learning_rate": 4.9658251341960406e-06, "loss": 1.1898, "step": 4300 }, { "epoch": 0.08, "learning_rate": 4.96579995662033e-06, "loss": 1.0953, "step": 4301 }, { "epoch": 0.08, "learning_rate": 4.965774769837399e-06, "loss": 1.0595, "step": 4302 }, { "epoch": 0.08, "learning_rate": 4.9657495738473395e-06, "loss": 1.0131, "step": 4303 }, { "epoch": 0.08, "learning_rate": 4.965724368650248e-06, "loss": 0.9852, "step": 4304 }, { "epoch": 0.08, "learning_rate": 4.965699154246216e-06, "loss": 0.9662, "step": 4305 }, { "epoch": 0.08, "learning_rate": 4.96567393063534e-06, "loss": 1.1782, "step": 4306 }, { "epoch": 0.08, "learning_rate": 4.965648697817712e-06, "loss": 1.2123, "step": 4307 }, { "epoch": 0.08, "learning_rate": 4.965623455793428e-06, "loss": 0.8857, "step": 4308 }, { "epoch": 0.08, "learning_rate": 4.965598204562582e-06, "loss": 0.7381, "step": 4309 }, { "epoch": 0.08, "learning_rate": 4.965572944125267e-06, "loss": 1.168, "step": 4310 }, { "epoch": 0.08, "learning_rate": 4.965547674481579e-06, "loss": 0.9362, "step": 4311 }, { "epoch": 0.08, "learning_rate": 4.9655223956316115e-06, "loss": 1.0429, "step": 4312 }, { "epoch": 0.08, "learning_rate": 4.965497107575458e-06, "loss": 1.0988, "step": 4313 }, { "epoch": 0.08, "learning_rate": 4.965471810313215e-06, "loss": 0.9271, "step": 4314 }, { "epoch": 0.08, "learning_rate": 4.965446503844975e-06, "loss": 0.7336, "step": 4315 }, { "epoch": 0.08, "learning_rate": 4.965421188170835e-06, "loss": 1.0143, "step": 4316 }, { "epoch": 0.08, "learning_rate": 4.965395863290886e-06, "loss": 0.8921, "step": 4317 }, { "epoch": 0.08, "learning_rate": 4.965370529205226e-06, "loss": 1.055, "step": 4318 }, { "epoch": 0.08, "learning_rate": 4.9653451859139465e-06, "loss": 1.0845, "step": 4319 }, { "epoch": 0.08, "learning_rate": 4.965319833417144e-06, "loss": 0.9377, "step": 4320 }, { "epoch": 0.08, "learning_rate": 4.965294471714913e-06, "loss": 0.9058, "step": 4321 }, { "epoch": 0.08, "learning_rate": 4.965269100807349e-06, "loss": 0.8797, "step": 4322 }, { "epoch": 0.08, "learning_rate": 4.965243720694545e-06, "loss": 0.9216, "step": 4323 }, { "epoch": 0.08, "learning_rate": 4.965218331376597e-06, "loss": 1.1761, "step": 4324 }, { "epoch": 0.08, "learning_rate": 4.965192932853598e-06, "loss": 0.9456, "step": 4325 }, { "epoch": 0.08, "learning_rate": 4.965167525125645e-06, "loss": 1.0358, "step": 4326 }, { "epoch": 0.08, "learning_rate": 4.965142108192832e-06, "loss": 0.9588, "step": 4327 }, { "epoch": 0.08, "learning_rate": 4.965116682055254e-06, "loss": 0.8273, "step": 4328 }, { "epoch": 0.08, "learning_rate": 4.965091246713006e-06, "loss": 0.7857, "step": 4329 }, { "epoch": 0.08, "learning_rate": 4.965065802166183e-06, "loss": 0.9614, "step": 4330 }, { "epoch": 0.08, "learning_rate": 4.9650403484148794e-06, "loss": 1.2422, "step": 4331 }, { "epoch": 0.08, "learning_rate": 4.965014885459191e-06, "loss": 0.9413, "step": 4332 }, { "epoch": 0.08, "learning_rate": 4.964989413299213e-06, "loss": 0.923, "step": 4333 }, { "epoch": 0.08, "learning_rate": 4.964963931935039e-06, "loss": 1.0099, "step": 4334 }, { "epoch": 0.08, "learning_rate": 4.964938441366767e-06, "loss": 1.0192, "step": 4335 }, { "epoch": 0.08, "learning_rate": 4.964912941594488e-06, "loss": 1.0172, "step": 4336 }, { "epoch": 0.08, "learning_rate": 4.964887432618302e-06, "loss": 1.0658, "step": 4337 }, { "epoch": 0.08, "learning_rate": 4.964861914438301e-06, "loss": 1.139, "step": 4338 }, { "epoch": 0.08, "learning_rate": 4.964836387054581e-06, "loss": 0.875, "step": 4339 }, { "epoch": 0.08, "learning_rate": 4.964810850467237e-06, "loss": 1.0212, "step": 4340 }, { "epoch": 0.08, "learning_rate": 4.964785304676366e-06, "loss": 0.9008, "step": 4341 }, { "epoch": 0.08, "learning_rate": 4.964759749682062e-06, "loss": 1.0915, "step": 4342 }, { "epoch": 0.08, "learning_rate": 4.96473418548442e-06, "loss": 1.0674, "step": 4343 }, { "epoch": 0.08, "learning_rate": 4.9647086120835365e-06, "loss": 0.9172, "step": 4344 }, { "epoch": 0.08, "learning_rate": 4.9646830294795065e-06, "loss": 1.0927, "step": 4345 }, { "epoch": 0.08, "learning_rate": 4.964657437672426e-06, "loss": 0.8277, "step": 4346 }, { "epoch": 0.08, "learning_rate": 4.9646318366623905e-06, "loss": 0.8683, "step": 4347 }, { "epoch": 0.08, "learning_rate": 4.964606226449494e-06, "loss": 0.9655, "step": 4348 }, { "epoch": 0.08, "learning_rate": 4.964580607033834e-06, "loss": 0.981, "step": 4349 }, { "epoch": 0.08, "learning_rate": 4.964554978415506e-06, "loss": 1.0561, "step": 4350 }, { "epoch": 0.08, "learning_rate": 4.964529340594605e-06, "loss": 0.9211, "step": 4351 }, { "epoch": 0.08, "learning_rate": 4.964503693571227e-06, "loss": 0.8619, "step": 4352 }, { "epoch": 0.08, "learning_rate": 4.964478037345468e-06, "loss": 1.0267, "step": 4353 }, { "epoch": 0.08, "learning_rate": 4.964452371917423e-06, "loss": 1.1031, "step": 4354 }, { "epoch": 0.08, "learning_rate": 4.964426697287189e-06, "loss": 1.0338, "step": 4355 }, { "epoch": 0.08, "learning_rate": 4.964401013454861e-06, "loss": 1.1519, "step": 4356 }, { "epoch": 0.08, "learning_rate": 4.9643753204205355e-06, "loss": 0.9076, "step": 4357 }, { "epoch": 0.08, "learning_rate": 4.964349618184308e-06, "loss": 0.9258, "step": 4358 }, { "epoch": 0.08, "learning_rate": 4.964323906746274e-06, "loss": 1.2247, "step": 4359 }, { "epoch": 0.08, "learning_rate": 4.9642981861065305e-06, "loss": 1.0429, "step": 4360 }, { "epoch": 0.08, "learning_rate": 4.964272456265173e-06, "loss": 1.1932, "step": 4361 }, { "epoch": 0.08, "learning_rate": 4.9642467172222985e-06, "loss": 1.0179, "step": 4362 }, { "epoch": 0.08, "learning_rate": 4.964220968978002e-06, "loss": 0.9547, "step": 4363 }, { "epoch": 0.08, "learning_rate": 4.964195211532379e-06, "loss": 0.623, "step": 4364 }, { "epoch": 0.08, "learning_rate": 4.964169444885527e-06, "loss": 0.9062, "step": 4365 }, { "epoch": 0.08, "learning_rate": 4.9641436690375426e-06, "loss": 1.0526, "step": 4366 }, { "epoch": 0.08, "learning_rate": 4.964117883988521e-06, "loss": 0.9793, "step": 4367 }, { "epoch": 0.08, "learning_rate": 4.964092089738558e-06, "loss": 0.9377, "step": 4368 }, { "epoch": 0.08, "learning_rate": 4.964066286287752e-06, "loss": 1.0184, "step": 4369 }, { "epoch": 0.08, "learning_rate": 4.964040473636197e-06, "loss": 1.1167, "step": 4370 }, { "epoch": 0.08, "learning_rate": 4.96401465178399e-06, "loss": 0.875, "step": 4371 }, { "epoch": 0.08, "learning_rate": 4.963988820731229e-06, "loss": 0.9036, "step": 4372 }, { "epoch": 0.08, "learning_rate": 4.963962980478009e-06, "loss": 0.9146, "step": 4373 }, { "epoch": 0.08, "learning_rate": 4.963937131024427e-06, "loss": 1.1709, "step": 4374 }, { "epoch": 0.08, "learning_rate": 4.963911272370579e-06, "loss": 1.0193, "step": 4375 }, { "epoch": 0.08, "learning_rate": 4.9638854045165605e-06, "loss": 0.9817, "step": 4376 }, { "epoch": 0.08, "learning_rate": 4.963859527462471e-06, "loss": 1.0594, "step": 4377 }, { "epoch": 0.08, "learning_rate": 4.963833641208405e-06, "loss": 0.9724, "step": 4378 }, { "epoch": 0.08, "learning_rate": 4.963807745754461e-06, "loss": 0.8828, "step": 4379 }, { "epoch": 0.08, "learning_rate": 4.963781841100733e-06, "loss": 1.1252, "step": 4380 }, { "epoch": 0.08, "learning_rate": 4.96375592724732e-06, "loss": 1.0483, "step": 4381 }, { "epoch": 0.08, "learning_rate": 4.963730004194317e-06, "loss": 1.1212, "step": 4382 }, { "epoch": 0.08, "learning_rate": 4.963704071941822e-06, "loss": 1.0365, "step": 4383 }, { "epoch": 0.08, "learning_rate": 4.963678130489932e-06, "loss": 1.0075, "step": 4384 }, { "epoch": 0.08, "learning_rate": 4.963652179838743e-06, "loss": 0.9592, "step": 4385 }, { "epoch": 0.08, "learning_rate": 4.9636262199883525e-06, "loss": 1.0306, "step": 4386 }, { "epoch": 0.08, "learning_rate": 4.963600250938857e-06, "loss": 1.0107, "step": 4387 }, { "epoch": 0.08, "learning_rate": 4.963574272690354e-06, "loss": 0.9616, "step": 4388 }, { "epoch": 0.08, "learning_rate": 4.96354828524294e-06, "loss": 0.9292, "step": 4389 }, { "epoch": 0.08, "learning_rate": 4.963522288596712e-06, "loss": 0.9846, "step": 4390 }, { "epoch": 0.08, "learning_rate": 4.963496282751768e-06, "loss": 0.9975, "step": 4391 }, { "epoch": 0.08, "learning_rate": 4.963470267708203e-06, "loss": 0.9733, "step": 4392 }, { "epoch": 0.08, "learning_rate": 4.9634442434661174e-06, "loss": 0.8278, "step": 4393 }, { "epoch": 0.08, "learning_rate": 4.963418210025605e-06, "loss": 1.2269, "step": 4394 }, { "epoch": 0.08, "learning_rate": 4.963392167386766e-06, "loss": 1.2045, "step": 4395 }, { "epoch": 0.08, "learning_rate": 4.963366115549695e-06, "loss": 0.9297, "step": 4396 }, { "epoch": 0.08, "learning_rate": 4.963340054514491e-06, "loss": 0.8795, "step": 4397 }, { "epoch": 0.08, "learning_rate": 4.963313984281251e-06, "loss": 0.9146, "step": 4398 }, { "epoch": 0.08, "learning_rate": 4.963287904850072e-06, "loss": 1.124, "step": 4399 }, { "epoch": 0.08, "learning_rate": 4.96326181622105e-06, "loss": 1.1362, "step": 4400 }, { "epoch": 0.08, "learning_rate": 4.963235718394286e-06, "loss": 1.0351, "step": 4401 }, { "epoch": 0.08, "learning_rate": 4.963209611369874e-06, "loss": 0.8522, "step": 4402 }, { "epoch": 0.08, "learning_rate": 4.963183495147913e-06, "loss": 0.88, "step": 4403 }, { "epoch": 0.08, "learning_rate": 4.963157369728501e-06, "loss": 0.9625, "step": 4404 }, { "epoch": 0.08, "learning_rate": 4.9631312351117345e-06, "loss": 1.0453, "step": 4405 }, { "epoch": 0.08, "learning_rate": 4.963105091297712e-06, "loss": 1.1104, "step": 4406 }, { "epoch": 0.08, "learning_rate": 4.96307893828653e-06, "loss": 0.9141, "step": 4407 }, { "epoch": 0.08, "learning_rate": 4.963052776078287e-06, "loss": 0.6802, "step": 4408 }, { "epoch": 0.08, "learning_rate": 4.9630266046730804e-06, "loss": 1.079, "step": 4409 }, { "epoch": 0.08, "learning_rate": 4.963000424071008e-06, "loss": 0.9523, "step": 4410 }, { "epoch": 0.08, "learning_rate": 4.962974234272167e-06, "loss": 0.853, "step": 4411 }, { "epoch": 0.08, "learning_rate": 4.9629480352766564e-06, "loss": 1.0173, "step": 4412 }, { "epoch": 0.08, "learning_rate": 4.962921827084573e-06, "loss": 1.0404, "step": 4413 }, { "epoch": 0.08, "learning_rate": 4.9628956096960155e-06, "loss": 0.8823, "step": 4414 }, { "epoch": 0.08, "learning_rate": 4.962869383111081e-06, "loss": 0.9094, "step": 4415 }, { "epoch": 0.08, "learning_rate": 4.962843147329868e-06, "loss": 0.8245, "step": 4416 }, { "epoch": 0.08, "learning_rate": 4.962816902352473e-06, "loss": 1.0034, "step": 4417 }, { "epoch": 0.08, "learning_rate": 4.962790648178997e-06, "loss": 1.174, "step": 4418 }, { "epoch": 0.08, "learning_rate": 4.9627643848095345e-06, "loss": 1.0171, "step": 4419 }, { "epoch": 0.08, "learning_rate": 4.962738112244186e-06, "loss": 1.0569, "step": 4420 }, { "epoch": 0.08, "learning_rate": 4.962711830483049e-06, "loss": 0.8995, "step": 4421 }, { "epoch": 0.08, "learning_rate": 4.962685539526222e-06, "loss": 1.0253, "step": 4422 }, { "epoch": 0.08, "learning_rate": 4.962659239373802e-06, "loss": 0.8983, "step": 4423 }, { "epoch": 0.08, "learning_rate": 4.962632930025888e-06, "loss": 1.172, "step": 4424 }, { "epoch": 0.08, "learning_rate": 4.9626066114825785e-06, "loss": 1.1508, "step": 4425 }, { "epoch": 0.08, "learning_rate": 4.962580283743972e-06, "loss": 1.0773, "step": 4426 }, { "epoch": 0.08, "learning_rate": 4.962553946810164e-06, "loss": 0.9904, "step": 4427 }, { "epoch": 0.08, "learning_rate": 4.962527600681257e-06, "loss": 0.9331, "step": 4428 }, { "epoch": 0.08, "learning_rate": 4.962501245357348e-06, "loss": 0.8416, "step": 4429 }, { "epoch": 0.08, "learning_rate": 4.962474880838534e-06, "loss": 0.9442, "step": 4430 }, { "epoch": 0.08, "learning_rate": 4.962448507124914e-06, "loss": 1.2097, "step": 4431 }, { "epoch": 0.08, "learning_rate": 4.962422124216586e-06, "loss": 1.007, "step": 4432 }, { "epoch": 0.08, "learning_rate": 4.962395732113651e-06, "loss": 0.8903, "step": 4433 }, { "epoch": 0.08, "learning_rate": 4.962369330816205e-06, "loss": 0.933, "step": 4434 }, { "epoch": 0.08, "learning_rate": 4.9623429203243464e-06, "loss": 0.9009, "step": 4435 }, { "epoch": 0.08, "learning_rate": 4.962316500638177e-06, "loss": 0.9152, "step": 4436 }, { "epoch": 0.08, "learning_rate": 4.962290071757791e-06, "loss": 0.9744, "step": 4437 }, { "epoch": 0.08, "learning_rate": 4.962263633683291e-06, "loss": 1.0049, "step": 4438 }, { "epoch": 0.08, "learning_rate": 4.962237186414773e-06, "loss": 1.0311, "step": 4439 }, { "epoch": 0.08, "learning_rate": 4.962210729952338e-06, "loss": 0.9655, "step": 4440 }, { "epoch": 0.08, "learning_rate": 4.962184264296083e-06, "loss": 1.1332, "step": 4441 }, { "epoch": 0.08, "learning_rate": 4.962157789446108e-06, "loss": 0.7886, "step": 4442 }, { "epoch": 0.08, "learning_rate": 4.962131305402511e-06, "loss": 1.0914, "step": 4443 }, { "epoch": 0.08, "learning_rate": 4.96210481216539e-06, "loss": 0.869, "step": 4444 }, { "epoch": 0.08, "learning_rate": 4.962078309734847e-06, "loss": 0.756, "step": 4445 }, { "epoch": 0.08, "learning_rate": 4.962051798110978e-06, "loss": 0.9274, "step": 4446 }, { "epoch": 0.08, "learning_rate": 4.962025277293883e-06, "loss": 1.0738, "step": 4447 }, { "epoch": 0.08, "learning_rate": 4.961998747283662e-06, "loss": 0.8227, "step": 4448 }, { "epoch": 0.08, "learning_rate": 4.961972208080412e-06, "loss": 0.9934, "step": 4449 }, { "epoch": 0.08, "learning_rate": 4.9619456596842345e-06, "loss": 0.9521, "step": 4450 }, { "epoch": 0.08, "learning_rate": 4.961919102095226e-06, "loss": 0.9706, "step": 4451 }, { "epoch": 0.08, "learning_rate": 4.961892535313488e-06, "loss": 0.9491, "step": 4452 }, { "epoch": 0.08, "learning_rate": 4.961865959339119e-06, "loss": 1.0314, "step": 4453 }, { "epoch": 0.08, "learning_rate": 4.9618393741722174e-06, "loss": 1.2114, "step": 4454 }, { "epoch": 0.08, "learning_rate": 4.961812779812883e-06, "loss": 1.1433, "step": 4455 }, { "epoch": 0.08, "learning_rate": 4.961786176261215e-06, "loss": 1.2054, "step": 4456 }, { "epoch": 0.08, "learning_rate": 4.961759563517313e-06, "loss": 1.0512, "step": 4457 }, { "epoch": 0.08, "learning_rate": 4.9617329415812774e-06, "loss": 0.9634, "step": 4458 }, { "epoch": 0.08, "learning_rate": 4.961706310453205e-06, "loss": 0.971, "step": 4459 }, { "epoch": 0.08, "learning_rate": 4.961679670133197e-06, "loss": 0.879, "step": 4460 }, { "epoch": 0.08, "learning_rate": 4.961653020621353e-06, "loss": 1.072, "step": 4461 }, { "epoch": 0.08, "learning_rate": 4.961626361917772e-06, "loss": 1.092, "step": 4462 }, { "epoch": 0.08, "learning_rate": 4.961599694022554e-06, "loss": 0.7173, "step": 4463 }, { "epoch": 0.08, "learning_rate": 4.961573016935798e-06, "loss": 1.0746, "step": 4464 }, { "epoch": 0.08, "learning_rate": 4.961546330657603e-06, "loss": 1.0919, "step": 4465 }, { "epoch": 0.08, "learning_rate": 4.961519635188071e-06, "loss": 0.8145, "step": 4466 }, { "epoch": 0.08, "learning_rate": 4.961492930527299e-06, "loss": 0.8046, "step": 4467 }, { "epoch": 0.08, "learning_rate": 4.961466216675388e-06, "loss": 1.0145, "step": 4468 }, { "epoch": 0.08, "learning_rate": 4.961439493632438e-06, "loss": 0.8984, "step": 4469 }, { "epoch": 0.08, "learning_rate": 4.961412761398548e-06, "loss": 1.0262, "step": 4470 }, { "epoch": 0.08, "learning_rate": 4.961386019973818e-06, "loss": 0.9386, "step": 4471 }, { "epoch": 0.08, "learning_rate": 4.961359269358349e-06, "loss": 0.9845, "step": 4472 }, { "epoch": 0.08, "learning_rate": 4.961332509552239e-06, "loss": 0.9089, "step": 4473 }, { "epoch": 0.08, "learning_rate": 4.9613057405555896e-06, "loss": 0.9304, "step": 4474 }, { "epoch": 0.08, "learning_rate": 4.9612789623685e-06, "loss": 1.1797, "step": 4475 }, { "epoch": 0.08, "learning_rate": 4.96125217499107e-06, "loss": 1.1782, "step": 4476 }, { "epoch": 0.08, "learning_rate": 4.961225378423399e-06, "loss": 1.0204, "step": 4477 }, { "epoch": 0.08, "learning_rate": 4.9611985726655895e-06, "loss": 0.8828, "step": 4478 }, { "epoch": 0.08, "learning_rate": 4.961171757717738e-06, "loss": 0.9305, "step": 4479 }, { "epoch": 0.08, "learning_rate": 4.961144933579949e-06, "loss": 0.7894, "step": 4480 }, { "epoch": 0.08, "learning_rate": 4.961118100252319e-06, "loss": 1.0739, "step": 4481 }, { "epoch": 0.08, "learning_rate": 4.961091257734949e-06, "loss": 0.9966, "step": 4482 }, { "epoch": 0.08, "learning_rate": 4.961064406027941e-06, "loss": 0.7811, "step": 4483 }, { "epoch": 0.08, "learning_rate": 4.961037545131393e-06, "loss": 0.9345, "step": 4484 }, { "epoch": 0.08, "learning_rate": 4.961010675045406e-06, "loss": 0.8441, "step": 4485 }, { "epoch": 0.08, "learning_rate": 4.960983795770081e-06, "loss": 0.96, "step": 4486 }, { "epoch": 0.08, "learning_rate": 4.960956907305519e-06, "loss": 1.2296, "step": 4487 }, { "epoch": 0.08, "learning_rate": 4.960930009651817e-06, "loss": 1.1619, "step": 4488 }, { "epoch": 0.08, "learning_rate": 4.96090310280908e-06, "loss": 0.8463, "step": 4489 }, { "epoch": 0.08, "learning_rate": 4.960876186777405e-06, "loss": 0.7736, "step": 4490 }, { "epoch": 0.08, "learning_rate": 4.960849261556895e-06, "loss": 0.7014, "step": 4491 }, { "epoch": 0.08, "learning_rate": 4.960822327147648e-06, "loss": 0.9643, "step": 4492 }, { "epoch": 0.08, "learning_rate": 4.960795383549767e-06, "loss": 0.9474, "step": 4493 }, { "epoch": 0.08, "learning_rate": 4.96076843076335e-06, "loss": 1.1025, "step": 4494 }, { "epoch": 0.08, "learning_rate": 4.9607414687885e-06, "loss": 1.0035, "step": 4495 }, { "epoch": 0.08, "learning_rate": 4.960714497625317e-06, "loss": 1.0784, "step": 4496 }, { "epoch": 0.08, "learning_rate": 4.960687517273902e-06, "loss": 0.9011, "step": 4497 }, { "epoch": 0.08, "learning_rate": 4.960660527734354e-06, "loss": 0.9439, "step": 4498 }, { "epoch": 0.08, "learning_rate": 4.960633529006776e-06, "loss": 1.037, "step": 4499 }, { "epoch": 0.08, "learning_rate": 4.960606521091268e-06, "loss": 0.9733, "step": 4500 }, { "epoch": 0.08, "learning_rate": 4.9605795039879295e-06, "loss": 0.9383, "step": 4501 }, { "epoch": 0.08, "learning_rate": 4.960552477696863e-06, "loss": 0.824, "step": 4502 }, { "epoch": 0.08, "learning_rate": 4.960525442218169e-06, "loss": 0.9788, "step": 4503 }, { "epoch": 0.08, "learning_rate": 4.96049839755195e-06, "loss": 1.0146, "step": 4504 }, { "epoch": 0.08, "learning_rate": 4.960471343698303e-06, "loss": 1.0214, "step": 4505 }, { "epoch": 0.09, "learning_rate": 4.960444280657333e-06, "loss": 1.2019, "step": 4506 }, { "epoch": 0.09, "learning_rate": 4.960417208429139e-06, "loss": 0.9914, "step": 4507 }, { "epoch": 0.09, "learning_rate": 4.960390127013823e-06, "loss": 0.8483, "step": 4508 }, { "epoch": 0.09, "learning_rate": 4.960363036411485e-06, "loss": 0.93, "step": 4509 }, { "epoch": 0.09, "learning_rate": 4.960335936622227e-06, "loss": 0.9541, "step": 4510 }, { "epoch": 0.09, "learning_rate": 4.960308827646151e-06, "loss": 0.9387, "step": 4511 }, { "epoch": 0.09, "learning_rate": 4.960281709483356e-06, "loss": 0.9923, "step": 4512 }, { "epoch": 0.09, "learning_rate": 4.960254582133945e-06, "loss": 1.1952, "step": 4513 }, { "epoch": 0.09, "learning_rate": 4.9602274455980195e-06, "loss": 0.8536, "step": 4514 }, { "epoch": 0.09, "learning_rate": 4.9602002998756795e-06, "loss": 0.8023, "step": 4515 }, { "epoch": 0.09, "learning_rate": 4.9601731449670265e-06, "loss": 0.9367, "step": 4516 }, { "epoch": 0.09, "learning_rate": 4.960145980872163e-06, "loss": 0.8895, "step": 4517 }, { "epoch": 0.09, "learning_rate": 4.9601188075911895e-06, "loss": 1.0541, "step": 4518 }, { "epoch": 0.09, "learning_rate": 4.960091625124208e-06, "loss": 1.1996, "step": 4519 }, { "epoch": 0.09, "learning_rate": 4.96006443347132e-06, "loss": 0.8911, "step": 4520 }, { "epoch": 0.09, "learning_rate": 4.960037232632627e-06, "loss": 1.0329, "step": 4521 }, { "epoch": 0.09, "learning_rate": 4.960010022608231e-06, "loss": 0.7675, "step": 4522 }, { "epoch": 0.09, "learning_rate": 4.959982803398231e-06, "loss": 1.0787, "step": 4523 }, { "epoch": 0.09, "learning_rate": 4.959955575002732e-06, "loss": 0.9764, "step": 4524 }, { "epoch": 0.09, "learning_rate": 4.959928337421835e-06, "loss": 1.2024, "step": 4525 }, { "epoch": 0.09, "learning_rate": 4.959901090655639e-06, "loss": 0.9424, "step": 4526 }, { "epoch": 0.09, "learning_rate": 4.959873834704249e-06, "loss": 0.9354, "step": 4527 }, { "epoch": 0.09, "learning_rate": 4.9598465695677655e-06, "loss": 0.9249, "step": 4528 }, { "epoch": 0.09, "learning_rate": 4.95981929524629e-06, "loss": 0.8493, "step": 4529 }, { "epoch": 0.09, "learning_rate": 4.959792011739924e-06, "loss": 1.0652, "step": 4530 }, { "epoch": 0.09, "learning_rate": 4.959764719048772e-06, "loss": 0.8524, "step": 4531 }, { "epoch": 0.09, "learning_rate": 4.959737417172933e-06, "loss": 1.0159, "step": 4532 }, { "epoch": 0.09, "learning_rate": 4.959710106112509e-06, "loss": 0.7591, "step": 4533 }, { "epoch": 0.09, "learning_rate": 4.959682785867604e-06, "loss": 1.0156, "step": 4534 }, { "epoch": 0.09, "learning_rate": 4.959655456438318e-06, "loss": 0.8957, "step": 4535 }, { "epoch": 0.09, "learning_rate": 4.959628117824755e-06, "loss": 1.0824, "step": 4536 }, { "epoch": 0.09, "learning_rate": 4.959600770027015e-06, "loss": 1.0883, "step": 4537 }, { "epoch": 0.09, "learning_rate": 4.959573413045202e-06, "loss": 0.9114, "step": 4538 }, { "epoch": 0.09, "learning_rate": 4.959546046879417e-06, "loss": 0.8073, "step": 4539 }, { "epoch": 0.09, "learning_rate": 4.9595186715297625e-06, "loss": 1.0442, "step": 4540 }, { "epoch": 0.09, "learning_rate": 4.95949128699634e-06, "loss": 0.9753, "step": 4541 }, { "epoch": 0.09, "learning_rate": 4.959463893279253e-06, "loss": 0.9158, "step": 4542 }, { "epoch": 0.09, "learning_rate": 4.959436490378604e-06, "loss": 1.2248, "step": 4543 }, { "epoch": 0.09, "learning_rate": 4.9594090782944935e-06, "loss": 0.9612, "step": 4544 }, { "epoch": 0.09, "learning_rate": 4.959381657027025e-06, "loss": 0.8468, "step": 4545 }, { "epoch": 0.09, "learning_rate": 4.959354226576301e-06, "loss": 0.8584, "step": 4546 }, { "epoch": 0.09, "learning_rate": 4.959326786942424e-06, "loss": 0.861, "step": 4547 }, { "epoch": 0.09, "learning_rate": 4.9592993381254964e-06, "loss": 0.9744, "step": 4548 }, { "epoch": 0.09, "learning_rate": 4.959271880125619e-06, "loss": 1.1487, "step": 4549 }, { "epoch": 0.09, "learning_rate": 4.959244412942897e-06, "loss": 1.1076, "step": 4550 }, { "epoch": 0.09, "learning_rate": 4.959216936577432e-06, "loss": 0.9658, "step": 4551 }, { "epoch": 0.09, "learning_rate": 4.959189451029326e-06, "loss": 0.9902, "step": 4552 }, { "epoch": 0.09, "learning_rate": 4.959161956298681e-06, "loss": 1.0035, "step": 4553 }, { "epoch": 0.09, "learning_rate": 4.959134452385602e-06, "loss": 0.9308, "step": 4554 }, { "epoch": 0.09, "learning_rate": 4.9591069392901905e-06, "loss": 1.1959, "step": 4555 }, { "epoch": 0.09, "learning_rate": 4.959079417012548e-06, "loss": 1.0191, "step": 4556 }, { "epoch": 0.09, "learning_rate": 4.959051885552779e-06, "loss": 1.0559, "step": 4557 }, { "epoch": 0.09, "learning_rate": 4.959024344910985e-06, "loss": 1.051, "step": 4558 }, { "epoch": 0.09, "learning_rate": 4.9589967950872704e-06, "loss": 0.9738, "step": 4559 }, { "epoch": 0.09, "learning_rate": 4.958969236081736e-06, "loss": 0.7592, "step": 4560 }, { "epoch": 0.09, "learning_rate": 4.958941667894488e-06, "loss": 0.8262, "step": 4561 }, { "epoch": 0.09, "learning_rate": 4.958914090525625e-06, "loss": 1.0824, "step": 4562 }, { "epoch": 0.09, "learning_rate": 4.958886503975253e-06, "loss": 1.162, "step": 4563 }, { "epoch": 0.09, "learning_rate": 4.958858908243474e-06, "loss": 0.8477, "step": 4564 }, { "epoch": 0.09, "learning_rate": 4.9588313033303916e-06, "loss": 0.9515, "step": 4565 }, { "epoch": 0.09, "learning_rate": 4.958803689236109e-06, "loss": 0.7603, "step": 4566 }, { "epoch": 0.09, "learning_rate": 4.958776065960727e-06, "loss": 0.9541, "step": 4567 }, { "epoch": 0.09, "learning_rate": 4.9587484335043525e-06, "loss": 1.1152, "step": 4568 }, { "epoch": 0.09, "learning_rate": 4.958720791867086e-06, "loss": 0.986, "step": 4569 }, { "epoch": 0.09, "learning_rate": 4.958693141049031e-06, "loss": 1.0062, "step": 4570 }, { "epoch": 0.09, "learning_rate": 4.958665481050292e-06, "loss": 1.1091, "step": 4571 }, { "epoch": 0.09, "learning_rate": 4.958637811870971e-06, "loss": 0.9576, "step": 4572 }, { "epoch": 0.09, "learning_rate": 4.958610133511171e-06, "loss": 0.9839, "step": 4573 }, { "epoch": 0.09, "learning_rate": 4.958582445970997e-06, "loss": 0.842, "step": 4574 }, { "epoch": 0.09, "learning_rate": 4.958554749250553e-06, "loss": 1.0735, "step": 4575 }, { "epoch": 0.09, "learning_rate": 4.958527043349939e-06, "loss": 1.0408, "step": 4576 }, { "epoch": 0.09, "learning_rate": 4.958499328269261e-06, "loss": 0.9014, "step": 4577 }, { "epoch": 0.09, "learning_rate": 4.958471604008621e-06, "loss": 1.0899, "step": 4578 }, { "epoch": 0.09, "learning_rate": 4.958443870568124e-06, "loss": 0.8879, "step": 4579 }, { "epoch": 0.09, "learning_rate": 4.9584161279478735e-06, "loss": 0.7466, "step": 4580 }, { "epoch": 0.09, "learning_rate": 4.9583883761479724e-06, "loss": 1.2397, "step": 4581 }, { "epoch": 0.09, "learning_rate": 4.958360615168525e-06, "loss": 0.9435, "step": 4582 }, { "epoch": 0.09, "learning_rate": 4.958332845009633e-06, "loss": 0.8667, "step": 4583 }, { "epoch": 0.09, "learning_rate": 4.958305065671402e-06, "loss": 1.0735, "step": 4584 }, { "epoch": 0.09, "learning_rate": 4.958277277153936e-06, "loss": 0.9565, "step": 4585 }, { "epoch": 0.09, "learning_rate": 4.9582494794573375e-06, "loss": 0.9563, "step": 4586 }, { "epoch": 0.09, "learning_rate": 4.958221672581711e-06, "loss": 1.1239, "step": 4587 }, { "epoch": 0.09, "learning_rate": 4.958193856527159e-06, "loss": 1.1293, "step": 4588 }, { "epoch": 0.09, "learning_rate": 4.958166031293788e-06, "loss": 1.1859, "step": 4589 }, { "epoch": 0.09, "learning_rate": 4.9581381968816995e-06, "loss": 0.8524, "step": 4590 }, { "epoch": 0.09, "learning_rate": 4.958110353290999e-06, "loss": 1.0801, "step": 4591 }, { "epoch": 0.09, "learning_rate": 4.958082500521789e-06, "loss": 0.7877, "step": 4592 }, { "epoch": 0.09, "learning_rate": 4.958054638574176e-06, "loss": 0.9865, "step": 4593 }, { "epoch": 0.09, "learning_rate": 4.958026767448261e-06, "loss": 1.1411, "step": 4594 }, { "epoch": 0.09, "learning_rate": 4.9579988871441494e-06, "loss": 0.9833, "step": 4595 }, { "epoch": 0.09, "learning_rate": 4.957970997661945e-06, "loss": 0.7846, "step": 4596 }, { "epoch": 0.09, "learning_rate": 4.957943099001753e-06, "loss": 0.7848, "step": 4597 }, { "epoch": 0.09, "learning_rate": 4.9579151911636766e-06, "loss": 0.9213, "step": 4598 }, { "epoch": 0.09, "learning_rate": 4.95788727414782e-06, "loss": 0.9991, "step": 4599 }, { "epoch": 0.09, "learning_rate": 4.957859347954288e-06, "loss": 1.0056, "step": 4600 }, { "epoch": 0.09, "learning_rate": 4.957831412583185e-06, "loss": 0.9415, "step": 4601 }, { "epoch": 0.09, "learning_rate": 4.9578034680346145e-06, "loss": 0.9334, "step": 4602 }, { "epoch": 0.09, "learning_rate": 4.957775514308681e-06, "loss": 0.9277, "step": 4603 }, { "epoch": 0.09, "learning_rate": 4.957747551405489e-06, "loss": 0.9695, "step": 4604 }, { "epoch": 0.09, "learning_rate": 4.957719579325143e-06, "loss": 1.0569, "step": 4605 }, { "epoch": 0.09, "learning_rate": 4.957691598067748e-06, "loss": 1.2115, "step": 4606 }, { "epoch": 0.09, "learning_rate": 4.957663607633408e-06, "loss": 1.0381, "step": 4607 }, { "epoch": 0.09, "learning_rate": 4.957635608022226e-06, "loss": 0.8205, "step": 4608 }, { "epoch": 0.09, "learning_rate": 4.9576075992343095e-06, "loss": 1.1953, "step": 4609 }, { "epoch": 0.09, "learning_rate": 4.957579581269761e-06, "loss": 0.9124, "step": 4610 }, { "epoch": 0.09, "learning_rate": 4.9575515541286855e-06, "loss": 0.9431, "step": 4611 }, { "epoch": 0.09, "learning_rate": 4.957523517811188e-06, "loss": 1.0596, "step": 4612 }, { "epoch": 0.09, "learning_rate": 4.957495472317373e-06, "loss": 1.0068, "step": 4613 }, { "epoch": 0.09, "learning_rate": 4.957467417647345e-06, "loss": 0.8223, "step": 4614 }, { "epoch": 0.09, "learning_rate": 4.95743935380121e-06, "loss": 1.1216, "step": 4615 }, { "epoch": 0.09, "learning_rate": 4.957411280779071e-06, "loss": 0.7764, "step": 4616 }, { "epoch": 0.09, "learning_rate": 4.957383198581034e-06, "loss": 1.1256, "step": 4617 }, { "epoch": 0.09, "learning_rate": 4.957355107207203e-06, "loss": 1.3221, "step": 4618 }, { "epoch": 0.09, "learning_rate": 4.957327006657684e-06, "loss": 1.2861, "step": 4619 }, { "epoch": 0.09, "learning_rate": 4.957298896932581e-06, "loss": 0.9742, "step": 4620 }, { "epoch": 0.09, "learning_rate": 4.957270778031999e-06, "loss": 1.0383, "step": 4621 }, { "epoch": 0.09, "learning_rate": 4.957242649956043e-06, "loss": 0.8785, "step": 4622 }, { "epoch": 0.09, "learning_rate": 4.9572145127048185e-06, "loss": 0.9604, "step": 4623 }, { "epoch": 0.09, "learning_rate": 4.957186366278431e-06, "loss": 0.9273, "step": 4624 }, { "epoch": 0.09, "learning_rate": 4.957158210676985e-06, "loss": 0.9401, "step": 4625 }, { "epoch": 0.09, "learning_rate": 4.957130045900585e-06, "loss": 0.8744, "step": 4626 }, { "epoch": 0.09, "learning_rate": 4.957101871949337e-06, "loss": 0.7254, "step": 4627 }, { "epoch": 0.09, "learning_rate": 4.9570736888233455e-06, "loss": 0.9984, "step": 4628 }, { "epoch": 0.09, "learning_rate": 4.957045496522717e-06, "loss": 0.9559, "step": 4629 }, { "epoch": 0.09, "learning_rate": 4.957017295047555e-06, "loss": 1.0782, "step": 4630 }, { "epoch": 0.09, "learning_rate": 4.9569890843979665e-06, "loss": 1.3484, "step": 4631 }, { "epoch": 0.09, "learning_rate": 4.956960864574055e-06, "loss": 0.8606, "step": 4632 }, { "epoch": 0.09, "learning_rate": 4.956932635575928e-06, "loss": 1.0343, "step": 4633 }, { "epoch": 0.09, "learning_rate": 4.9569043974036905e-06, "loss": 1.0364, "step": 4634 }, { "epoch": 0.09, "learning_rate": 4.956876150057446e-06, "loss": 1.044, "step": 4635 }, { "epoch": 0.09, "learning_rate": 4.9568478935373015e-06, "loss": 0.9963, "step": 4636 }, { "epoch": 0.09, "learning_rate": 4.956819627843363e-06, "loss": 1.1974, "step": 4637 }, { "epoch": 0.09, "learning_rate": 4.956791352975734e-06, "loss": 0.948, "step": 4638 }, { "epoch": 0.09, "learning_rate": 4.956763068934522e-06, "loss": 0.9988, "step": 4639 }, { "epoch": 0.09, "learning_rate": 4.956734775719833e-06, "loss": 1.066, "step": 4640 }, { "epoch": 0.09, "learning_rate": 4.956706473331771e-06, "loss": 0.9386, "step": 4641 }, { "epoch": 0.09, "learning_rate": 4.956678161770443e-06, "loss": 0.8074, "step": 4642 }, { "epoch": 0.09, "learning_rate": 4.956649841035953e-06, "loss": 0.9478, "step": 4643 }, { "epoch": 0.09, "learning_rate": 4.9566215111284076e-06, "loss": 1.1237, "step": 4644 }, { "epoch": 0.09, "learning_rate": 4.956593172047914e-06, "loss": 0.9228, "step": 4645 }, { "epoch": 0.09, "learning_rate": 4.956564823794576e-06, "loss": 1.0641, "step": 4646 }, { "epoch": 0.09, "learning_rate": 4.956536466368501e-06, "loss": 1.0375, "step": 4647 }, { "epoch": 0.09, "learning_rate": 4.9565080997697934e-06, "loss": 1.0167, "step": 4648 }, { "epoch": 0.09, "learning_rate": 4.95647972399856e-06, "loss": 0.9535, "step": 4649 }, { "epoch": 0.09, "learning_rate": 4.956451339054906e-06, "loss": 0.8806, "step": 4650 }, { "epoch": 0.09, "learning_rate": 4.956422944938939e-06, "loss": 0.9959, "step": 4651 }, { "epoch": 0.09, "learning_rate": 4.9563945416507645e-06, "loss": 0.848, "step": 4652 }, { "epoch": 0.09, "learning_rate": 4.9563661291904875e-06, "loss": 0.9272, "step": 4653 }, { "epoch": 0.09, "learning_rate": 4.956337707558214e-06, "loss": 0.9694, "step": 4654 }, { "epoch": 0.09, "learning_rate": 4.956309276754051e-06, "loss": 1.1617, "step": 4655 }, { "epoch": 0.09, "learning_rate": 4.9562808367781055e-06, "loss": 1.3005, "step": 4656 }, { "epoch": 0.09, "learning_rate": 4.956252387630483e-06, "loss": 0.9972, "step": 4657 }, { "epoch": 0.09, "learning_rate": 4.956223929311287e-06, "loss": 0.9998, "step": 4658 }, { "epoch": 0.09, "learning_rate": 4.956195461820628e-06, "loss": 0.9338, "step": 4659 }, { "epoch": 0.09, "learning_rate": 4.95616698515861e-06, "loss": 0.8921, "step": 4660 }, { "epoch": 0.09, "learning_rate": 4.95613849932534e-06, "loss": 0.9412, "step": 4661 }, { "epoch": 0.09, "learning_rate": 4.956110004320924e-06, "loss": 1.2062, "step": 4662 }, { "epoch": 0.09, "learning_rate": 4.956081500145469e-06, "loss": 0.9556, "step": 4663 }, { "epoch": 0.09, "learning_rate": 4.95605298679908e-06, "loss": 0.7086, "step": 4664 }, { "epoch": 0.09, "learning_rate": 4.956024464281865e-06, "loss": 0.9041, "step": 4665 }, { "epoch": 0.09, "learning_rate": 4.95599593259393e-06, "loss": 0.8286, "step": 4666 }, { "epoch": 0.09, "learning_rate": 4.955967391735381e-06, "loss": 1.0139, "step": 4667 }, { "epoch": 0.09, "learning_rate": 4.9559388417063256e-06, "loss": 0.9919, "step": 4668 }, { "epoch": 0.09, "learning_rate": 4.95591028250687e-06, "loss": 1.2369, "step": 4669 }, { "epoch": 0.09, "learning_rate": 4.955881714137121e-06, "loss": 0.8855, "step": 4670 }, { "epoch": 0.09, "learning_rate": 4.955853136597184e-06, "loss": 0.9589, "step": 4671 }, { "epoch": 0.09, "learning_rate": 4.955824549887167e-06, "loss": 0.7958, "step": 4672 }, { "epoch": 0.09, "learning_rate": 4.9557959540071765e-06, "loss": 0.7958, "step": 4673 }, { "epoch": 0.09, "learning_rate": 4.955767348957319e-06, "loss": 1.1864, "step": 4674 }, { "epoch": 0.09, "learning_rate": 4.955738734737702e-06, "loss": 1.3278, "step": 4675 }, { "epoch": 0.09, "learning_rate": 4.955710111348432e-06, "loss": 0.883, "step": 4676 }, { "epoch": 0.09, "learning_rate": 4.955681478789615e-06, "loss": 0.8909, "step": 4677 }, { "epoch": 0.09, "learning_rate": 4.955652837061359e-06, "loss": 0.8805, "step": 4678 }, { "epoch": 0.09, "learning_rate": 4.95562418616377e-06, "loss": 1.1419, "step": 4679 }, { "epoch": 0.09, "learning_rate": 4.955595526096957e-06, "loss": 1.0417, "step": 4680 }, { "epoch": 0.09, "learning_rate": 4.955566856861025e-06, "loss": 0.9817, "step": 4681 }, { "epoch": 0.09, "learning_rate": 4.955538178456081e-06, "loss": 0.9903, "step": 4682 }, { "epoch": 0.09, "learning_rate": 4.955509490882233e-06, "loss": 0.8599, "step": 4683 }, { "epoch": 0.09, "learning_rate": 4.9554807941395875e-06, "loss": 0.8285, "step": 4684 }, { "epoch": 0.09, "learning_rate": 4.9554520882282534e-06, "loss": 0.9446, "step": 4685 }, { "epoch": 0.09, "learning_rate": 4.955423373148335e-06, "loss": 0.8682, "step": 4686 }, { "epoch": 0.09, "learning_rate": 4.955394648899941e-06, "loss": 0.9582, "step": 4687 }, { "epoch": 0.09, "learning_rate": 4.95536591548318e-06, "loss": 1.1721, "step": 4688 }, { "epoch": 0.09, "learning_rate": 4.955337172898157e-06, "loss": 0.8712, "step": 4689 }, { "epoch": 0.09, "learning_rate": 4.955308421144981e-06, "loss": 0.9732, "step": 4690 }, { "epoch": 0.09, "learning_rate": 4.955279660223758e-06, "loss": 1.0137, "step": 4691 }, { "epoch": 0.09, "learning_rate": 4.955250890134596e-06, "loss": 0.8058, "step": 4692 }, { "epoch": 0.09, "learning_rate": 4.955222110877603e-06, "loss": 1.0965, "step": 4693 }, { "epoch": 0.09, "learning_rate": 4.955193322452885e-06, "loss": 1.1077, "step": 4694 }, { "epoch": 0.09, "learning_rate": 4.955164524860551e-06, "loss": 0.8351, "step": 4695 }, { "epoch": 0.09, "learning_rate": 4.955135718100708e-06, "loss": 1.0041, "step": 4696 }, { "epoch": 0.09, "learning_rate": 4.955106902173463e-06, "loss": 0.9083, "step": 4697 }, { "epoch": 0.09, "learning_rate": 4.955078077078925e-06, "loss": 0.7561, "step": 4698 }, { "epoch": 0.09, "learning_rate": 4.9550492428172e-06, "loss": 0.9085, "step": 4699 }, { "epoch": 0.09, "learning_rate": 4.955020399388397e-06, "loss": 1.2029, "step": 4700 }, { "epoch": 0.09, "learning_rate": 4.9549915467926225e-06, "loss": 0.9966, "step": 4701 }, { "epoch": 0.09, "learning_rate": 4.954962685029985e-06, "loss": 0.9594, "step": 4702 }, { "epoch": 0.09, "learning_rate": 4.954933814100592e-06, "loss": 0.9177, "step": 4703 }, { "epoch": 0.09, "learning_rate": 4.954904934004552e-06, "loss": 0.8561, "step": 4704 }, { "epoch": 0.09, "learning_rate": 4.954876044741972e-06, "loss": 1.1292, "step": 4705 }, { "epoch": 0.09, "learning_rate": 4.95484714631296e-06, "loss": 1.1835, "step": 4706 }, { "epoch": 0.09, "learning_rate": 4.954818238717624e-06, "loss": 1.1434, "step": 4707 }, { "epoch": 0.09, "learning_rate": 4.954789321956072e-06, "loss": 0.8373, "step": 4708 }, { "epoch": 0.09, "learning_rate": 4.9547603960284115e-06, "loss": 0.8358, "step": 4709 }, { "epoch": 0.09, "learning_rate": 4.954731460934751e-06, "loss": 0.8254, "step": 4710 }, { "epoch": 0.09, "learning_rate": 4.954702516675199e-06, "loss": 0.9234, "step": 4711 }, { "epoch": 0.09, "learning_rate": 4.954673563249863e-06, "loss": 0.9818, "step": 4712 }, { "epoch": 0.09, "learning_rate": 4.954644600658851e-06, "loss": 1.0516, "step": 4713 }, { "epoch": 0.09, "learning_rate": 4.954615628902272e-06, "loss": 1.1501, "step": 4714 }, { "epoch": 0.09, "learning_rate": 4.954586647980233e-06, "loss": 0.9368, "step": 4715 }, { "epoch": 0.09, "learning_rate": 4.954557657892842e-06, "loss": 0.955, "step": 4716 }, { "epoch": 0.09, "learning_rate": 4.954528658640209e-06, "loss": 1.0175, "step": 4717 }, { "epoch": 0.09, "learning_rate": 4.95449965022244e-06, "loss": 1.1007, "step": 4718 }, { "epoch": 0.09, "learning_rate": 4.954470632639645e-06, "loss": 1.1489, "step": 4719 }, { "epoch": 0.09, "learning_rate": 4.954441605891933e-06, "loss": 0.8005, "step": 4720 }, { "epoch": 0.09, "learning_rate": 4.95441256997941e-06, "loss": 0.8887, "step": 4721 }, { "epoch": 0.09, "learning_rate": 4.954383524902186e-06, "loss": 0.9611, "step": 4722 }, { "epoch": 0.09, "learning_rate": 4.95435447066037e-06, "loss": 0.8267, "step": 4723 }, { "epoch": 0.09, "learning_rate": 4.954325407254069e-06, "loss": 1.11, "step": 4724 }, { "epoch": 0.09, "learning_rate": 4.954296334683393e-06, "loss": 1.0603, "step": 4725 }, { "epoch": 0.09, "learning_rate": 4.9542672529484486e-06, "loss": 1.0186, "step": 4726 }, { "epoch": 0.09, "learning_rate": 4.9542381620493465e-06, "loss": 1.0153, "step": 4727 }, { "epoch": 0.09, "learning_rate": 4.954209061986193e-06, "loss": 1.035, "step": 4728 }, { "epoch": 0.09, "learning_rate": 4.954179952759099e-06, "loss": 1.0689, "step": 4729 }, { "epoch": 0.09, "learning_rate": 4.954150834368172e-06, "loss": 1.0739, "step": 4730 }, { "epoch": 0.09, "learning_rate": 4.954121706813521e-06, "loss": 1.0634, "step": 4731 }, { "epoch": 0.09, "learning_rate": 4.954092570095256e-06, "loss": 0.8694, "step": 4732 }, { "epoch": 0.09, "learning_rate": 4.954063424213484e-06, "loss": 0.8996, "step": 4733 }, { "epoch": 0.09, "learning_rate": 4.954034269168314e-06, "loss": 0.8422, "step": 4734 }, { "epoch": 0.09, "learning_rate": 4.9540051049598546e-06, "loss": 0.9246, "step": 4735 }, { "epoch": 0.09, "learning_rate": 4.9539759315882165e-06, "loss": 0.8237, "step": 4736 }, { "epoch": 0.09, "learning_rate": 4.953946749053507e-06, "loss": 1.0482, "step": 4737 }, { "epoch": 0.09, "learning_rate": 4.953917557355835e-06, "loss": 0.9843, "step": 4738 }, { "epoch": 0.09, "learning_rate": 4.953888356495311e-06, "loss": 0.9118, "step": 4739 }, { "epoch": 0.09, "learning_rate": 4.953859146472043e-06, "loss": 0.728, "step": 4740 }, { "epoch": 0.09, "learning_rate": 4.95382992728614e-06, "loss": 0.9804, "step": 4741 }, { "epoch": 0.09, "learning_rate": 4.953800698937712e-06, "loss": 0.8096, "step": 4742 }, { "epoch": 0.09, "learning_rate": 4.953771461426866e-06, "loss": 1.1315, "step": 4743 }, { "epoch": 0.09, "learning_rate": 4.953742214753714e-06, "loss": 1.0447, "step": 4744 }, { "epoch": 0.09, "learning_rate": 4.953712958918363e-06, "loss": 0.9565, "step": 4745 }, { "epoch": 0.09, "learning_rate": 4.953683693920924e-06, "loss": 1.075, "step": 4746 }, { "epoch": 0.09, "learning_rate": 4.953654419761504e-06, "loss": 0.7909, "step": 4747 }, { "epoch": 0.09, "learning_rate": 4.953625136440214e-06, "loss": 0.8964, "step": 4748 }, { "epoch": 0.09, "learning_rate": 4.953595843957163e-06, "loss": 0.8724, "step": 4749 }, { "epoch": 0.09, "learning_rate": 4.9535665423124606e-06, "loss": 1.1232, "step": 4750 }, { "epoch": 0.09, "learning_rate": 4.953537231506216e-06, "loss": 1.0586, "step": 4751 }, { "epoch": 0.09, "learning_rate": 4.953507911538539e-06, "loss": 0.8796, "step": 4752 }, { "epoch": 0.09, "learning_rate": 4.953478582409538e-06, "loss": 1.0391, "step": 4753 }, { "epoch": 0.09, "learning_rate": 4.953449244119323e-06, "loss": 0.8122, "step": 4754 }, { "epoch": 0.09, "learning_rate": 4.953419896668004e-06, "loss": 1.0356, "step": 4755 }, { "epoch": 0.09, "learning_rate": 4.953390540055691e-06, "loss": 0.978, "step": 4756 }, { "epoch": 0.09, "learning_rate": 4.953361174282491e-06, "loss": 0.981, "step": 4757 }, { "epoch": 0.09, "learning_rate": 4.953331799348517e-06, "loss": 0.8696, "step": 4758 }, { "epoch": 0.09, "learning_rate": 4.953302415253877e-06, "loss": 0.8887, "step": 4759 }, { "epoch": 0.09, "learning_rate": 4.953273021998682e-06, "loss": 0.7844, "step": 4760 }, { "epoch": 0.09, "learning_rate": 4.95324361958304e-06, "loss": 0.9099, "step": 4761 }, { "epoch": 0.09, "learning_rate": 4.953214208007062e-06, "loss": 0.9999, "step": 4762 }, { "epoch": 0.09, "learning_rate": 4.953184787270857e-06, "loss": 0.9981, "step": 4763 }, { "epoch": 0.09, "learning_rate": 4.953155357374535e-06, "loss": 0.8046, "step": 4764 }, { "epoch": 0.09, "learning_rate": 4.953125918318206e-06, "loss": 0.9852, "step": 4765 }, { "epoch": 0.09, "learning_rate": 4.95309647010198e-06, "loss": 0.8729, "step": 4766 }, { "epoch": 0.09, "learning_rate": 4.953067012725968e-06, "loss": 0.8499, "step": 4767 }, { "epoch": 0.09, "learning_rate": 4.953037546190278e-06, "loss": 1.1888, "step": 4768 }, { "epoch": 0.09, "learning_rate": 4.953008070495021e-06, "loss": 0.9419, "step": 4769 }, { "epoch": 0.09, "learning_rate": 4.952978585640308e-06, "loss": 1.157, "step": 4770 }, { "epoch": 0.09, "learning_rate": 4.952949091626247e-06, "loss": 0.9089, "step": 4771 }, { "epoch": 0.09, "learning_rate": 4.95291958845295e-06, "loss": 1.0349, "step": 4772 }, { "epoch": 0.09, "learning_rate": 4.9528900761205265e-06, "loss": 0.9235, "step": 4773 }, { "epoch": 0.09, "learning_rate": 4.952860554629087e-06, "loss": 1.2134, "step": 4774 }, { "epoch": 0.09, "learning_rate": 4.9528310239787405e-06, "loss": 0.9028, "step": 4775 }, { "epoch": 0.09, "learning_rate": 4.952801484169598e-06, "loss": 0.8629, "step": 4776 }, { "epoch": 0.09, "learning_rate": 4.952771935201771e-06, "loss": 1.0002, "step": 4777 }, { "epoch": 0.09, "learning_rate": 4.952742377075368e-06, "loss": 0.9481, "step": 4778 }, { "epoch": 0.09, "learning_rate": 4.9527128097905005e-06, "loss": 0.888, "step": 4779 }, { "epoch": 0.09, "learning_rate": 4.952683233347279e-06, "loss": 0.9904, "step": 4780 }, { "epoch": 0.09, "learning_rate": 4.952653647745812e-06, "loss": 1.1746, "step": 4781 }, { "epoch": 0.09, "learning_rate": 4.9526240529862126e-06, "loss": 1.1013, "step": 4782 }, { "epoch": 0.09, "learning_rate": 4.9525944490685905e-06, "loss": 0.897, "step": 4783 }, { "epoch": 0.09, "learning_rate": 4.952564835993056e-06, "loss": 1.0063, "step": 4784 }, { "epoch": 0.09, "learning_rate": 4.952535213759718e-06, "loss": 1.0399, "step": 4785 }, { "epoch": 0.09, "learning_rate": 4.95250558236869e-06, "loss": 0.8035, "step": 4786 }, { "epoch": 0.09, "learning_rate": 4.9524759418200815e-06, "loss": 1.2028, "step": 4787 }, { "epoch": 0.09, "learning_rate": 4.952446292114003e-06, "loss": 0.9921, "step": 4788 }, { "epoch": 0.09, "learning_rate": 4.952416633250565e-06, "loss": 1.0583, "step": 4789 }, { "epoch": 0.09, "learning_rate": 4.952386965229878e-06, "loss": 1.0018, "step": 4790 }, { "epoch": 0.09, "learning_rate": 4.952357288052054e-06, "loss": 1.0114, "step": 4791 }, { "epoch": 0.09, "learning_rate": 4.952327601717202e-06, "loss": 0.7801, "step": 4792 }, { "epoch": 0.09, "learning_rate": 4.952297906225435e-06, "loss": 1.0006, "step": 4793 }, { "epoch": 0.09, "learning_rate": 4.952268201576863e-06, "loss": 1.0612, "step": 4794 }, { "epoch": 0.09, "learning_rate": 4.9522384877715955e-06, "loss": 0.9855, "step": 4795 }, { "epoch": 0.09, "learning_rate": 4.9522087648097455e-06, "loss": 0.8955, "step": 4796 }, { "epoch": 0.09, "learning_rate": 4.952179032691423e-06, "loss": 0.8312, "step": 4797 }, { "epoch": 0.09, "learning_rate": 4.952149291416739e-06, "loss": 1.0576, "step": 4798 }, { "epoch": 0.09, "learning_rate": 4.9521195409858055e-06, "loss": 0.9795, "step": 4799 }, { "epoch": 0.09, "learning_rate": 4.952089781398732e-06, "loss": 1.1836, "step": 4800 }, { "epoch": 0.09, "learning_rate": 4.95206001265563e-06, "loss": 0.8479, "step": 4801 }, { "epoch": 0.09, "learning_rate": 4.9520302347566126e-06, "loss": 0.9713, "step": 4802 }, { "epoch": 0.09, "learning_rate": 4.9520004477017895e-06, "loss": 0.8627, "step": 4803 }, { "epoch": 0.09, "learning_rate": 4.95197065149127e-06, "loss": 0.8423, "step": 4804 }, { "epoch": 0.09, "learning_rate": 4.951940846125169e-06, "loss": 1.0129, "step": 4805 }, { "epoch": 0.09, "learning_rate": 4.951911031603595e-06, "loss": 1.1676, "step": 4806 }, { "epoch": 0.09, "learning_rate": 4.951881207926661e-06, "loss": 1.0579, "step": 4807 }, { "epoch": 0.09, "learning_rate": 4.9518513750944775e-06, "loss": 0.9315, "step": 4808 }, { "epoch": 0.09, "learning_rate": 4.951821533107156e-06, "loss": 0.9214, "step": 4809 }, { "epoch": 0.09, "learning_rate": 4.951791681964808e-06, "loss": 0.9831, "step": 4810 }, { "epoch": 0.09, "learning_rate": 4.951761821667546e-06, "loss": 0.9141, "step": 4811 }, { "epoch": 0.09, "learning_rate": 4.9517319522154795e-06, "loss": 1.1445, "step": 4812 }, { "epoch": 0.09, "learning_rate": 4.951702073608722e-06, "loss": 0.9778, "step": 4813 }, { "epoch": 0.09, "learning_rate": 4.9516721858473825e-06, "loss": 0.9041, "step": 4814 }, { "epoch": 0.09, "learning_rate": 4.9516422889315756e-06, "loss": 0.8607, "step": 4815 }, { "epoch": 0.09, "learning_rate": 4.951612382861412e-06, "loss": 0.8234, "step": 4816 }, { "epoch": 0.09, "learning_rate": 4.951582467637002e-06, "loss": 0.9448, "step": 4817 }, { "epoch": 0.09, "learning_rate": 4.951552543258457e-06, "loss": 1.2227, "step": 4818 }, { "epoch": 0.09, "learning_rate": 4.951522609725892e-06, "loss": 1.0857, "step": 4819 }, { "epoch": 0.09, "learning_rate": 4.9514926670394155e-06, "loss": 0.6326, "step": 4820 }, { "epoch": 0.09, "learning_rate": 4.951462715199142e-06, "loss": 0.8577, "step": 4821 }, { "epoch": 0.09, "learning_rate": 4.951432754205181e-06, "loss": 0.8794, "step": 4822 }, { "epoch": 0.09, "learning_rate": 4.951402784057645e-06, "loss": 0.8942, "step": 4823 }, { "epoch": 0.09, "learning_rate": 4.951372804756647e-06, "loss": 1.0348, "step": 4824 }, { "epoch": 0.09, "learning_rate": 4.9513428163022966e-06, "loss": 1.064, "step": 4825 }, { "epoch": 0.09, "learning_rate": 4.951312818694709e-06, "loss": 0.9179, "step": 4826 }, { "epoch": 0.09, "learning_rate": 4.9512828119339935e-06, "loss": 0.9775, "step": 4827 }, { "epoch": 0.09, "learning_rate": 4.951252796020263e-06, "loss": 0.8972, "step": 4828 }, { "epoch": 0.09, "learning_rate": 4.951222770953631e-06, "loss": 0.8648, "step": 4829 }, { "epoch": 0.09, "learning_rate": 4.951192736734207e-06, "loss": 1.0816, "step": 4830 }, { "epoch": 0.09, "learning_rate": 4.951162693362105e-06, "loss": 1.267, "step": 4831 }, { "epoch": 0.09, "learning_rate": 4.951132640837436e-06, "loss": 1.1392, "step": 4832 }, { "epoch": 0.09, "learning_rate": 4.951102579160314e-06, "loss": 0.7768, "step": 4833 }, { "epoch": 0.09, "learning_rate": 4.951072508330849e-06, "loss": 1.1126, "step": 4834 }, { "epoch": 0.09, "learning_rate": 4.951042428349155e-06, "loss": 0.9042, "step": 4835 }, { "epoch": 0.09, "learning_rate": 4.951012339215344e-06, "loss": 0.8837, "step": 4836 }, { "epoch": 0.09, "learning_rate": 4.950982240929527e-06, "loss": 0.9087, "step": 4837 }, { "epoch": 0.09, "learning_rate": 4.950952133491819e-06, "loss": 1.0798, "step": 4838 }, { "epoch": 0.09, "learning_rate": 4.9509220169023295e-06, "loss": 0.9014, "step": 4839 }, { "epoch": 0.09, "learning_rate": 4.950891891161173e-06, "loss": 0.9954, "step": 4840 }, { "epoch": 0.09, "learning_rate": 4.950861756268461e-06, "loss": 0.9455, "step": 4841 }, { "epoch": 0.09, "learning_rate": 4.950831612224307e-06, "loss": 0.8363, "step": 4842 }, { "epoch": 0.09, "learning_rate": 4.950801459028822e-06, "loss": 1.1871, "step": 4843 }, { "epoch": 0.09, "learning_rate": 4.950771296682121e-06, "loss": 1.0809, "step": 4844 }, { "epoch": 0.09, "learning_rate": 4.950741125184313e-06, "loss": 0.7675, "step": 4845 }, { "epoch": 0.09, "learning_rate": 4.950710944535514e-06, "loss": 0.8742, "step": 4846 }, { "epoch": 0.09, "learning_rate": 4.950680754735836e-06, "loss": 0.98, "step": 4847 }, { "epoch": 0.09, "learning_rate": 4.95065055578539e-06, "loss": 0.9031, "step": 4848 }, { "epoch": 0.09, "learning_rate": 4.950620347684291e-06, "loss": 1.0858, "step": 4849 }, { "epoch": 0.09, "learning_rate": 4.95059013043265e-06, "loss": 1.0077, "step": 4850 }, { "epoch": 0.09, "learning_rate": 4.95055990403058e-06, "loss": 1.0256, "step": 4851 }, { "epoch": 0.09, "learning_rate": 4.950529668478197e-06, "loss": 0.9832, "step": 4852 }, { "epoch": 0.09, "learning_rate": 4.950499423775609e-06, "loss": 1.0062, "step": 4853 }, { "epoch": 0.09, "learning_rate": 4.950469169922933e-06, "loss": 0.8647, "step": 4854 }, { "epoch": 0.09, "learning_rate": 4.950438906920279e-06, "loss": 1.0276, "step": 4855 }, { "epoch": 0.09, "learning_rate": 4.950408634767761e-06, "loss": 1.1802, "step": 4856 }, { "epoch": 0.09, "learning_rate": 4.950378353465493e-06, "loss": 1.0192, "step": 4857 }, { "epoch": 0.09, "learning_rate": 4.950348063013587e-06, "loss": 0.7532, "step": 4858 }, { "epoch": 0.09, "learning_rate": 4.950317763412156e-06, "loss": 0.9236, "step": 4859 }, { "epoch": 0.09, "learning_rate": 4.9502874546613145e-06, "loss": 0.9886, "step": 4860 }, { "epoch": 0.09, "learning_rate": 4.950257136761174e-06, "loss": 0.7767, "step": 4861 }, { "epoch": 0.09, "learning_rate": 4.950226809711849e-06, "loss": 1.1637, "step": 4862 }, { "epoch": 0.09, "learning_rate": 4.950196473513453e-06, "loss": 0.8278, "step": 4863 }, { "epoch": 0.09, "learning_rate": 4.950166128166098e-06, "loss": 0.8616, "step": 4864 }, { "epoch": 0.09, "learning_rate": 4.950135773669897e-06, "loss": 0.9858, "step": 4865 }, { "epoch": 0.09, "learning_rate": 4.950105410024964e-06, "loss": 0.9478, "step": 4866 }, { "epoch": 0.09, "learning_rate": 4.950075037231413e-06, "loss": 0.9192, "step": 4867 }, { "epoch": 0.09, "learning_rate": 4.950044655289357e-06, "loss": 1.2024, "step": 4868 }, { "epoch": 0.09, "learning_rate": 4.95001426419891e-06, "loss": 1.0638, "step": 4869 }, { "epoch": 0.09, "learning_rate": 4.9499838639601835e-06, "loss": 1.0963, "step": 4870 }, { "epoch": 0.09, "learning_rate": 4.949953454573294e-06, "loss": 0.9112, "step": 4871 }, { "epoch": 0.09, "learning_rate": 4.949923036038352e-06, "loss": 1.0158, "step": 4872 }, { "epoch": 0.09, "learning_rate": 4.949892608355474e-06, "loss": 0.8436, "step": 4873 }, { "epoch": 0.09, "learning_rate": 4.949862171524771e-06, "loss": 1.2388, "step": 4874 }, { "epoch": 0.09, "learning_rate": 4.949831725546358e-06, "loss": 1.1884, "step": 4875 }, { "epoch": 0.09, "learning_rate": 4.949801270420348e-06, "loss": 1.0687, "step": 4876 }, { "epoch": 0.09, "learning_rate": 4.949770806146855e-06, "loss": 0.9034, "step": 4877 }, { "epoch": 0.09, "learning_rate": 4.949740332725994e-06, "loss": 0.9843, "step": 4878 }, { "epoch": 0.09, "learning_rate": 4.949709850157877e-06, "loss": 1.0312, "step": 4879 }, { "epoch": 0.09, "learning_rate": 4.949679358442618e-06, "loss": 0.8073, "step": 4880 }, { "epoch": 0.09, "learning_rate": 4.9496488575803324e-06, "loss": 1.2829, "step": 4881 }, { "epoch": 0.09, "learning_rate": 4.949618347571134e-06, "loss": 0.8911, "step": 4882 }, { "epoch": 0.09, "learning_rate": 4.949587828415134e-06, "loss": 0.9706, "step": 4883 }, { "epoch": 0.09, "learning_rate": 4.949557300112448e-06, "loss": 0.9467, "step": 4884 }, { "epoch": 0.09, "learning_rate": 4.949526762663191e-06, "loss": 0.9901, "step": 4885 }, { "epoch": 0.09, "learning_rate": 4.949496216067477e-06, "loss": 0.9347, "step": 4886 }, { "epoch": 0.09, "learning_rate": 4.9494656603254175e-06, "loss": 1.1706, "step": 4887 }, { "epoch": 0.09, "learning_rate": 4.9494350954371295e-06, "loss": 1.053, "step": 4888 }, { "epoch": 0.09, "learning_rate": 4.949404521402725e-06, "loss": 0.7992, "step": 4889 }, { "epoch": 0.09, "learning_rate": 4.94937393822232e-06, "loss": 0.9871, "step": 4890 }, { "epoch": 0.09, "learning_rate": 4.949343345896027e-06, "loss": 0.8646, "step": 4891 }, { "epoch": 0.09, "learning_rate": 4.949312744423962e-06, "loss": 1.0099, "step": 4892 }, { "epoch": 0.09, "learning_rate": 4.949282133806238e-06, "loss": 0.8981, "step": 4893 }, { "epoch": 0.09, "learning_rate": 4.949251514042969e-06, "loss": 0.9966, "step": 4894 }, { "epoch": 0.09, "learning_rate": 4.94922088513427e-06, "loss": 1.028, "step": 4895 }, { "epoch": 0.09, "learning_rate": 4.949190247080256e-06, "loss": 0.8176, "step": 4896 }, { "epoch": 0.09, "learning_rate": 4.949159599881041e-06, "loss": 1.0092, "step": 4897 }, { "epoch": 0.09, "learning_rate": 4.949128943536739e-06, "loss": 0.9052, "step": 4898 }, { "epoch": 0.09, "learning_rate": 4.949098278047464e-06, "loss": 0.9781, "step": 4899 }, { "epoch": 0.09, "learning_rate": 4.949067603413331e-06, "loss": 1.1964, "step": 4900 }, { "epoch": 0.09, "learning_rate": 4.949036919634455e-06, "loss": 0.8917, "step": 4901 }, { "epoch": 0.09, "learning_rate": 4.94900622671095e-06, "loss": 1.1453, "step": 4902 }, { "epoch": 0.09, "learning_rate": 4.948975524642931e-06, "loss": 0.977, "step": 4903 }, { "epoch": 0.09, "learning_rate": 4.948944813430513e-06, "loss": 0.9042, "step": 4904 }, { "epoch": 0.09, "learning_rate": 4.948914093073809e-06, "loss": 0.7235, "step": 4905 }, { "epoch": 0.09, "learning_rate": 4.948883363572936e-06, "loss": 1.1443, "step": 4906 }, { "epoch": 0.09, "learning_rate": 4.948852624928007e-06, "loss": 1.231, "step": 4907 }, { "epoch": 0.09, "learning_rate": 4.9488218771391374e-06, "loss": 0.8795, "step": 4908 }, { "epoch": 0.09, "learning_rate": 4.948791120206442e-06, "loss": 1.0024, "step": 4909 }, { "epoch": 0.09, "learning_rate": 4.9487603541300356e-06, "loss": 0.8785, "step": 4910 }, { "epoch": 0.09, "learning_rate": 4.948729578910034e-06, "loss": 0.8561, "step": 4911 }, { "epoch": 0.09, "learning_rate": 4.94869879454655e-06, "loss": 0.9777, "step": 4912 }, { "epoch": 0.09, "learning_rate": 4.9486680010397005e-06, "loss": 1.0, "step": 4913 }, { "epoch": 0.09, "learning_rate": 4.9486371983895996e-06, "loss": 0.9423, "step": 4914 }, { "epoch": 0.09, "learning_rate": 4.948606386596362e-06, "loss": 0.8023, "step": 4915 }, { "epoch": 0.09, "learning_rate": 4.948575565660104e-06, "loss": 1.0822, "step": 4916 }, { "epoch": 0.09, "learning_rate": 4.948544735580939e-06, "loss": 0.9155, "step": 4917 }, { "epoch": 0.09, "learning_rate": 4.948513896358984e-06, "loss": 1.1926, "step": 4918 }, { "epoch": 0.09, "learning_rate": 4.9484830479943525e-06, "loss": 1.2672, "step": 4919 }, { "epoch": 0.09, "learning_rate": 4.9484521904871606e-06, "loss": 1.0552, "step": 4920 }, { "epoch": 0.09, "learning_rate": 4.948421323837524e-06, "loss": 1.1783, "step": 4921 }, { "epoch": 0.09, "learning_rate": 4.948390448045556e-06, "loss": 0.8681, "step": 4922 }, { "epoch": 0.09, "learning_rate": 4.948359563111374e-06, "loss": 1.0189, "step": 4923 }, { "epoch": 0.09, "learning_rate": 4.948328669035092e-06, "loss": 0.9642, "step": 4924 }, { "epoch": 0.09, "learning_rate": 4.948297765816826e-06, "loss": 1.0477, "step": 4925 }, { "epoch": 0.09, "learning_rate": 4.948266853456691e-06, "loss": 0.8011, "step": 4926 }, { "epoch": 0.09, "learning_rate": 4.948235931954804e-06, "loss": 1.0615, "step": 4927 }, { "epoch": 0.09, "learning_rate": 4.948205001311277e-06, "loss": 1.158, "step": 4928 }, { "epoch": 0.09, "learning_rate": 4.948174061526229e-06, "loss": 0.917, "step": 4929 }, { "epoch": 0.09, "learning_rate": 4.948143112599773e-06, "loss": 1.1715, "step": 4930 }, { "epoch": 0.09, "learning_rate": 4.948112154532026e-06, "loss": 1.1888, "step": 4931 }, { "epoch": 0.09, "learning_rate": 4.948081187323104e-06, "loss": 0.91, "step": 4932 }, { "epoch": 0.09, "learning_rate": 4.948050210973121e-06, "loss": 0.9726, "step": 4933 }, { "epoch": 0.09, "learning_rate": 4.948019225482194e-06, "loss": 0.6988, "step": 4934 }, { "epoch": 0.09, "learning_rate": 4.947988230850439e-06, "loss": 0.9811, "step": 4935 }, { "epoch": 0.09, "learning_rate": 4.947957227077971e-06, "loss": 0.9621, "step": 4936 }, { "epoch": 0.09, "learning_rate": 4.947926214164904e-06, "loss": 1.0519, "step": 4937 }, { "epoch": 0.09, "learning_rate": 4.947895192111357e-06, "loss": 1.0269, "step": 4938 }, { "epoch": 0.09, "learning_rate": 4.947864160917444e-06, "loss": 1.0601, "step": 4939 }, { "epoch": 0.09, "learning_rate": 4.947833120583282e-06, "loss": 0.9622, "step": 4940 }, { "epoch": 0.09, "learning_rate": 4.947802071108985e-06, "loss": 0.8726, "step": 4941 }, { "epoch": 0.09, "learning_rate": 4.947771012494671e-06, "loss": 0.9498, "step": 4942 }, { "epoch": 0.09, "learning_rate": 4.947739944740454e-06, "loss": 0.9522, "step": 4943 }, { "epoch": 0.09, "learning_rate": 4.947708867846452e-06, "loss": 1.0871, "step": 4944 }, { "epoch": 0.09, "learning_rate": 4.9476777818127805e-06, "loss": 0.9872, "step": 4945 }, { "epoch": 0.09, "learning_rate": 4.947646686639555e-06, "loss": 0.8777, "step": 4946 }, { "epoch": 0.09, "learning_rate": 4.947615582326891e-06, "loss": 1.0398, "step": 4947 }, { "epoch": 0.09, "learning_rate": 4.947584468874906e-06, "loss": 0.7435, "step": 4948 }, { "epoch": 0.09, "learning_rate": 4.947553346283715e-06, "loss": 1.0596, "step": 4949 }, { "epoch": 0.09, "learning_rate": 4.947522214553436e-06, "loss": 1.3993, "step": 4950 }, { "epoch": 0.09, "learning_rate": 4.947491073684184e-06, "loss": 1.0686, "step": 4951 }, { "epoch": 0.09, "learning_rate": 4.947459923676075e-06, "loss": 0.8162, "step": 4952 }, { "epoch": 0.09, "learning_rate": 4.947428764529225e-06, "loss": 0.9173, "step": 4953 }, { "epoch": 0.09, "learning_rate": 4.947397596243752e-06, "loss": 1.0324, "step": 4954 }, { "epoch": 0.09, "learning_rate": 4.947366418819771e-06, "loss": 1.0184, "step": 4955 }, { "epoch": 0.09, "learning_rate": 4.947335232257399e-06, "loss": 1.1003, "step": 4956 }, { "epoch": 0.09, "learning_rate": 4.947304036556752e-06, "loss": 1.0432, "step": 4957 }, { "epoch": 0.09, "learning_rate": 4.947272831717947e-06, "loss": 1.0199, "step": 4958 }, { "epoch": 0.09, "learning_rate": 4.9472416177411e-06, "loss": 0.96, "step": 4959 }, { "epoch": 0.09, "learning_rate": 4.947210394626328e-06, "loss": 0.858, "step": 4960 }, { "epoch": 0.09, "learning_rate": 4.947179162373748e-06, "loss": 0.958, "step": 4961 }, { "epoch": 0.09, "learning_rate": 4.947147920983475e-06, "loss": 1.1796, "step": 4962 }, { "epoch": 0.09, "learning_rate": 4.947116670455628e-06, "loss": 1.1117, "step": 4963 }, { "epoch": 0.09, "learning_rate": 4.947085410790321e-06, "loss": 0.7874, "step": 4964 }, { "epoch": 0.09, "learning_rate": 4.947054141987673e-06, "loss": 0.9902, "step": 4965 }, { "epoch": 0.09, "learning_rate": 4.947022864047799e-06, "loss": 0.9799, "step": 4966 }, { "epoch": 0.09, "learning_rate": 4.946991576970818e-06, "loss": 0.7815, "step": 4967 }, { "epoch": 0.09, "learning_rate": 4.9469602807568436e-06, "loss": 1.1279, "step": 4968 }, { "epoch": 0.09, "learning_rate": 4.946928975405996e-06, "loss": 1.2061, "step": 4969 }, { "epoch": 0.09, "learning_rate": 4.946897660918391e-06, "loss": 0.8162, "step": 4970 }, { "epoch": 0.09, "learning_rate": 4.946866337294144e-06, "loss": 0.9519, "step": 4971 }, { "epoch": 0.09, "learning_rate": 4.946835004533373e-06, "loss": 1.0339, "step": 4972 }, { "epoch": 0.09, "learning_rate": 4.946803662636196e-06, "loss": 0.9762, "step": 4973 }, { "epoch": 0.09, "learning_rate": 4.946772311602729e-06, "loss": 0.9642, "step": 4974 }, { "epoch": 0.09, "learning_rate": 4.946740951433089e-06, "loss": 1.0475, "step": 4975 }, { "epoch": 0.09, "learning_rate": 4.946709582127393e-06, "loss": 1.0259, "step": 4976 }, { "epoch": 0.09, "learning_rate": 4.946678203685759e-06, "loss": 0.878, "step": 4977 }, { "epoch": 0.09, "learning_rate": 4.946646816108303e-06, "loss": 1.1163, "step": 4978 }, { "epoch": 0.09, "learning_rate": 4.946615419395143e-06, "loss": 0.8519, "step": 4979 }, { "epoch": 0.09, "learning_rate": 4.946584013546397e-06, "loss": 1.1163, "step": 4980 }, { "epoch": 0.09, "learning_rate": 4.9465525985621796e-06, "loss": 1.2224, "step": 4981 }, { "epoch": 0.09, "learning_rate": 4.946521174442611e-06, "loss": 0.8473, "step": 4982 }, { "epoch": 0.09, "learning_rate": 4.9464897411878075e-06, "loss": 0.8562, "step": 4983 }, { "epoch": 0.09, "learning_rate": 4.946458298797886e-06, "loss": 1.0123, "step": 4984 }, { "epoch": 0.09, "learning_rate": 4.946426847272963e-06, "loss": 1.0857, "step": 4985 }, { "epoch": 0.09, "learning_rate": 4.9463953866131584e-06, "loss": 0.9745, "step": 4986 }, { "epoch": 0.09, "learning_rate": 4.946363916818589e-06, "loss": 1.0466, "step": 4987 }, { "epoch": 0.09, "learning_rate": 4.94633243788937e-06, "loss": 0.8188, "step": 4988 }, { "epoch": 0.09, "learning_rate": 4.946300949825623e-06, "loss": 1.0826, "step": 4989 }, { "epoch": 0.09, "learning_rate": 4.946269452627461e-06, "loss": 1.0163, "step": 4990 }, { "epoch": 0.09, "learning_rate": 4.946237946295005e-06, "loss": 1.2715, "step": 4991 }, { "epoch": 0.09, "learning_rate": 4.946206430828372e-06, "loss": 0.9893, "step": 4992 }, { "epoch": 0.09, "learning_rate": 4.946174906227678e-06, "loss": 1.1663, "step": 4993 }, { "epoch": 0.09, "learning_rate": 4.946143372493043e-06, "loss": 1.0223, "step": 4994 }, { "epoch": 0.09, "learning_rate": 4.946111829624582e-06, "loss": 0.8358, "step": 4995 }, { "epoch": 0.09, "learning_rate": 4.946080277622416e-06, "loss": 0.8801, "step": 4996 }, { "epoch": 0.09, "learning_rate": 4.946048716486661e-06, "loss": 0.9301, "step": 4997 }, { "epoch": 0.09, "learning_rate": 4.946017146217435e-06, "loss": 1.0687, "step": 4998 }, { "epoch": 0.09, "learning_rate": 4.945985566814856e-06, "loss": 1.1654, "step": 4999 }, { "epoch": 0.09, "learning_rate": 4.945953978279041e-06, "loss": 1.4332, "step": 5000 }, { "epoch": 0.09, "learning_rate": 4.94592238061011e-06, "loss": 1.0079, "step": 5001 }, { "epoch": 0.09, "learning_rate": 4.945890773808179e-06, "loss": 0.8963, "step": 5002 }, { "epoch": 0.09, "learning_rate": 4.9458591578733675e-06, "loss": 0.8911, "step": 5003 }, { "epoch": 0.09, "learning_rate": 4.945827532805792e-06, "loss": 0.8807, "step": 5004 }, { "epoch": 0.09, "learning_rate": 4.945795898605573e-06, "loss": 1.1611, "step": 5005 }, { "epoch": 0.09, "learning_rate": 4.945764255272826e-06, "loss": 1.2053, "step": 5006 }, { "epoch": 0.09, "learning_rate": 4.94573260280767e-06, "loss": 1.0887, "step": 5007 }, { "epoch": 0.09, "learning_rate": 4.945700941210224e-06, "loss": 1.0096, "step": 5008 }, { "epoch": 0.09, "learning_rate": 4.945669270480606e-06, "loss": 0.9457, "step": 5009 }, { "epoch": 0.09, "learning_rate": 4.945637590618934e-06, "loss": 0.781, "step": 5010 }, { "epoch": 0.09, "learning_rate": 4.945605901625325e-06, "loss": 1.1244, "step": 5011 }, { "epoch": 0.09, "learning_rate": 4.9455742034999e-06, "loss": 1.1567, "step": 5012 }, { "epoch": 0.09, "learning_rate": 4.945542496242774e-06, "loss": 0.9818, "step": 5013 }, { "epoch": 0.09, "learning_rate": 4.945510779854069e-06, "loss": 0.8774, "step": 5014 }, { "epoch": 0.09, "learning_rate": 4.945479054333901e-06, "loss": 1.0649, "step": 5015 }, { "epoch": 0.09, "learning_rate": 4.9454473196823896e-06, "loss": 1.0219, "step": 5016 }, { "epoch": 0.09, "learning_rate": 4.945415575899653e-06, "loss": 0.9477, "step": 5017 }, { "epoch": 0.09, "learning_rate": 4.945383822985809e-06, "loss": 1.2687, "step": 5018 }, { "epoch": 0.09, "learning_rate": 4.945352060940977e-06, "loss": 0.9393, "step": 5019 }, { "epoch": 0.09, "learning_rate": 4.945320289765276e-06, "loss": 0.7926, "step": 5020 }, { "epoch": 0.09, "learning_rate": 4.945288509458823e-06, "loss": 1.0048, "step": 5021 }, { "epoch": 0.09, "learning_rate": 4.945256720021739e-06, "loss": 0.8297, "step": 5022 }, { "epoch": 0.09, "learning_rate": 4.945224921454141e-06, "loss": 0.7521, "step": 5023 }, { "epoch": 0.09, "learning_rate": 4.945193113756147e-06, "loss": 0.8883, "step": 5024 }, { "epoch": 0.09, "learning_rate": 4.945161296927877e-06, "loss": 1.1931, "step": 5025 }, { "epoch": 0.09, "learning_rate": 4.94512947096945e-06, "loss": 0.895, "step": 5026 }, { "epoch": 0.09, "learning_rate": 4.945097635880986e-06, "loss": 0.7456, "step": 5027 }, { "epoch": 0.09, "learning_rate": 4.9450657916626e-06, "loss": 0.808, "step": 5028 }, { "epoch": 0.09, "learning_rate": 4.9450339383144146e-06, "loss": 0.9475, "step": 5029 }, { "epoch": 0.09, "learning_rate": 4.945002075836548e-06, "loss": 1.0184, "step": 5030 }, { "epoch": 0.09, "learning_rate": 4.944970204229117e-06, "loss": 1.1376, "step": 5031 }, { "epoch": 0.09, "learning_rate": 4.944938323492243e-06, "loss": 0.9782, "step": 5032 }, { "epoch": 0.09, "learning_rate": 4.944906433626045e-06, "loss": 0.7682, "step": 5033 }, { "epoch": 0.09, "learning_rate": 4.944874534630641e-06, "loss": 1.024, "step": 5034 }, { "epoch": 0.09, "learning_rate": 4.94484262650615e-06, "loss": 1.028, "step": 5035 }, { "epoch": 0.1, "learning_rate": 4.944810709252692e-06, "loss": 0.9481, "step": 5036 }, { "epoch": 0.1, "learning_rate": 4.944778782870386e-06, "loss": 1.2234, "step": 5037 }, { "epoch": 0.1, "learning_rate": 4.94474684735935e-06, "loss": 0.9918, "step": 5038 }, { "epoch": 0.1, "learning_rate": 4.944714902719705e-06, "loss": 0.9088, "step": 5039 }, { "epoch": 0.1, "learning_rate": 4.944682948951569e-06, "loss": 0.9638, "step": 5040 }, { "epoch": 0.1, "learning_rate": 4.9446509860550615e-06, "loss": 0.6526, "step": 5041 }, { "epoch": 0.1, "learning_rate": 4.944619014030303e-06, "loss": 0.8925, "step": 5042 }, { "epoch": 0.1, "learning_rate": 4.944587032877412e-06, "loss": 1.1694, "step": 5043 }, { "epoch": 0.1, "learning_rate": 4.944555042596508e-06, "loss": 1.1271, "step": 5044 }, { "epoch": 0.1, "learning_rate": 4.94452304318771e-06, "loss": 1.0466, "step": 5045 }, { "epoch": 0.1, "learning_rate": 4.944491034651138e-06, "loss": 0.9694, "step": 5046 }, { "epoch": 0.1, "learning_rate": 4.944459016986911e-06, "loss": 0.996, "step": 5047 }, { "epoch": 0.1, "learning_rate": 4.94442699019515e-06, "loss": 0.7535, "step": 5048 }, { "epoch": 0.1, "learning_rate": 4.944394954275973e-06, "loss": 1.0408, "step": 5049 }, { "epoch": 0.1, "learning_rate": 4.944362909229501e-06, "loss": 1.1461, "step": 5050 }, { "epoch": 0.1, "learning_rate": 4.944330855055852e-06, "loss": 0.7784, "step": 5051 }, { "epoch": 0.1, "learning_rate": 4.944298791755147e-06, "loss": 0.9828, "step": 5052 }, { "epoch": 0.1, "learning_rate": 4.944266719327504e-06, "loss": 0.9959, "step": 5053 }, { "epoch": 0.1, "learning_rate": 4.944234637773046e-06, "loss": 0.8403, "step": 5054 }, { "epoch": 0.1, "learning_rate": 4.944202547091889e-06, "loss": 0.976, "step": 5055 }, { "epoch": 0.1, "learning_rate": 4.944170447284156e-06, "loss": 1.195, "step": 5056 }, { "epoch": 0.1, "learning_rate": 4.944138338349964e-06, "loss": 0.9242, "step": 5057 }, { "epoch": 0.1, "learning_rate": 4.944106220289435e-06, "loss": 1.0037, "step": 5058 }, { "epoch": 0.1, "learning_rate": 4.944074093102689e-06, "loss": 0.9325, "step": 5059 }, { "epoch": 0.1, "learning_rate": 4.944041956789844e-06, "loss": 0.9269, "step": 5060 }, { "epoch": 0.1, "learning_rate": 4.944009811351023e-06, "loss": 0.9222, "step": 5061 }, { "epoch": 0.1, "learning_rate": 4.943977656786344e-06, "loss": 1.1782, "step": 5062 }, { "epoch": 0.1, "learning_rate": 4.9439454930959264e-06, "loss": 0.7943, "step": 5063 }, { "epoch": 0.1, "learning_rate": 4.943913320279891e-06, "loss": 0.9533, "step": 5064 }, { "epoch": 0.1, "learning_rate": 4.9438811383383585e-06, "loss": 0.8185, "step": 5065 }, { "epoch": 0.1, "learning_rate": 4.943848947271449e-06, "loss": 0.9101, "step": 5066 }, { "epoch": 0.1, "learning_rate": 4.943816747079283e-06, "loss": 1.0353, "step": 5067 }, { "epoch": 0.1, "learning_rate": 4.94378453776198e-06, "loss": 1.088, "step": 5068 }, { "epoch": 0.1, "learning_rate": 4.9437523193196604e-06, "loss": 1.1174, "step": 5069 }, { "epoch": 0.1, "learning_rate": 4.943720091752444e-06, "loss": 0.9711, "step": 5070 }, { "epoch": 0.1, "learning_rate": 4.943687855060452e-06, "loss": 0.7299, "step": 5071 }, { "epoch": 0.1, "learning_rate": 4.943655609243805e-06, "loss": 1.0672, "step": 5072 }, { "epoch": 0.1, "learning_rate": 4.943623354302622e-06, "loss": 0.8787, "step": 5073 }, { "epoch": 0.1, "learning_rate": 4.943591090237025e-06, "loss": 1.0582, "step": 5074 }, { "epoch": 0.1, "learning_rate": 4.9435588170471336e-06, "loss": 1.1998, "step": 5075 }, { "epoch": 0.1, "learning_rate": 4.943526534733068e-06, "loss": 1.2186, "step": 5076 }, { "epoch": 0.1, "learning_rate": 4.943494243294949e-06, "loss": 0.8268, "step": 5077 }, { "epoch": 0.1, "learning_rate": 4.943461942732899e-06, "loss": 1.0569, "step": 5078 }, { "epoch": 0.1, "learning_rate": 4.943429633047036e-06, "loss": 0.9694, "step": 5079 }, { "epoch": 0.1, "learning_rate": 4.943397314237482e-06, "loss": 1.0607, "step": 5080 }, { "epoch": 0.1, "learning_rate": 4.943364986304357e-06, "loss": 1.0659, "step": 5081 }, { "epoch": 0.1, "learning_rate": 4.943332649247782e-06, "loss": 1.0276, "step": 5082 }, { "epoch": 0.1, "learning_rate": 4.943300303067878e-06, "loss": 0.8553, "step": 5083 }, { "epoch": 0.1, "learning_rate": 4.943267947764765e-06, "loss": 1.1326, "step": 5084 }, { "epoch": 0.1, "learning_rate": 4.943235583338566e-06, "loss": 0.923, "step": 5085 }, { "epoch": 0.1, "learning_rate": 4.943203209789399e-06, "loss": 0.9077, "step": 5086 }, { "epoch": 0.1, "learning_rate": 4.943170827117386e-06, "loss": 1.0468, "step": 5087 }, { "epoch": 0.1, "learning_rate": 4.943138435322648e-06, "loss": 1.1799, "step": 5088 }, { "epoch": 0.1, "learning_rate": 4.943106034405307e-06, "loss": 0.7342, "step": 5089 }, { "epoch": 0.1, "learning_rate": 4.943073624365482e-06, "loss": 0.9209, "step": 5090 }, { "epoch": 0.1, "learning_rate": 4.943041205203296e-06, "loss": 0.8588, "step": 5091 }, { "epoch": 0.1, "learning_rate": 4.943008776918868e-06, "loss": 1.075, "step": 5092 }, { "epoch": 0.1, "learning_rate": 4.94297633951232e-06, "loss": 1.149, "step": 5093 }, { "epoch": 0.1, "learning_rate": 4.942943892983774e-06, "loss": 0.8713, "step": 5094 }, { "epoch": 0.1, "learning_rate": 4.94291143733335e-06, "loss": 0.9422, "step": 5095 }, { "epoch": 0.1, "learning_rate": 4.9428789725611704e-06, "loss": 0.8385, "step": 5096 }, { "epoch": 0.1, "learning_rate": 4.942846498667354e-06, "loss": 0.9153, "step": 5097 }, { "epoch": 0.1, "learning_rate": 4.942814015652026e-06, "loss": 0.9032, "step": 5098 }, { "epoch": 0.1, "learning_rate": 4.942781523515303e-06, "loss": 0.8961, "step": 5099 }, { "epoch": 0.1, "learning_rate": 4.94274902225731e-06, "loss": 1.2374, "step": 5100 }, { "epoch": 0.1, "learning_rate": 4.942716511878166e-06, "loss": 0.9413, "step": 5101 }, { "epoch": 0.1, "learning_rate": 4.942683992377995e-06, "loss": 1.0359, "step": 5102 }, { "epoch": 0.1, "learning_rate": 4.942651463756915e-06, "loss": 0.9667, "step": 5103 }, { "epoch": 0.1, "learning_rate": 4.942618926015051e-06, "loss": 0.9006, "step": 5104 }, { "epoch": 0.1, "learning_rate": 4.9425863791525216e-06, "loss": 0.9142, "step": 5105 }, { "epoch": 0.1, "learning_rate": 4.942553823169451e-06, "loss": 1.0751, "step": 5106 }, { "epoch": 0.1, "learning_rate": 4.942521258065959e-06, "loss": 0.8479, "step": 5107 }, { "epoch": 0.1, "learning_rate": 4.942488683842166e-06, "loss": 0.883, "step": 5108 }, { "epoch": 0.1, "learning_rate": 4.942456100498196e-06, "loss": 1.004, "step": 5109 }, { "epoch": 0.1, "learning_rate": 4.942423508034171e-06, "loss": 1.069, "step": 5110 }, { "epoch": 0.1, "learning_rate": 4.942390906450209e-06, "loss": 0.9069, "step": 5111 }, { "epoch": 0.1, "learning_rate": 4.942358295746436e-06, "loss": 0.9813, "step": 5112 }, { "epoch": 0.1, "learning_rate": 4.942325675922972e-06, "loss": 1.0883, "step": 5113 }, { "epoch": 0.1, "learning_rate": 4.942293046979939e-06, "loss": 0.8575, "step": 5114 }, { "epoch": 0.1, "learning_rate": 4.9422604089174574e-06, "loss": 0.9037, "step": 5115 }, { "epoch": 0.1, "learning_rate": 4.942227761735652e-06, "loss": 0.9624, "step": 5116 }, { "epoch": 0.1, "learning_rate": 4.942195105434642e-06, "loss": 0.9263, "step": 5117 }, { "epoch": 0.1, "learning_rate": 4.9421624400145495e-06, "loss": 1.2498, "step": 5118 }, { "epoch": 0.1, "learning_rate": 4.942129765475499e-06, "loss": 1.2084, "step": 5119 }, { "epoch": 0.1, "learning_rate": 4.942097081817609e-06, "loss": 0.9803, "step": 5120 }, { "epoch": 0.1, "learning_rate": 4.942064389041005e-06, "loss": 0.9246, "step": 5121 }, { "epoch": 0.1, "learning_rate": 4.942031687145807e-06, "loss": 1.0332, "step": 5122 }, { "epoch": 0.1, "learning_rate": 4.941998976132137e-06, "loss": 0.9965, "step": 5123 }, { "epoch": 0.1, "learning_rate": 4.9419662560001184e-06, "loss": 1.0393, "step": 5124 }, { "epoch": 0.1, "learning_rate": 4.941933526749872e-06, "loss": 0.9801, "step": 5125 }, { "epoch": 0.1, "learning_rate": 4.941900788381521e-06, "loss": 0.9808, "step": 5126 }, { "epoch": 0.1, "learning_rate": 4.941868040895188e-06, "loss": 0.9076, "step": 5127 }, { "epoch": 0.1, "learning_rate": 4.941835284290994e-06, "loss": 0.8889, "step": 5128 }, { "epoch": 0.1, "learning_rate": 4.941802518569062e-06, "loss": 0.8922, "step": 5129 }, { "epoch": 0.1, "learning_rate": 4.941769743729515e-06, "loss": 0.9741, "step": 5130 }, { "epoch": 0.1, "learning_rate": 4.941736959772473e-06, "loss": 1.1696, "step": 5131 }, { "epoch": 0.1, "learning_rate": 4.941704166698062e-06, "loss": 1.0944, "step": 5132 }, { "epoch": 0.1, "learning_rate": 4.941671364506401e-06, "loss": 0.9064, "step": 5133 }, { "epoch": 0.1, "learning_rate": 4.941638553197614e-06, "loss": 0.9767, "step": 5134 }, { "epoch": 0.1, "learning_rate": 4.9416057327718235e-06, "loss": 0.8309, "step": 5135 }, { "epoch": 0.1, "learning_rate": 4.941572903229153e-06, "loss": 1.0092, "step": 5136 }, { "epoch": 0.1, "learning_rate": 4.941540064569723e-06, "loss": 1.2802, "step": 5137 }, { "epoch": 0.1, "learning_rate": 4.941507216793659e-06, "loss": 1.0955, "step": 5138 }, { "epoch": 0.1, "learning_rate": 4.94147435990108e-06, "loss": 0.9193, "step": 5139 }, { "epoch": 0.1, "learning_rate": 4.9414414938921115e-06, "loss": 0.9614, "step": 5140 }, { "epoch": 0.1, "learning_rate": 4.941408618766875e-06, "loss": 0.9279, "step": 5141 }, { "epoch": 0.1, "learning_rate": 4.941375734525494e-06, "loss": 0.8043, "step": 5142 }, { "epoch": 0.1, "learning_rate": 4.941342841168091e-06, "loss": 1.1971, "step": 5143 }, { "epoch": 0.1, "learning_rate": 4.941309938694788e-06, "loss": 1.126, "step": 5144 }, { "epoch": 0.1, "learning_rate": 4.941277027105709e-06, "loss": 1.0403, "step": 5145 }, { "epoch": 0.1, "learning_rate": 4.941244106400976e-06, "loss": 0.8662, "step": 5146 }, { "epoch": 0.1, "learning_rate": 4.941211176580712e-06, "loss": 0.7154, "step": 5147 }, { "epoch": 0.1, "learning_rate": 4.941178237645041e-06, "loss": 0.7007, "step": 5148 }, { "epoch": 0.1, "learning_rate": 4.941145289594086e-06, "loss": 1.2094, "step": 5149 }, { "epoch": 0.1, "learning_rate": 4.941112332427969e-06, "loss": 1.1411, "step": 5150 }, { "epoch": 0.1, "learning_rate": 4.941079366146813e-06, "loss": 1.0127, "step": 5151 }, { "epoch": 0.1, "learning_rate": 4.941046390750741e-06, "loss": 1.1223, "step": 5152 }, { "epoch": 0.1, "learning_rate": 4.9410134062398775e-06, "loss": 0.8895, "step": 5153 }, { "epoch": 0.1, "learning_rate": 4.940980412614344e-06, "loss": 0.8927, "step": 5154 }, { "epoch": 0.1, "learning_rate": 4.940947409874265e-06, "loss": 1.0507, "step": 5155 }, { "epoch": 0.1, "learning_rate": 4.9409143980197625e-06, "loss": 1.2144, "step": 5156 }, { "epoch": 0.1, "learning_rate": 4.940881377050961e-06, "loss": 0.9376, "step": 5157 }, { "epoch": 0.1, "learning_rate": 4.940848346967983e-06, "loss": 1.0038, "step": 5158 }, { "epoch": 0.1, "learning_rate": 4.940815307770953e-06, "loss": 0.8939, "step": 5159 }, { "epoch": 0.1, "learning_rate": 4.940782259459993e-06, "loss": 0.929, "step": 5160 }, { "epoch": 0.1, "learning_rate": 4.940749202035227e-06, "loss": 0.9626, "step": 5161 }, { "epoch": 0.1, "learning_rate": 4.940716135496778e-06, "loss": 1.1577, "step": 5162 }, { "epoch": 0.1, "learning_rate": 4.94068305984477e-06, "loss": 1.2072, "step": 5163 }, { "epoch": 0.1, "learning_rate": 4.940649975079327e-06, "loss": 0.8369, "step": 5164 }, { "epoch": 0.1, "learning_rate": 4.940616881200571e-06, "loss": 0.8807, "step": 5165 }, { "epoch": 0.1, "learning_rate": 4.940583778208626e-06, "loss": 1.1608, "step": 5166 }, { "epoch": 0.1, "learning_rate": 4.940550666103616e-06, "loss": 0.9313, "step": 5167 }, { "epoch": 0.1, "learning_rate": 4.940517544885665e-06, "loss": 0.8925, "step": 5168 }, { "epoch": 0.1, "learning_rate": 4.940484414554897e-06, "loss": 1.1749, "step": 5169 }, { "epoch": 0.1, "learning_rate": 4.940451275111434e-06, "loss": 0.9499, "step": 5170 }, { "epoch": 0.1, "learning_rate": 4.940418126555401e-06, "loss": 1.0856, "step": 5171 }, { "epoch": 0.1, "learning_rate": 4.940384968886922e-06, "loss": 1.0182, "step": 5172 }, { "epoch": 0.1, "learning_rate": 4.94035180210612e-06, "loss": 0.8954, "step": 5173 }, { "epoch": 0.1, "learning_rate": 4.940318626213119e-06, "loss": 1.0637, "step": 5174 }, { "epoch": 0.1, "learning_rate": 4.940285441208044e-06, "loss": 0.937, "step": 5175 }, { "epoch": 0.1, "learning_rate": 4.940252247091017e-06, "loss": 0.8578, "step": 5176 }, { "epoch": 0.1, "learning_rate": 4.940219043862163e-06, "loss": 0.8596, "step": 5177 }, { "epoch": 0.1, "learning_rate": 4.940185831521606e-06, "loss": 0.9762, "step": 5178 }, { "epoch": 0.1, "learning_rate": 4.94015261006947e-06, "loss": 0.8416, "step": 5179 }, { "epoch": 0.1, "learning_rate": 4.940119379505879e-06, "loss": 1.1063, "step": 5180 }, { "epoch": 0.1, "learning_rate": 4.940086139830957e-06, "loss": 1.0887, "step": 5181 }, { "epoch": 0.1, "learning_rate": 4.940052891044829e-06, "loss": 0.9345, "step": 5182 }, { "epoch": 0.1, "learning_rate": 4.940019633147617e-06, "loss": 1.0729, "step": 5183 }, { "epoch": 0.1, "learning_rate": 4.939986366139448e-06, "loss": 0.8852, "step": 5184 }, { "epoch": 0.1, "learning_rate": 4.939953090020443e-06, "loss": 0.8727, "step": 5185 }, { "epoch": 0.1, "learning_rate": 4.939919804790729e-06, "loss": 0.9626, "step": 5186 }, { "epoch": 0.1, "learning_rate": 4.939886510450429e-06, "loss": 1.2165, "step": 5187 }, { "epoch": 0.1, "learning_rate": 4.939853206999667e-06, "loss": 1.0981, "step": 5188 }, { "epoch": 0.1, "learning_rate": 4.939819894438569e-06, "loss": 0.8076, "step": 5189 }, { "epoch": 0.1, "learning_rate": 4.939786572767258e-06, "loss": 1.0083, "step": 5190 }, { "epoch": 0.1, "learning_rate": 4.939753241985858e-06, "loss": 0.7321, "step": 5191 }, { "epoch": 0.1, "learning_rate": 4.939719902094495e-06, "loss": 0.9532, "step": 5192 }, { "epoch": 0.1, "learning_rate": 4.939686553093292e-06, "loss": 1.1477, "step": 5193 }, { "epoch": 0.1, "learning_rate": 4.939653194982376e-06, "loss": 1.0145, "step": 5194 }, { "epoch": 0.1, "learning_rate": 4.939619827761868e-06, "loss": 0.8333, "step": 5195 }, { "epoch": 0.1, "learning_rate": 4.939586451431895e-06, "loss": 0.9951, "step": 5196 }, { "epoch": 0.1, "learning_rate": 4.939553065992581e-06, "loss": 0.9545, "step": 5197 }, { "epoch": 0.1, "learning_rate": 4.93951967144405e-06, "loss": 0.8291, "step": 5198 }, { "epoch": 0.1, "learning_rate": 4.939486267786428e-06, "loss": 0.9836, "step": 5199 }, { "epoch": 0.1, "learning_rate": 4.939452855019839e-06, "loss": 1.2262, "step": 5200 }, { "epoch": 0.1, "learning_rate": 4.939419433144408e-06, "loss": 1.1349, "step": 5201 }, { "epoch": 0.1, "learning_rate": 4.939386002160259e-06, "loss": 0.9022, "step": 5202 }, { "epoch": 0.1, "learning_rate": 4.939352562067517e-06, "loss": 0.9694, "step": 5203 }, { "epoch": 0.1, "learning_rate": 4.939319112866309e-06, "loss": 0.9858, "step": 5204 }, { "epoch": 0.1, "learning_rate": 4.9392856545567574e-06, "loss": 0.9236, "step": 5205 }, { "epoch": 0.1, "learning_rate": 4.939252187138988e-06, "loss": 1.287, "step": 5206 }, { "epoch": 0.1, "learning_rate": 4.939218710613126e-06, "loss": 1.2739, "step": 5207 }, { "epoch": 0.1, "learning_rate": 4.939185224979295e-06, "loss": 1.0074, "step": 5208 }, { "epoch": 0.1, "learning_rate": 4.9391517302376225e-06, "loss": 1.1801, "step": 5209 }, { "epoch": 0.1, "learning_rate": 4.939118226388231e-06, "loss": 0.8748, "step": 5210 }, { "epoch": 0.1, "learning_rate": 4.939084713431248e-06, "loss": 0.8144, "step": 5211 }, { "epoch": 0.1, "learning_rate": 4.939051191366797e-06, "loss": 1.2484, "step": 5212 }, { "epoch": 0.1, "learning_rate": 4.939017660195004e-06, "loss": 0.8859, "step": 5213 }, { "epoch": 0.1, "learning_rate": 4.938984119915993e-06, "loss": 1.0699, "step": 5214 }, { "epoch": 0.1, "learning_rate": 4.93895057052989e-06, "loss": 0.8405, "step": 5215 }, { "epoch": 0.1, "learning_rate": 4.938917012036821e-06, "loss": 0.965, "step": 5216 }, { "epoch": 0.1, "learning_rate": 4.9388834444369105e-06, "loss": 0.8076, "step": 5217 }, { "epoch": 0.1, "learning_rate": 4.9388498677302845e-06, "loss": 1.0397, "step": 5218 }, { "epoch": 0.1, "learning_rate": 4.9388162819170675e-06, "loss": 1.1174, "step": 5219 }, { "epoch": 0.1, "learning_rate": 4.938782686997385e-06, "loss": 0.9524, "step": 5220 }, { "epoch": 0.1, "learning_rate": 4.938749082971363e-06, "loss": 0.7991, "step": 5221 }, { "epoch": 0.1, "learning_rate": 4.938715469839126e-06, "loss": 0.9977, "step": 5222 }, { "epoch": 0.1, "learning_rate": 4.938681847600801e-06, "loss": 0.8826, "step": 5223 }, { "epoch": 0.1, "learning_rate": 4.938648216256512e-06, "loss": 1.0906, "step": 5224 }, { "epoch": 0.1, "learning_rate": 4.938614575806386e-06, "loss": 1.148, "step": 5225 }, { "epoch": 0.1, "learning_rate": 4.938580926250548e-06, "loss": 0.8344, "step": 5226 }, { "epoch": 0.1, "learning_rate": 4.938547267589123e-06, "loss": 0.9444, "step": 5227 }, { "epoch": 0.1, "learning_rate": 4.938513599822238e-06, "loss": 0.759, "step": 5228 }, { "epoch": 0.1, "learning_rate": 4.938479922950018e-06, "loss": 0.8492, "step": 5229 }, { "epoch": 0.1, "learning_rate": 4.938446236972588e-06, "loss": 0.9838, "step": 5230 }, { "epoch": 0.1, "learning_rate": 4.9384125418900754e-06, "loss": 1.157, "step": 5231 }, { "epoch": 0.1, "learning_rate": 4.938378837702604e-06, "loss": 0.9546, "step": 5232 }, { "epoch": 0.1, "learning_rate": 4.938345124410302e-06, "loss": 0.9144, "step": 5233 }, { "epoch": 0.1, "learning_rate": 4.938311402013294e-06, "loss": 1.0942, "step": 5234 }, { "epoch": 0.1, "learning_rate": 4.938277670511705e-06, "loss": 0.9855, "step": 5235 }, { "epoch": 0.1, "learning_rate": 4.938243929905662e-06, "loss": 1.0898, "step": 5236 }, { "epoch": 0.1, "learning_rate": 4.9382101801952916e-06, "loss": 0.9903, "step": 5237 }, { "epoch": 0.1, "learning_rate": 4.938176421380719e-06, "loss": 1.0709, "step": 5238 }, { "epoch": 0.1, "learning_rate": 4.93814265346207e-06, "loss": 0.9131, "step": 5239 }, { "epoch": 0.1, "learning_rate": 4.938108876439471e-06, "loss": 1.0719, "step": 5240 }, { "epoch": 0.1, "learning_rate": 4.938075090313049e-06, "loss": 1.2809, "step": 5241 }, { "epoch": 0.1, "learning_rate": 4.938041295082929e-06, "loss": 0.9226, "step": 5242 }, { "epoch": 0.1, "learning_rate": 4.938007490749237e-06, "loss": 1.0201, "step": 5243 }, { "epoch": 0.1, "learning_rate": 4.9379736773121e-06, "loss": 1.179, "step": 5244 }, { "epoch": 0.1, "learning_rate": 4.937939854771645e-06, "loss": 0.9524, "step": 5245 }, { "epoch": 0.1, "learning_rate": 4.937906023127996e-06, "loss": 1.0234, "step": 5246 }, { "epoch": 0.1, "learning_rate": 4.937872182381282e-06, "loss": 1.019, "step": 5247 }, { "epoch": 0.1, "learning_rate": 4.937838332531627e-06, "loss": 1.0298, "step": 5248 }, { "epoch": 0.1, "learning_rate": 4.937804473579159e-06, "loss": 1.0767, "step": 5249 }, { "epoch": 0.1, "learning_rate": 4.937770605524004e-06, "loss": 1.1036, "step": 5250 }, { "epoch": 0.1, "learning_rate": 4.937736728366287e-06, "loss": 1.1064, "step": 5251 }, { "epoch": 0.1, "learning_rate": 4.937702842106137e-06, "loss": 0.9885, "step": 5252 }, { "epoch": 0.1, "learning_rate": 4.937668946743679e-06, "loss": 1.1113, "step": 5253 }, { "epoch": 0.1, "learning_rate": 4.9376350422790396e-06, "loss": 0.8331, "step": 5254 }, { "epoch": 0.1, "learning_rate": 4.937601128712346e-06, "loss": 1.1772, "step": 5255 }, { "epoch": 0.1, "learning_rate": 4.9375672060437245e-06, "loss": 1.0281, "step": 5256 }, { "epoch": 0.1, "learning_rate": 4.937533274273302e-06, "loss": 1.1115, "step": 5257 }, { "epoch": 0.1, "learning_rate": 4.9374993334012045e-06, "loss": 0.7354, "step": 5258 }, { "epoch": 0.1, "learning_rate": 4.93746538342756e-06, "loss": 0.9312, "step": 5259 }, { "epoch": 0.1, "learning_rate": 4.937431424352494e-06, "loss": 0.8539, "step": 5260 }, { "epoch": 0.1, "learning_rate": 4.937397456176134e-06, "loss": 1.0517, "step": 5261 }, { "epoch": 0.1, "learning_rate": 4.937363478898606e-06, "loss": 1.2566, "step": 5262 }, { "epoch": 0.1, "learning_rate": 4.9373294925200375e-06, "loss": 1.1223, "step": 5263 }, { "epoch": 0.1, "learning_rate": 4.937295497040556e-06, "loss": 0.7529, "step": 5264 }, { "epoch": 0.1, "learning_rate": 4.937261492460288e-06, "loss": 0.9717, "step": 5265 }, { "epoch": 0.1, "learning_rate": 4.93722747877936e-06, "loss": 1.0235, "step": 5266 }, { "epoch": 0.1, "learning_rate": 4.937193455997899e-06, "loss": 0.9492, "step": 5267 }, { "epoch": 0.1, "learning_rate": 4.937159424116033e-06, "loss": 1.1169, "step": 5268 }, { "epoch": 0.1, "learning_rate": 4.937125383133888e-06, "loss": 1.1104, "step": 5269 }, { "epoch": 0.1, "learning_rate": 4.9370913330515914e-06, "loss": 0.9172, "step": 5270 }, { "epoch": 0.1, "learning_rate": 4.937057273869271e-06, "loss": 0.9936, "step": 5271 }, { "epoch": 0.1, "learning_rate": 4.937023205587053e-06, "loss": 0.7141, "step": 5272 }, { "epoch": 0.1, "learning_rate": 4.936989128205065e-06, "loss": 0.9971, "step": 5273 }, { "epoch": 0.1, "learning_rate": 4.936955041723435e-06, "loss": 1.035, "step": 5274 }, { "epoch": 0.1, "learning_rate": 4.936920946142289e-06, "loss": 1.0427, "step": 5275 }, { "epoch": 0.1, "learning_rate": 4.936886841461755e-06, "loss": 0.9868, "step": 5276 }, { "epoch": 0.1, "learning_rate": 4.936852727681961e-06, "loss": 0.9603, "step": 5277 }, { "epoch": 0.1, "learning_rate": 4.936818604803032e-06, "loss": 1.0499, "step": 5278 }, { "epoch": 0.1, "learning_rate": 4.9367844728250985e-06, "loss": 1.0712, "step": 5279 }, { "epoch": 0.1, "learning_rate": 4.936750331748286e-06, "loss": 1.2183, "step": 5280 }, { "epoch": 0.1, "learning_rate": 4.936716181572723e-06, "loss": 1.2584, "step": 5281 }, { "epoch": 0.1, "learning_rate": 4.936682022298536e-06, "loss": 0.9769, "step": 5282 }, { "epoch": 0.1, "learning_rate": 4.936647853925852e-06, "loss": 1.02, "step": 5283 }, { "epoch": 0.1, "learning_rate": 4.936613676454801e-06, "loss": 1.0049, "step": 5284 }, { "epoch": 0.1, "learning_rate": 4.936579489885509e-06, "loss": 0.8517, "step": 5285 }, { "epoch": 0.1, "learning_rate": 4.936545294218104e-06, "loss": 0.8934, "step": 5286 }, { "epoch": 0.1, "learning_rate": 4.936511089452714e-06, "loss": 1.0246, "step": 5287 }, { "epoch": 0.1, "learning_rate": 4.936476875589465e-06, "loss": 0.9838, "step": 5288 }, { "epoch": 0.1, "learning_rate": 4.936442652628487e-06, "loss": 0.8387, "step": 5289 }, { "epoch": 0.1, "learning_rate": 4.936408420569906e-06, "loss": 0.8861, "step": 5290 }, { "epoch": 0.1, "learning_rate": 4.936374179413851e-06, "loss": 0.9093, "step": 5291 }, { "epoch": 0.1, "learning_rate": 4.93633992916045e-06, "loss": 0.8176, "step": 5292 }, { "epoch": 0.1, "learning_rate": 4.93630566980983e-06, "loss": 1.0467, "step": 5293 }, { "epoch": 0.1, "learning_rate": 4.93627140136212e-06, "loss": 1.0285, "step": 5294 }, { "epoch": 0.1, "learning_rate": 4.9362371238174465e-06, "loss": 0.9742, "step": 5295 }, { "epoch": 0.1, "learning_rate": 4.936202837175938e-06, "loss": 0.9916, "step": 5296 }, { "epoch": 0.1, "learning_rate": 4.936168541437723e-06, "loss": 0.997, "step": 5297 }, { "epoch": 0.1, "learning_rate": 4.93613423660293e-06, "loss": 0.85, "step": 5298 }, { "epoch": 0.1, "learning_rate": 4.936099922671686e-06, "loss": 0.9714, "step": 5299 }, { "epoch": 0.1, "learning_rate": 4.93606559964412e-06, "loss": 0.8195, "step": 5300 }, { "epoch": 0.1, "learning_rate": 4.936031267520359e-06, "loss": 0.974, "step": 5301 }, { "epoch": 0.1, "learning_rate": 4.935996926300532e-06, "loss": 0.8255, "step": 5302 }, { "epoch": 0.1, "learning_rate": 4.935962575984768e-06, "loss": 1.0211, "step": 5303 }, { "epoch": 0.1, "learning_rate": 4.935928216573194e-06, "loss": 0.9401, "step": 5304 }, { "epoch": 0.1, "learning_rate": 4.935893848065939e-06, "loss": 1.1494, "step": 5305 }, { "epoch": 0.1, "learning_rate": 4.93585947046313e-06, "loss": 1.0496, "step": 5306 }, { "epoch": 0.1, "learning_rate": 4.935825083764898e-06, "loss": 0.8555, "step": 5307 }, { "epoch": 0.1, "learning_rate": 4.935790687971369e-06, "loss": 0.8861, "step": 5308 }, { "epoch": 0.1, "learning_rate": 4.935756283082672e-06, "loss": 0.7988, "step": 5309 }, { "epoch": 0.1, "learning_rate": 4.9357218690989365e-06, "loss": 0.9376, "step": 5310 }, { "epoch": 0.1, "learning_rate": 4.935687446020289e-06, "loss": 1.024, "step": 5311 }, { "epoch": 0.1, "learning_rate": 4.93565301384686e-06, "loss": 1.0928, "step": 5312 }, { "epoch": 0.1, "learning_rate": 4.9356185725787774e-06, "loss": 1.0051, "step": 5313 }, { "epoch": 0.1, "learning_rate": 4.935584122216169e-06, "loss": 1.0657, "step": 5314 }, { "epoch": 0.1, "learning_rate": 4.9355496627591655e-06, "loss": 0.9947, "step": 5315 }, { "epoch": 0.1, "learning_rate": 4.9355151942078935e-06, "loss": 0.9044, "step": 5316 }, { "epoch": 0.1, "learning_rate": 4.935480716562482e-06, "loss": 0.9857, "step": 5317 }, { "epoch": 0.1, "learning_rate": 4.935446229823061e-06, "loss": 1.0722, "step": 5318 }, { "epoch": 0.1, "learning_rate": 4.9354117339897575e-06, "loss": 1.0282, "step": 5319 }, { "epoch": 0.1, "learning_rate": 4.935377229062702e-06, "loss": 1.0212, "step": 5320 }, { "epoch": 0.1, "learning_rate": 4.935342715042023e-06, "loss": 0.8054, "step": 5321 }, { "epoch": 0.1, "learning_rate": 4.935308191927848e-06, "loss": 0.9459, "step": 5322 }, { "epoch": 0.1, "learning_rate": 4.935273659720307e-06, "loss": 0.8563, "step": 5323 }, { "epoch": 0.1, "learning_rate": 4.935239118419529e-06, "loss": 1.0296, "step": 5324 }, { "epoch": 0.1, "learning_rate": 4.935204568025643e-06, "loss": 1.0936, "step": 5325 }, { "epoch": 0.1, "learning_rate": 4.9351700085387776e-06, "loss": 1.0607, "step": 5326 }, { "epoch": 0.1, "learning_rate": 4.935135439959062e-06, "loss": 0.8987, "step": 5327 }, { "epoch": 0.1, "learning_rate": 4.935100862286626e-06, "loss": 1.0957, "step": 5328 }, { "epoch": 0.1, "learning_rate": 4.935066275521597e-06, "loss": 0.8312, "step": 5329 }, { "epoch": 0.1, "learning_rate": 4.9350316796641065e-06, "loss": 1.1602, "step": 5330 }, { "epoch": 0.1, "learning_rate": 4.934997074714281e-06, "loss": 1.2445, "step": 5331 }, { "epoch": 0.1, "learning_rate": 4.934962460672252e-06, "loss": 1.0781, "step": 5332 }, { "epoch": 0.1, "learning_rate": 4.934927837538147e-06, "loss": 0.857, "step": 5333 }, { "epoch": 0.1, "learning_rate": 4.934893205312097e-06, "loss": 1.0322, "step": 5334 }, { "epoch": 0.1, "learning_rate": 4.93485856399423e-06, "loss": 1.0187, "step": 5335 }, { "epoch": 0.1, "learning_rate": 4.934823913584675e-06, "loss": 0.949, "step": 5336 }, { "epoch": 0.1, "learning_rate": 4.934789254083564e-06, "loss": 1.039, "step": 5337 }, { "epoch": 0.1, "learning_rate": 4.934754585491024e-06, "loss": 1.0676, "step": 5338 }, { "epoch": 0.1, "learning_rate": 4.934719907807184e-06, "loss": 0.9086, "step": 5339 }, { "epoch": 0.1, "learning_rate": 4.9346852210321746e-06, "loss": 0.857, "step": 5340 }, { "epoch": 0.1, "learning_rate": 4.9346505251661256e-06, "loss": 1.0138, "step": 5341 }, { "epoch": 0.1, "learning_rate": 4.934615820209167e-06, "loss": 0.9496, "step": 5342 }, { "epoch": 0.1, "learning_rate": 4.934581106161427e-06, "loss": 0.977, "step": 5343 }, { "epoch": 0.1, "learning_rate": 4.934546383023035e-06, "loss": 1.0262, "step": 5344 }, { "epoch": 0.1, "learning_rate": 4.934511650794123e-06, "loss": 0.9601, "step": 5345 }, { "epoch": 0.1, "learning_rate": 4.934476909474818e-06, "loss": 0.8492, "step": 5346 }, { "epoch": 0.1, "learning_rate": 4.934442159065251e-06, "loss": 1.0012, "step": 5347 }, { "epoch": 0.1, "learning_rate": 4.934407399565552e-06, "loss": 0.9499, "step": 5348 }, { "epoch": 0.1, "learning_rate": 4.93437263097585e-06, "loss": 1.154, "step": 5349 }, { "epoch": 0.1, "learning_rate": 4.934337853296275e-06, "loss": 1.0479, "step": 5350 }, { "epoch": 0.1, "learning_rate": 4.934303066526957e-06, "loss": 0.9957, "step": 5351 }, { "epoch": 0.1, "learning_rate": 4.934268270668027e-06, "loss": 0.766, "step": 5352 }, { "epoch": 0.1, "learning_rate": 4.934233465719614e-06, "loss": 0.9965, "step": 5353 }, { "epoch": 0.1, "learning_rate": 4.934198651681847e-06, "loss": 0.8961, "step": 5354 }, { "epoch": 0.1, "learning_rate": 4.934163828554856e-06, "loss": 0.9351, "step": 5355 }, { "epoch": 0.1, "learning_rate": 4.934128996338774e-06, "loss": 1.1957, "step": 5356 }, { "epoch": 0.1, "learning_rate": 4.934094155033727e-06, "loss": 1.1334, "step": 5357 }, { "epoch": 0.1, "learning_rate": 4.934059304639849e-06, "loss": 0.9022, "step": 5358 }, { "epoch": 0.1, "learning_rate": 4.934024445157267e-06, "loss": 1.017, "step": 5359 }, { "epoch": 0.1, "learning_rate": 4.933989576586112e-06, "loss": 0.9088, "step": 5360 }, { "epoch": 0.1, "learning_rate": 4.9339546989265154e-06, "loss": 0.8504, "step": 5361 }, { "epoch": 0.1, "learning_rate": 4.933919812178607e-06, "loss": 1.1559, "step": 5362 }, { "epoch": 0.1, "learning_rate": 4.933884916342516e-06, "loss": 0.8351, "step": 5363 }, { "epoch": 0.1, "learning_rate": 4.933850011418373e-06, "loss": 0.9, "step": 5364 }, { "epoch": 0.1, "learning_rate": 4.933815097406309e-06, "loss": 0.8453, "step": 5365 }, { "epoch": 0.1, "learning_rate": 4.933780174306454e-06, "loss": 0.8164, "step": 5366 }, { "epoch": 0.1, "learning_rate": 4.933745242118938e-06, "loss": 0.9423, "step": 5367 }, { "epoch": 0.1, "learning_rate": 4.9337103008438925e-06, "loss": 1.0995, "step": 5368 }, { "epoch": 0.1, "learning_rate": 4.933675350481447e-06, "loss": 1.1478, "step": 5369 }, { "epoch": 0.1, "learning_rate": 4.933640391031733e-06, "loss": 1.0839, "step": 5370 }, { "epoch": 0.1, "learning_rate": 4.933605422494881e-06, "loss": 0.878, "step": 5371 }, { "epoch": 0.1, "learning_rate": 4.933570444871019e-06, "loss": 0.89, "step": 5372 }, { "epoch": 0.1, "learning_rate": 4.93353545816028e-06, "loss": 0.9021, "step": 5373 }, { "epoch": 0.1, "learning_rate": 4.933500462362795e-06, "loss": 1.0381, "step": 5374 }, { "epoch": 0.1, "learning_rate": 4.933465457478694e-06, "loss": 1.0168, "step": 5375 }, { "epoch": 0.1, "learning_rate": 4.933430443508107e-06, "loss": 0.7063, "step": 5376 }, { "epoch": 0.1, "learning_rate": 4.933395420451166e-06, "loss": 0.812, "step": 5377 }, { "epoch": 0.1, "learning_rate": 4.933360388308001e-06, "loss": 0.9336, "step": 5378 }, { "epoch": 0.1, "learning_rate": 4.9333253470787414e-06, "loss": 0.8591, "step": 5379 }, { "epoch": 0.1, "learning_rate": 4.933290296763521e-06, "loss": 0.811, "step": 5380 }, { "epoch": 0.1, "learning_rate": 4.933255237362469e-06, "loss": 1.1079, "step": 5381 }, { "epoch": 0.1, "learning_rate": 4.933220168875717e-06, "loss": 0.9221, "step": 5382 }, { "epoch": 0.1, "learning_rate": 4.933185091303394e-06, "loss": 0.7494, "step": 5383 }, { "epoch": 0.1, "learning_rate": 4.933150004645634e-06, "loss": 0.9858, "step": 5384 }, { "epoch": 0.1, "learning_rate": 4.933114908902567e-06, "loss": 1.0439, "step": 5385 }, { "epoch": 0.1, "learning_rate": 4.9330798040743215e-06, "loss": 1.065, "step": 5386 }, { "epoch": 0.1, "learning_rate": 4.933044690161032e-06, "loss": 1.1033, "step": 5387 }, { "epoch": 0.1, "learning_rate": 4.933009567162827e-06, "loss": 1.0143, "step": 5388 }, { "epoch": 0.1, "learning_rate": 4.93297443507984e-06, "loss": 0.8722, "step": 5389 }, { "epoch": 0.1, "learning_rate": 4.932939293912201e-06, "loss": 0.989, "step": 5390 }, { "epoch": 0.1, "learning_rate": 4.932904143660041e-06, "loss": 0.8056, "step": 5391 }, { "epoch": 0.1, "learning_rate": 4.932868984323492e-06, "loss": 1.0558, "step": 5392 }, { "epoch": 0.1, "learning_rate": 4.932833815902684e-06, "loss": 1.0658, "step": 5393 }, { "epoch": 0.1, "learning_rate": 4.93279863839775e-06, "loss": 1.0553, "step": 5394 }, { "epoch": 0.1, "learning_rate": 4.93276345180882e-06, "loss": 1.1459, "step": 5395 }, { "epoch": 0.1, "learning_rate": 4.932728256136026e-06, "loss": 0.8812, "step": 5396 }, { "epoch": 0.1, "learning_rate": 4.932693051379498e-06, "loss": 0.8369, "step": 5397 }, { "epoch": 0.1, "learning_rate": 4.93265783753937e-06, "loss": 1.0032, "step": 5398 }, { "epoch": 0.1, "learning_rate": 4.932622614615773e-06, "loss": 0.9547, "step": 5399 }, { "epoch": 0.1, "learning_rate": 4.9325873826088365e-06, "loss": 1.1021, "step": 5400 }, { "epoch": 0.1, "learning_rate": 4.932552141518693e-06, "loss": 1.101, "step": 5401 }, { "epoch": 0.1, "learning_rate": 4.932516891345476e-06, "loss": 0.8527, "step": 5402 }, { "epoch": 0.1, "learning_rate": 4.932481632089314e-06, "loss": 0.9453, "step": 5403 }, { "epoch": 0.1, "learning_rate": 4.932446363750341e-06, "loss": 0.9592, "step": 5404 }, { "epoch": 0.1, "learning_rate": 4.932411086328687e-06, "loss": 0.9362, "step": 5405 }, { "epoch": 0.1, "learning_rate": 4.9323757998244845e-06, "loss": 1.0035, "step": 5406 }, { "epoch": 0.1, "learning_rate": 4.932340504237867e-06, "loss": 1.0048, "step": 5407 }, { "epoch": 0.1, "learning_rate": 4.932305199568963e-06, "loss": 0.9966, "step": 5408 }, { "epoch": 0.1, "learning_rate": 4.932269885817906e-06, "loss": 0.9128, "step": 5409 }, { "epoch": 0.1, "learning_rate": 4.932234562984829e-06, "loss": 0.9445, "step": 5410 }, { "epoch": 0.1, "learning_rate": 4.932199231069862e-06, "loss": 0.9828, "step": 5411 }, { "epoch": 0.1, "learning_rate": 4.932163890073138e-06, "loss": 1.0319, "step": 5412 }, { "epoch": 0.1, "learning_rate": 4.9321285399947886e-06, "loss": 1.0851, "step": 5413 }, { "epoch": 0.1, "learning_rate": 4.932093180834945e-06, "loss": 0.782, "step": 5414 }, { "epoch": 0.1, "learning_rate": 4.932057812593741e-06, "loss": 0.9879, "step": 5415 }, { "epoch": 0.1, "learning_rate": 4.932022435271307e-06, "loss": 0.759, "step": 5416 }, { "epoch": 0.1, "learning_rate": 4.931987048867776e-06, "loss": 0.9109, "step": 5417 }, { "epoch": 0.1, "learning_rate": 4.93195165338328e-06, "loss": 0.988, "step": 5418 }, { "epoch": 0.1, "learning_rate": 4.9319162488179516e-06, "loss": 0.9878, "step": 5419 }, { "epoch": 0.1, "learning_rate": 4.931880835171922e-06, "loss": 0.8956, "step": 5420 }, { "epoch": 0.1, "learning_rate": 4.931845412445323e-06, "loss": 1.1216, "step": 5421 }, { "epoch": 0.1, "learning_rate": 4.9318099806382894e-06, "loss": 0.9856, "step": 5422 }, { "epoch": 0.1, "learning_rate": 4.931774539750951e-06, "loss": 0.8205, "step": 5423 }, { "epoch": 0.1, "learning_rate": 4.9317390897834415e-06, "loss": 1.0165, "step": 5424 }, { "epoch": 0.1, "learning_rate": 4.9317036307358925e-06, "loss": 0.9534, "step": 5425 }, { "epoch": 0.1, "learning_rate": 4.9316681626084365e-06, "loss": 0.7299, "step": 5426 }, { "epoch": 0.1, "learning_rate": 4.931632685401207e-06, "loss": 0.8951, "step": 5427 }, { "epoch": 0.1, "learning_rate": 4.931597199114334e-06, "loss": 0.8795, "step": 5428 }, { "epoch": 0.1, "learning_rate": 4.931561703747952e-06, "loss": 0.8975, "step": 5429 }, { "epoch": 0.1, "learning_rate": 4.931526199302194e-06, "loss": 0.894, "step": 5430 }, { "epoch": 0.1, "learning_rate": 4.931490685777192e-06, "loss": 1.1392, "step": 5431 }, { "epoch": 0.1, "learning_rate": 4.931455163173078e-06, "loss": 1.1353, "step": 5432 }, { "epoch": 0.1, "learning_rate": 4.9314196314899845e-06, "loss": 0.7807, "step": 5433 }, { "epoch": 0.1, "learning_rate": 4.931384090728045e-06, "loss": 0.8243, "step": 5434 }, { "epoch": 0.1, "learning_rate": 4.9313485408873915e-06, "loss": 1.0158, "step": 5435 }, { "epoch": 0.1, "learning_rate": 4.931312981968157e-06, "loss": 0.8269, "step": 5436 }, { "epoch": 0.1, "learning_rate": 4.931277413970475e-06, "loss": 1.0191, "step": 5437 }, { "epoch": 0.1, "learning_rate": 4.931241836894478e-06, "loss": 0.7592, "step": 5438 }, { "epoch": 0.1, "learning_rate": 4.931206250740297e-06, "loss": 1.0216, "step": 5439 }, { "epoch": 0.1, "learning_rate": 4.931170655508068e-06, "loss": 0.812, "step": 5440 }, { "epoch": 0.1, "learning_rate": 4.931135051197921e-06, "loss": 0.8506, "step": 5441 }, { "epoch": 0.1, "learning_rate": 4.931099437809991e-06, "loss": 0.9025, "step": 5442 }, { "epoch": 0.1, "learning_rate": 4.93106381534441e-06, "loss": 1.3167, "step": 5443 }, { "epoch": 0.1, "learning_rate": 4.931028183801312e-06, "loss": 1.0787, "step": 5444 }, { "epoch": 0.1, "learning_rate": 4.9309925431808284e-06, "loss": 1.097, "step": 5445 }, { "epoch": 0.1, "learning_rate": 4.9309568934830935e-06, "loss": 0.9163, "step": 5446 }, { "epoch": 0.1, "learning_rate": 4.93092123470824e-06, "loss": 0.9449, "step": 5447 }, { "epoch": 0.1, "learning_rate": 4.930885566856401e-06, "loss": 1.0671, "step": 5448 }, { "epoch": 0.1, "learning_rate": 4.93084988992771e-06, "loss": 0.837, "step": 5449 }, { "epoch": 0.1, "learning_rate": 4.9308142039223005e-06, "loss": 1.087, "step": 5450 }, { "epoch": 0.1, "learning_rate": 4.930778508840305e-06, "loss": 1.082, "step": 5451 }, { "epoch": 0.1, "learning_rate": 4.930742804681856e-06, "loss": 0.9144, "step": 5452 }, { "epoch": 0.1, "learning_rate": 4.93070709144709e-06, "loss": 0.8315, "step": 5453 }, { "epoch": 0.1, "learning_rate": 4.930671369136137e-06, "loss": 0.9764, "step": 5454 }, { "epoch": 0.1, "learning_rate": 4.9306356377491315e-06, "loss": 1.1655, "step": 5455 }, { "epoch": 0.1, "learning_rate": 4.930599897286207e-06, "loss": 0.9949, "step": 5456 }, { "epoch": 0.1, "learning_rate": 4.930564147747498e-06, "loss": 0.9021, "step": 5457 }, { "epoch": 0.1, "learning_rate": 4.930528389133136e-06, "loss": 0.7757, "step": 5458 }, { "epoch": 0.1, "learning_rate": 4.930492621443256e-06, "loss": 0.7612, "step": 5459 }, { "epoch": 0.1, "learning_rate": 4.93045684467799e-06, "loss": 0.9466, "step": 5460 }, { "epoch": 0.1, "learning_rate": 4.9304210588374735e-06, "loss": 0.9562, "step": 5461 }, { "epoch": 0.1, "learning_rate": 4.930385263921839e-06, "loss": 1.3502, "step": 5462 }, { "epoch": 0.1, "learning_rate": 4.930349459931221e-06, "loss": 0.9879, "step": 5463 }, { "epoch": 0.1, "learning_rate": 4.930313646865752e-06, "loss": 0.8667, "step": 5464 }, { "epoch": 0.1, "learning_rate": 4.930277824725568e-06, "loss": 0.938, "step": 5465 }, { "epoch": 0.1, "learning_rate": 4.930241993510799e-06, "loss": 1.0134, "step": 5466 }, { "epoch": 0.1, "learning_rate": 4.930206153221582e-06, "loss": 0.947, "step": 5467 }, { "epoch": 0.1, "learning_rate": 4.93017030385805e-06, "loss": 1.0803, "step": 5468 }, { "epoch": 0.1, "learning_rate": 4.930134445420336e-06, "loss": 1.107, "step": 5469 }, { "epoch": 0.1, "learning_rate": 4.930098577908574e-06, "loss": 0.9423, "step": 5470 }, { "epoch": 0.1, "learning_rate": 4.930062701322899e-06, "loss": 0.9303, "step": 5471 }, { "epoch": 0.1, "learning_rate": 4.930026815663444e-06, "loss": 0.785, "step": 5472 }, { "epoch": 0.1, "learning_rate": 4.929990920930344e-06, "loss": 0.991, "step": 5473 }, { "epoch": 0.1, "learning_rate": 4.929955017123732e-06, "loss": 1.0097, "step": 5474 }, { "epoch": 0.1, "learning_rate": 4.929919104243743e-06, "loss": 1.0686, "step": 5475 }, { "epoch": 0.1, "learning_rate": 4.9298831822905105e-06, "loss": 0.9453, "step": 5476 }, { "epoch": 0.1, "learning_rate": 4.929847251264169e-06, "loss": 0.9548, "step": 5477 }, { "epoch": 0.1, "learning_rate": 4.929811311164851e-06, "loss": 1.0129, "step": 5478 }, { "epoch": 0.1, "learning_rate": 4.929775361992693e-06, "loss": 0.9088, "step": 5479 }, { "epoch": 0.1, "learning_rate": 4.929739403747827e-06, "loss": 0.9644, "step": 5480 }, { "epoch": 0.1, "learning_rate": 4.929703436430391e-06, "loss": 1.2236, "step": 5481 }, { "epoch": 0.1, "learning_rate": 4.929667460040515e-06, "loss": 0.8851, "step": 5482 }, { "epoch": 0.1, "learning_rate": 4.929631474578336e-06, "loss": 0.7275, "step": 5483 }, { "epoch": 0.1, "learning_rate": 4.929595480043987e-06, "loss": 0.9203, "step": 5484 }, { "epoch": 0.1, "learning_rate": 4.929559476437603e-06, "loss": 0.845, "step": 5485 }, { "epoch": 0.1, "learning_rate": 4.929523463759319e-06, "loss": 1.0911, "step": 5486 }, { "epoch": 0.1, "learning_rate": 4.929487442009269e-06, "loss": 1.0107, "step": 5487 }, { "epoch": 0.1, "learning_rate": 4.9294514111875865e-06, "loss": 1.0743, "step": 5488 }, { "epoch": 0.1, "learning_rate": 4.929415371294407e-06, "loss": 0.999, "step": 5489 }, { "epoch": 0.1, "learning_rate": 4.929379322329866e-06, "loss": 0.881, "step": 5490 }, { "epoch": 0.1, "learning_rate": 4.929343264294096e-06, "loss": 0.8707, "step": 5491 }, { "epoch": 0.1, "learning_rate": 4.929307197187233e-06, "loss": 0.9882, "step": 5492 }, { "epoch": 0.1, "learning_rate": 4.929271121009412e-06, "loss": 1.1297, "step": 5493 }, { "epoch": 0.1, "learning_rate": 4.929235035760766e-06, "loss": 1.1084, "step": 5494 }, { "epoch": 0.1, "learning_rate": 4.9291989414414325e-06, "loss": 1.02, "step": 5495 }, { "epoch": 0.1, "learning_rate": 4.929162838051544e-06, "loss": 1.0894, "step": 5496 }, { "epoch": 0.1, "learning_rate": 4.929126725591236e-06, "loss": 0.9509, "step": 5497 }, { "epoch": 0.1, "learning_rate": 4.929090604060643e-06, "loss": 1.0175, "step": 5498 }, { "epoch": 0.1, "learning_rate": 4.929054473459899e-06, "loss": 1.1154, "step": 5499 }, { "epoch": 0.1, "learning_rate": 4.929018333789142e-06, "loss": 1.0709, "step": 5500 }, { "epoch": 0.1, "learning_rate": 4.9289821850485034e-06, "loss": 0.9907, "step": 5501 }, { "epoch": 0.1, "learning_rate": 4.928946027238121e-06, "loss": 0.9348, "step": 5502 }, { "epoch": 0.1, "learning_rate": 4.928909860358128e-06, "loss": 1.0698, "step": 5503 }, { "epoch": 0.1, "learning_rate": 4.9288736844086606e-06, "loss": 0.9178, "step": 5504 }, { "epoch": 0.1, "learning_rate": 4.928837499389853e-06, "loss": 0.8443, "step": 5505 }, { "epoch": 0.1, "learning_rate": 4.92880130530184e-06, "loss": 1.0775, "step": 5506 }, { "epoch": 0.1, "learning_rate": 4.928765102144759e-06, "loss": 1.0121, "step": 5507 }, { "epoch": 0.1, "learning_rate": 4.928728889918743e-06, "loss": 0.8026, "step": 5508 }, { "epoch": 0.1, "learning_rate": 4.928692668623927e-06, "loss": 0.8362, "step": 5509 }, { "epoch": 0.1, "learning_rate": 4.928656438260447e-06, "loss": 0.8742, "step": 5510 }, { "epoch": 0.1, "learning_rate": 4.928620198828438e-06, "loss": 1.0135, "step": 5511 }, { "epoch": 0.1, "learning_rate": 4.928583950328037e-06, "loss": 1.0466, "step": 5512 }, { "epoch": 0.1, "learning_rate": 4.928547692759378e-06, "loss": 1.0742, "step": 5513 }, { "epoch": 0.1, "learning_rate": 4.928511426122595e-06, "loss": 0.9876, "step": 5514 }, { "epoch": 0.1, "learning_rate": 4.9284751504178254e-06, "loss": 0.8402, "step": 5515 }, { "epoch": 0.1, "learning_rate": 4.9284388656452044e-06, "loss": 1.006, "step": 5516 }, { "epoch": 0.1, "learning_rate": 4.928402571804867e-06, "loss": 0.9606, "step": 5517 }, { "epoch": 0.1, "learning_rate": 4.928366268896949e-06, "loss": 1.0546, "step": 5518 }, { "epoch": 0.1, "learning_rate": 4.928329956921586e-06, "loss": 1.0209, "step": 5519 }, { "epoch": 0.1, "learning_rate": 4.9282936358789125e-06, "loss": 0.8235, "step": 5520 }, { "epoch": 0.1, "learning_rate": 4.928257305769066e-06, "loss": 0.7812, "step": 5521 }, { "epoch": 0.1, "learning_rate": 4.928220966592181e-06, "loss": 0.9052, "step": 5522 }, { "epoch": 0.1, "learning_rate": 4.928184618348392e-06, "loss": 0.76, "step": 5523 }, { "epoch": 0.1, "learning_rate": 4.928148261037837e-06, "loss": 1.1205, "step": 5524 }, { "epoch": 0.1, "learning_rate": 4.9281118946606514e-06, "loss": 1.3457, "step": 5525 }, { "epoch": 0.1, "learning_rate": 4.92807551921697e-06, "loss": 1.0462, "step": 5526 }, { "epoch": 0.1, "learning_rate": 4.9280391347069286e-06, "loss": 0.918, "step": 5527 }, { "epoch": 0.1, "learning_rate": 4.928002741130664e-06, "loss": 0.8196, "step": 5528 }, { "epoch": 0.1, "learning_rate": 4.9279663384883125e-06, "loss": 0.8754, "step": 5529 }, { "epoch": 0.1, "learning_rate": 4.927929926780008e-06, "loss": 0.9443, "step": 5530 }, { "epoch": 0.1, "learning_rate": 4.9278935060058875e-06, "loss": 1.4099, "step": 5531 }, { "epoch": 0.1, "learning_rate": 4.9278570761660875e-06, "loss": 0.9545, "step": 5532 }, { "epoch": 0.1, "learning_rate": 4.927820637260744e-06, "loss": 1.0833, "step": 5533 }, { "epoch": 0.1, "learning_rate": 4.927784189289992e-06, "loss": 0.782, "step": 5534 }, { "epoch": 0.1, "learning_rate": 4.927747732253968e-06, "loss": 0.9731, "step": 5535 }, { "epoch": 0.1, "learning_rate": 4.927711266152809e-06, "loss": 0.8736, "step": 5536 }, { "epoch": 0.1, "learning_rate": 4.927674790986651e-06, "loss": 1.1372, "step": 5537 }, { "epoch": 0.1, "learning_rate": 4.927638306755629e-06, "loss": 1.1194, "step": 5538 }, { "epoch": 0.1, "learning_rate": 4.92760181345988e-06, "loss": 0.8691, "step": 5539 }, { "epoch": 0.1, "learning_rate": 4.92756531109954e-06, "loss": 0.9234, "step": 5540 }, { "epoch": 0.1, "learning_rate": 4.927528799674747e-06, "loss": 0.7435, "step": 5541 }, { "epoch": 0.1, "learning_rate": 4.927492279185634e-06, "loss": 0.8357, "step": 5542 }, { "epoch": 0.1, "learning_rate": 4.927455749632341e-06, "loss": 1.1033, "step": 5543 }, { "epoch": 0.1, "learning_rate": 4.927419211015002e-06, "loss": 1.1127, "step": 5544 }, { "epoch": 0.1, "learning_rate": 4.927382663333754e-06, "loss": 0.8212, "step": 5545 }, { "epoch": 0.1, "learning_rate": 4.927346106588733e-06, "loss": 0.8996, "step": 5546 }, { "epoch": 0.1, "learning_rate": 4.927309540780076e-06, "loss": 0.9993, "step": 5547 }, { "epoch": 0.1, "learning_rate": 4.927272965907921e-06, "loss": 0.8763, "step": 5548 }, { "epoch": 0.1, "learning_rate": 4.927236381972402e-06, "loss": 0.9743, "step": 5549 }, { "epoch": 0.1, "learning_rate": 4.9271997889736564e-06, "loss": 1.0559, "step": 5550 }, { "epoch": 0.1, "learning_rate": 4.927163186911823e-06, "loss": 1.0116, "step": 5551 }, { "epoch": 0.1, "learning_rate": 4.927126575787035e-06, "loss": 0.8788, "step": 5552 }, { "epoch": 0.1, "learning_rate": 4.9270899555994316e-06, "loss": 0.9066, "step": 5553 }, { "epoch": 0.1, "learning_rate": 4.927053326349148e-06, "loss": 0.9528, "step": 5554 }, { "epoch": 0.1, "learning_rate": 4.9270166880363224e-06, "loss": 0.9808, "step": 5555 }, { "epoch": 0.1, "learning_rate": 4.9269800406610915e-06, "loss": 1.2108, "step": 5556 }, { "epoch": 0.1, "learning_rate": 4.9269433842235905e-06, "loss": 1.0415, "step": 5557 }, { "epoch": 0.1, "learning_rate": 4.926906718723958e-06, "loss": 0.9336, "step": 5558 }, { "epoch": 0.1, "learning_rate": 4.926870044162328e-06, "loss": 1.0547, "step": 5559 }, { "epoch": 0.1, "learning_rate": 4.9268333605388424e-06, "loss": 0.8636, "step": 5560 }, { "epoch": 0.1, "learning_rate": 4.926796667853635e-06, "loss": 0.7777, "step": 5561 }, { "epoch": 0.1, "learning_rate": 4.926759966106842e-06, "loss": 1.11, "step": 5562 }, { "epoch": 0.1, "learning_rate": 4.926723255298602e-06, "loss": 0.7108, "step": 5563 }, { "epoch": 0.1, "learning_rate": 4.926686535429052e-06, "loss": 0.827, "step": 5564 }, { "epoch": 0.1, "learning_rate": 4.92664980649833e-06, "loss": 0.7674, "step": 5565 }, { "epoch": 0.11, "learning_rate": 4.9266130685065705e-06, "loss": 0.758, "step": 5566 }, { "epoch": 0.11, "learning_rate": 4.9265763214539135e-06, "loss": 0.8946, "step": 5567 }, { "epoch": 0.11, "learning_rate": 4.926539565340493e-06, "loss": 1.0598, "step": 5568 }, { "epoch": 0.11, "learning_rate": 4.926502800166451e-06, "loss": 1.2158, "step": 5569 }, { "epoch": 0.11, "learning_rate": 4.926466025931919e-06, "loss": 0.98, "step": 5570 }, { "epoch": 0.11, "learning_rate": 4.926429242637039e-06, "loss": 0.6562, "step": 5571 }, { "epoch": 0.11, "learning_rate": 4.926392450281946e-06, "loss": 1.0187, "step": 5572 }, { "epoch": 0.11, "learning_rate": 4.926355648866778e-06, "loss": 0.8448, "step": 5573 }, { "epoch": 0.11, "learning_rate": 4.926318838391673e-06, "loss": 1.0436, "step": 5574 }, { "epoch": 0.11, "learning_rate": 4.926282018856767e-06, "loss": 1.1573, "step": 5575 }, { "epoch": 0.11, "learning_rate": 4.926245190262199e-06, "loss": 1.0736, "step": 5576 }, { "epoch": 0.11, "learning_rate": 4.9262083526081055e-06, "loss": 0.907, "step": 5577 }, { "epoch": 0.11, "learning_rate": 4.926171505894625e-06, "loss": 0.9554, "step": 5578 }, { "epoch": 0.11, "learning_rate": 4.926134650121893e-06, "loss": 0.9556, "step": 5579 }, { "epoch": 0.11, "learning_rate": 4.92609778529005e-06, "loss": 0.8785, "step": 5580 }, { "epoch": 0.11, "learning_rate": 4.9260609113992315e-06, "loss": 1.0577, "step": 5581 }, { "epoch": 0.11, "learning_rate": 4.9260240284495766e-06, "loss": 0.8562, "step": 5582 }, { "epoch": 0.11, "learning_rate": 4.925987136441222e-06, "loss": 0.7773, "step": 5583 }, { "epoch": 0.11, "learning_rate": 4.925950235374306e-06, "loss": 0.7831, "step": 5584 }, { "epoch": 0.11, "learning_rate": 4.925913325248966e-06, "loss": 0.9221, "step": 5585 }, { "epoch": 0.11, "learning_rate": 4.92587640606534e-06, "loss": 0.9572, "step": 5586 }, { "epoch": 0.11, "learning_rate": 4.925839477823566e-06, "loss": 1.1479, "step": 5587 }, { "epoch": 0.11, "learning_rate": 4.925802540523782e-06, "loss": 1.0967, "step": 5588 }, { "epoch": 0.11, "learning_rate": 4.925765594166125e-06, "loss": 1.0128, "step": 5589 }, { "epoch": 0.11, "learning_rate": 4.925728638750734e-06, "loss": 0.9783, "step": 5590 }, { "epoch": 0.11, "learning_rate": 4.925691674277747e-06, "loss": 1.1041, "step": 5591 }, { "epoch": 0.11, "learning_rate": 4.925654700747301e-06, "loss": 0.9611, "step": 5592 }, { "epoch": 0.11, "learning_rate": 4.925617718159535e-06, "loss": 1.0472, "step": 5593 }, { "epoch": 0.11, "learning_rate": 4.925580726514587e-06, "loss": 1.0993, "step": 5594 }, { "epoch": 0.11, "learning_rate": 4.925543725812595e-06, "loss": 0.9883, "step": 5595 }, { "epoch": 0.11, "learning_rate": 4.9255067160536976e-06, "loss": 0.9113, "step": 5596 }, { "epoch": 0.11, "learning_rate": 4.925469697238031e-06, "loss": 1.1036, "step": 5597 }, { "epoch": 0.11, "learning_rate": 4.925432669365736e-06, "loss": 0.9418, "step": 5598 }, { "epoch": 0.11, "learning_rate": 4.925395632436949e-06, "loss": 1.0499, "step": 5599 }, { "epoch": 0.11, "learning_rate": 4.92535858645181e-06, "loss": 1.0164, "step": 5600 }, { "epoch": 0.11, "learning_rate": 4.9253215314104564e-06, "loss": 0.9188, "step": 5601 }, { "epoch": 0.11, "learning_rate": 4.925284467313026e-06, "loss": 1.0266, "step": 5602 }, { "epoch": 0.11, "learning_rate": 4.925247394159658e-06, "loss": 1.0203, "step": 5603 }, { "epoch": 0.11, "learning_rate": 4.92521031195049e-06, "loss": 0.8481, "step": 5604 }, { "epoch": 0.11, "learning_rate": 4.925173220685662e-06, "loss": 0.8804, "step": 5605 }, { "epoch": 0.11, "learning_rate": 4.925136120365311e-06, "loss": 1.1573, "step": 5606 }, { "epoch": 0.11, "learning_rate": 4.925099010989576e-06, "loss": 0.8051, "step": 5607 }, { "epoch": 0.11, "learning_rate": 4.925061892558596e-06, "loss": 0.9268, "step": 5608 }, { "epoch": 0.11, "learning_rate": 4.925024765072509e-06, "loss": 1.0394, "step": 5609 }, { "epoch": 0.11, "learning_rate": 4.924987628531454e-06, "loss": 1.1907, "step": 5610 }, { "epoch": 0.11, "learning_rate": 4.924950482935569e-06, "loss": 0.9203, "step": 5611 }, { "epoch": 0.11, "learning_rate": 4.924913328284994e-06, "loss": 1.1362, "step": 5612 }, { "epoch": 0.11, "learning_rate": 4.924876164579867e-06, "loss": 1.1774, "step": 5613 }, { "epoch": 0.11, "learning_rate": 4.924838991820326e-06, "loss": 0.9643, "step": 5614 }, { "epoch": 0.11, "learning_rate": 4.9248018100065106e-06, "loss": 0.7883, "step": 5615 }, { "epoch": 0.11, "learning_rate": 4.9247646191385605e-06, "loss": 0.9293, "step": 5616 }, { "epoch": 0.11, "learning_rate": 4.9247274192166135e-06, "loss": 1.0062, "step": 5617 }, { "epoch": 0.11, "learning_rate": 4.924690210240808e-06, "loss": 1.1336, "step": 5618 }, { "epoch": 0.11, "learning_rate": 4.924652992211284e-06, "loss": 1.2736, "step": 5619 }, { "epoch": 0.11, "learning_rate": 4.92461576512818e-06, "loss": 0.9691, "step": 5620 }, { "epoch": 0.11, "learning_rate": 4.924578528991635e-06, "loss": 0.8665, "step": 5621 }, { "epoch": 0.11, "learning_rate": 4.924541283801788e-06, "loss": 0.9941, "step": 5622 }, { "epoch": 0.11, "learning_rate": 4.9245040295587785e-06, "loss": 1.0804, "step": 5623 }, { "epoch": 0.11, "learning_rate": 4.924466766262745e-06, "loss": 0.972, "step": 5624 }, { "epoch": 0.11, "learning_rate": 4.924429493913827e-06, "loss": 1.3009, "step": 5625 }, { "epoch": 0.11, "learning_rate": 4.924392212512164e-06, "loss": 0.6278, "step": 5626 }, { "epoch": 0.11, "learning_rate": 4.924354922057894e-06, "loss": 1.0281, "step": 5627 }, { "epoch": 0.11, "learning_rate": 4.924317622551158e-06, "loss": 1.0347, "step": 5628 }, { "epoch": 0.11, "learning_rate": 4.924280313992094e-06, "loss": 0.8883, "step": 5629 }, { "epoch": 0.11, "learning_rate": 4.924242996380842e-06, "loss": 0.9101, "step": 5630 }, { "epoch": 0.11, "learning_rate": 4.92420566971754e-06, "loss": 1.0319, "step": 5631 }, { "epoch": 0.11, "learning_rate": 4.924168334002329e-06, "loss": 0.9564, "step": 5632 }, { "epoch": 0.11, "learning_rate": 4.924130989235348e-06, "loss": 0.7497, "step": 5633 }, { "epoch": 0.11, "learning_rate": 4.924093635416736e-06, "loss": 1.0906, "step": 5634 }, { "epoch": 0.11, "learning_rate": 4.9240562725466325e-06, "loss": 0.9752, "step": 5635 }, { "epoch": 0.11, "learning_rate": 4.924018900625177e-06, "loss": 1.1309, "step": 5636 }, { "epoch": 0.11, "learning_rate": 4.9239815196525095e-06, "loss": 1.0454, "step": 5637 }, { "epoch": 0.11, "learning_rate": 4.923944129628769e-06, "loss": 1.2512, "step": 5638 }, { "epoch": 0.11, "learning_rate": 4.923906730554096e-06, "loss": 1.0221, "step": 5639 }, { "epoch": 0.11, "learning_rate": 4.923869322428629e-06, "loss": 1.0443, "step": 5640 }, { "epoch": 0.11, "learning_rate": 4.923831905252508e-06, "loss": 1.0241, "step": 5641 }, { "epoch": 0.11, "learning_rate": 4.9237944790258745e-06, "loss": 0.8776, "step": 5642 }, { "epoch": 0.11, "learning_rate": 4.9237570437488655e-06, "loss": 1.2289, "step": 5643 }, { "epoch": 0.11, "learning_rate": 4.923719599421622e-06, "loss": 0.9567, "step": 5644 }, { "epoch": 0.11, "learning_rate": 4.923682146044285e-06, "loss": 1.0039, "step": 5645 }, { "epoch": 0.11, "learning_rate": 4.9236446836169925e-06, "loss": 0.9136, "step": 5646 }, { "epoch": 0.11, "learning_rate": 4.923607212139885e-06, "loss": 1.0472, "step": 5647 }, { "epoch": 0.11, "learning_rate": 4.923569731613102e-06, "loss": 0.8416, "step": 5648 }, { "epoch": 0.11, "learning_rate": 4.923532242036784e-06, "loss": 1.1492, "step": 5649 }, { "epoch": 0.11, "learning_rate": 4.9234947434110715e-06, "loss": 1.0305, "step": 5650 }, { "epoch": 0.11, "learning_rate": 4.923457235736103e-06, "loss": 0.9847, "step": 5651 }, { "epoch": 0.11, "learning_rate": 4.9234197190120205e-06, "loss": 0.8312, "step": 5652 }, { "epoch": 0.11, "learning_rate": 4.923382193238963e-06, "loss": 0.9234, "step": 5653 }, { "epoch": 0.11, "learning_rate": 4.9233446584170705e-06, "loss": 0.824, "step": 5654 }, { "epoch": 0.11, "learning_rate": 4.923307114546483e-06, "loss": 0.9517, "step": 5655 }, { "epoch": 0.11, "learning_rate": 4.923269561627342e-06, "loss": 1.1391, "step": 5656 }, { "epoch": 0.11, "learning_rate": 4.923231999659786e-06, "loss": 0.7395, "step": 5657 }, { "epoch": 0.11, "learning_rate": 4.923194428643956e-06, "loss": 0.9274, "step": 5658 }, { "epoch": 0.11, "learning_rate": 4.923156848579992e-06, "loss": 1.0266, "step": 5659 }, { "epoch": 0.11, "learning_rate": 4.923119259468035e-06, "loss": 0.8885, "step": 5660 }, { "epoch": 0.11, "learning_rate": 4.923081661308225e-06, "loss": 0.9572, "step": 5661 }, { "epoch": 0.11, "learning_rate": 4.923044054100702e-06, "loss": 1.2967, "step": 5662 }, { "epoch": 0.11, "learning_rate": 4.923006437845608e-06, "loss": 0.902, "step": 5663 }, { "epoch": 0.11, "learning_rate": 4.922968812543081e-06, "loss": 0.8782, "step": 5664 }, { "epoch": 0.11, "learning_rate": 4.922931178193263e-06, "loss": 1.0998, "step": 5665 }, { "epoch": 0.11, "learning_rate": 4.922893534796294e-06, "loss": 0.949, "step": 5666 }, { "epoch": 0.11, "learning_rate": 4.9228558823523155e-06, "loss": 0.874, "step": 5667 }, { "epoch": 0.11, "learning_rate": 4.922818220861467e-06, "loss": 0.9076, "step": 5668 }, { "epoch": 0.11, "learning_rate": 4.92278055032389e-06, "loss": 0.8768, "step": 5669 }, { "epoch": 0.11, "learning_rate": 4.922742870739724e-06, "loss": 0.9682, "step": 5670 }, { "epoch": 0.11, "learning_rate": 4.922705182109111e-06, "loss": 0.9794, "step": 5671 }, { "epoch": 0.11, "learning_rate": 4.922667484432191e-06, "loss": 0.8174, "step": 5672 }, { "epoch": 0.11, "learning_rate": 4.922629777709105e-06, "loss": 0.7983, "step": 5673 }, { "epoch": 0.11, "learning_rate": 4.922592061939994e-06, "loss": 1.0773, "step": 5674 }, { "epoch": 0.11, "learning_rate": 4.9225543371249974e-06, "loss": 1.2881, "step": 5675 }, { "epoch": 0.11, "learning_rate": 4.922516603264258e-06, "loss": 0.9773, "step": 5676 }, { "epoch": 0.11, "learning_rate": 4.922478860357915e-06, "loss": 0.9368, "step": 5677 }, { "epoch": 0.11, "learning_rate": 4.922441108406111e-06, "loss": 0.7958, "step": 5678 }, { "epoch": 0.11, "learning_rate": 4.922403347408986e-06, "loss": 0.888, "step": 5679 }, { "epoch": 0.11, "learning_rate": 4.922365577366682e-06, "loss": 1.1034, "step": 5680 }, { "epoch": 0.11, "learning_rate": 4.9223277982793385e-06, "loss": 1.0168, "step": 5681 }, { "epoch": 0.11, "learning_rate": 4.922290010147097e-06, "loss": 1.0412, "step": 5682 }, { "epoch": 0.11, "learning_rate": 4.9222522129700985e-06, "loss": 0.8447, "step": 5683 }, { "epoch": 0.11, "learning_rate": 4.922214406748486e-06, "loss": 0.954, "step": 5684 }, { "epoch": 0.11, "learning_rate": 4.922176591482398e-06, "loss": 0.8008, "step": 5685 }, { "epoch": 0.11, "learning_rate": 4.922138767171977e-06, "loss": 0.954, "step": 5686 }, { "epoch": 0.11, "learning_rate": 4.9221009338173645e-06, "loss": 1.222, "step": 5687 }, { "epoch": 0.11, "learning_rate": 4.922063091418701e-06, "loss": 1.206, "step": 5688 }, { "epoch": 0.11, "learning_rate": 4.922025239976128e-06, "loss": 0.9829, "step": 5689 }, { "epoch": 0.11, "learning_rate": 4.921987379489788e-06, "loss": 0.9292, "step": 5690 }, { "epoch": 0.11, "learning_rate": 4.921949509959821e-06, "loss": 0.9177, "step": 5691 }, { "epoch": 0.11, "learning_rate": 4.921911631386368e-06, "loss": 1.0469, "step": 5692 }, { "epoch": 0.11, "learning_rate": 4.921873743769572e-06, "loss": 0.9407, "step": 5693 }, { "epoch": 0.11, "learning_rate": 4.921835847109573e-06, "loss": 1.1159, "step": 5694 }, { "epoch": 0.11, "learning_rate": 4.921797941406514e-06, "loss": 0.908, "step": 5695 }, { "epoch": 0.11, "learning_rate": 4.921760026660535e-06, "loss": 0.8438, "step": 5696 }, { "epoch": 0.11, "learning_rate": 4.921722102871779e-06, "loss": 0.9233, "step": 5697 }, { "epoch": 0.11, "learning_rate": 4.921684170040386e-06, "loss": 0.9598, "step": 5698 }, { "epoch": 0.11, "learning_rate": 4.9216462281664996e-06, "loss": 0.979, "step": 5699 }, { "epoch": 0.11, "learning_rate": 4.92160827725026e-06, "loss": 1.069, "step": 5700 }, { "epoch": 0.11, "learning_rate": 4.92157031729181e-06, "loss": 1.0629, "step": 5701 }, { "epoch": 0.11, "learning_rate": 4.921532348291289e-06, "loss": 0.8512, "step": 5702 }, { "epoch": 0.11, "learning_rate": 4.921494370248841e-06, "loss": 0.6901, "step": 5703 }, { "epoch": 0.11, "learning_rate": 4.921456383164608e-06, "loss": 0.8907, "step": 5704 }, { "epoch": 0.11, "learning_rate": 4.921418387038731e-06, "loss": 1.0831, "step": 5705 }, { "epoch": 0.11, "learning_rate": 4.921380381871352e-06, "loss": 1.0683, "step": 5706 }, { "epoch": 0.11, "learning_rate": 4.9213423676626125e-06, "loss": 1.0135, "step": 5707 }, { "epoch": 0.11, "learning_rate": 4.921304344412655e-06, "loss": 0.7521, "step": 5708 }, { "epoch": 0.11, "learning_rate": 4.921266312121622e-06, "loss": 0.8077, "step": 5709 }, { "epoch": 0.11, "learning_rate": 4.921228270789654e-06, "loss": 0.9913, "step": 5710 }, { "epoch": 0.11, "learning_rate": 4.921190220416894e-06, "loss": 0.9922, "step": 5711 }, { "epoch": 0.11, "learning_rate": 4.921152161003484e-06, "loss": 1.3838, "step": 5712 }, { "epoch": 0.11, "learning_rate": 4.921114092549566e-06, "loss": 0.8387, "step": 5713 }, { "epoch": 0.11, "learning_rate": 4.9210760150552826e-06, "loss": 0.8181, "step": 5714 }, { "epoch": 0.11, "learning_rate": 4.921037928520776e-06, "loss": 1.0272, "step": 5715 }, { "epoch": 0.11, "learning_rate": 4.920999832946187e-06, "loss": 0.9911, "step": 5716 }, { "epoch": 0.11, "learning_rate": 4.920961728331659e-06, "loss": 0.8557, "step": 5717 }, { "epoch": 0.11, "learning_rate": 4.920923614677334e-06, "loss": 1.1644, "step": 5718 }, { "epoch": 0.11, "learning_rate": 4.920885491983355e-06, "loss": 1.2253, "step": 5719 }, { "epoch": 0.11, "learning_rate": 4.920847360249863e-06, "loss": 0.7787, "step": 5720 }, { "epoch": 0.11, "learning_rate": 4.920809219477002e-06, "loss": 0.7536, "step": 5721 }, { "epoch": 0.11, "learning_rate": 4.920771069664914e-06, "loss": 0.9524, "step": 5722 }, { "epoch": 0.11, "learning_rate": 4.92073291081374e-06, "loss": 0.8177, "step": 5723 }, { "epoch": 0.11, "learning_rate": 4.920694742923624e-06, "loss": 0.8063, "step": 5724 }, { "epoch": 0.11, "learning_rate": 4.920656565994707e-06, "loss": 1.1885, "step": 5725 }, { "epoch": 0.11, "learning_rate": 4.920618380027135e-06, "loss": 1.0303, "step": 5726 }, { "epoch": 0.11, "learning_rate": 4.920580185021046e-06, "loss": 0.8708, "step": 5727 }, { "epoch": 0.11, "learning_rate": 4.920541980976585e-06, "loss": 0.8956, "step": 5728 }, { "epoch": 0.11, "learning_rate": 4.920503767893895e-06, "loss": 0.8473, "step": 5729 }, { "epoch": 0.11, "learning_rate": 4.920465545773119e-06, "loss": 0.9517, "step": 5730 }, { "epoch": 0.11, "learning_rate": 4.920427314614398e-06, "loss": 0.9959, "step": 5731 }, { "epoch": 0.11, "learning_rate": 4.920389074417875e-06, "loss": 1.0494, "step": 5732 }, { "epoch": 0.11, "learning_rate": 4.920350825183694e-06, "loss": 0.8773, "step": 5733 }, { "epoch": 0.11, "learning_rate": 4.920312566911998e-06, "loss": 0.9794, "step": 5734 }, { "epoch": 0.11, "learning_rate": 4.920274299602928e-06, "loss": 0.8257, "step": 5735 }, { "epoch": 0.11, "learning_rate": 4.920236023256628e-06, "loss": 0.8149, "step": 5736 }, { "epoch": 0.11, "learning_rate": 4.9201977378732415e-06, "loss": 1.0739, "step": 5737 }, { "epoch": 0.11, "learning_rate": 4.920159443452911e-06, "loss": 1.0299, "step": 5738 }, { "epoch": 0.11, "learning_rate": 4.920121139995778e-06, "loss": 0.9995, "step": 5739 }, { "epoch": 0.11, "learning_rate": 4.920082827501988e-06, "loss": 0.9334, "step": 5740 }, { "epoch": 0.11, "learning_rate": 4.920044505971683e-06, "loss": 1.0626, "step": 5741 }, { "epoch": 0.11, "learning_rate": 4.920006175405006e-06, "loss": 0.9709, "step": 5742 }, { "epoch": 0.11, "learning_rate": 4.919967835802099e-06, "loss": 0.8998, "step": 5743 }, { "epoch": 0.11, "learning_rate": 4.919929487163107e-06, "loss": 1.275, "step": 5744 }, { "epoch": 0.11, "learning_rate": 4.9198911294881735e-06, "loss": 0.7735, "step": 5745 }, { "epoch": 0.11, "learning_rate": 4.9198527627774395e-06, "loss": 0.8787, "step": 5746 }, { "epoch": 0.11, "learning_rate": 4.91981438703105e-06, "loss": 1.007, "step": 5747 }, { "epoch": 0.11, "learning_rate": 4.919776002249148e-06, "loss": 0.9382, "step": 5748 }, { "epoch": 0.11, "learning_rate": 4.9197376084318756e-06, "loss": 1.1186, "step": 5749 }, { "epoch": 0.11, "learning_rate": 4.919699205579378e-06, "loss": 1.1354, "step": 5750 }, { "epoch": 0.11, "learning_rate": 4.919660793691798e-06, "loss": 0.8947, "step": 5751 }, { "epoch": 0.11, "learning_rate": 4.9196223727692784e-06, "loss": 0.8039, "step": 5752 }, { "epoch": 0.11, "learning_rate": 4.919583942811963e-06, "loss": 0.9606, "step": 5753 }, { "epoch": 0.11, "learning_rate": 4.919545503819995e-06, "loss": 0.9877, "step": 5754 }, { "epoch": 0.11, "learning_rate": 4.919507055793519e-06, "loss": 1.0254, "step": 5755 }, { "epoch": 0.11, "learning_rate": 4.9194685987326775e-06, "loss": 1.3348, "step": 5756 }, { "epoch": 0.11, "learning_rate": 4.919430132637614e-06, "loss": 1.0919, "step": 5757 }, { "epoch": 0.11, "learning_rate": 4.9193916575084734e-06, "loss": 0.9378, "step": 5758 }, { "epoch": 0.11, "learning_rate": 4.919353173345397e-06, "loss": 0.8368, "step": 5759 }, { "epoch": 0.11, "learning_rate": 4.919314680148532e-06, "loss": 0.9194, "step": 5760 }, { "epoch": 0.11, "learning_rate": 4.9192761779180185e-06, "loss": 1.0519, "step": 5761 }, { "epoch": 0.11, "learning_rate": 4.919237666654003e-06, "loss": 1.2164, "step": 5762 }, { "epoch": 0.11, "learning_rate": 4.919199146356628e-06, "loss": 0.9479, "step": 5763 }, { "epoch": 0.11, "learning_rate": 4.919160617026038e-06, "loss": 0.97, "step": 5764 }, { "epoch": 0.11, "learning_rate": 4.919122078662375e-06, "loss": 0.8441, "step": 5765 }, { "epoch": 0.11, "learning_rate": 4.919083531265786e-06, "loss": 1.0889, "step": 5766 }, { "epoch": 0.11, "learning_rate": 4.9190449748364126e-06, "loss": 0.8361, "step": 5767 }, { "epoch": 0.11, "learning_rate": 4.919006409374399e-06, "loss": 1.0864, "step": 5768 }, { "epoch": 0.11, "learning_rate": 4.91896783487989e-06, "loss": 0.9501, "step": 5769 }, { "epoch": 0.11, "learning_rate": 4.918929251353029e-06, "loss": 1.0268, "step": 5770 }, { "epoch": 0.11, "learning_rate": 4.918890658793961e-06, "loss": 0.943, "step": 5771 }, { "epoch": 0.11, "learning_rate": 4.9188520572028285e-06, "loss": 0.8667, "step": 5772 }, { "epoch": 0.11, "learning_rate": 4.918813446579777e-06, "loss": 1.0799, "step": 5773 }, { "epoch": 0.11, "learning_rate": 4.91877482692495e-06, "loss": 1.2031, "step": 5774 }, { "epoch": 0.11, "learning_rate": 4.9187361982384925e-06, "loss": 1.1797, "step": 5775 }, { "epoch": 0.11, "learning_rate": 4.918697560520548e-06, "loss": 0.9438, "step": 5776 }, { "epoch": 0.11, "learning_rate": 4.918658913771261e-06, "loss": 0.8287, "step": 5777 }, { "epoch": 0.11, "learning_rate": 4.918620257990776e-06, "loss": 1.1233, "step": 5778 }, { "epoch": 0.11, "learning_rate": 4.918581593179237e-06, "loss": 0.9271, "step": 5779 }, { "epoch": 0.11, "learning_rate": 4.918542919336789e-06, "loss": 1.0626, "step": 5780 }, { "epoch": 0.11, "learning_rate": 4.9185042364635745e-06, "loss": 1.0837, "step": 5781 }, { "epoch": 0.11, "learning_rate": 4.9184655445597405e-06, "loss": 0.9312, "step": 5782 }, { "epoch": 0.11, "learning_rate": 4.91842684362543e-06, "loss": 0.7599, "step": 5783 }, { "epoch": 0.11, "learning_rate": 4.918388133660788e-06, "loss": 0.7984, "step": 5784 }, { "epoch": 0.11, "learning_rate": 4.9183494146659575e-06, "loss": 0.9136, "step": 5785 }, { "epoch": 0.11, "learning_rate": 4.918310686641085e-06, "loss": 1.0563, "step": 5786 }, { "epoch": 0.11, "learning_rate": 4.918271949586316e-06, "loss": 1.048, "step": 5787 }, { "epoch": 0.11, "learning_rate": 4.9182332035017925e-06, "loss": 1.0103, "step": 5788 }, { "epoch": 0.11, "learning_rate": 4.918194448387661e-06, "loss": 0.8054, "step": 5789 }, { "epoch": 0.11, "learning_rate": 4.9181556842440644e-06, "loss": 0.9363, "step": 5790 }, { "epoch": 0.11, "learning_rate": 4.91811691107115e-06, "loss": 0.9268, "step": 5791 }, { "epoch": 0.11, "learning_rate": 4.918078128869061e-06, "loss": 0.884, "step": 5792 }, { "epoch": 0.11, "learning_rate": 4.918039337637941e-06, "loss": 1.0806, "step": 5793 }, { "epoch": 0.11, "learning_rate": 4.9180005373779375e-06, "loss": 1.1554, "step": 5794 }, { "epoch": 0.11, "learning_rate": 4.917961728089194e-06, "loss": 0.9211, "step": 5795 }, { "epoch": 0.11, "learning_rate": 4.917922909771855e-06, "loss": 1.0919, "step": 5796 }, { "epoch": 0.11, "learning_rate": 4.9178840824260665e-06, "loss": 0.9396, "step": 5797 }, { "epoch": 0.11, "learning_rate": 4.917845246051973e-06, "loss": 0.8887, "step": 5798 }, { "epoch": 0.11, "learning_rate": 4.917806400649719e-06, "loss": 1.1474, "step": 5799 }, { "epoch": 0.11, "learning_rate": 4.9177675462194505e-06, "loss": 1.0499, "step": 5800 }, { "epoch": 0.11, "learning_rate": 4.917728682761312e-06, "loss": 1.0155, "step": 5801 }, { "epoch": 0.11, "learning_rate": 4.917689810275449e-06, "loss": 0.9259, "step": 5802 }, { "epoch": 0.11, "learning_rate": 4.917650928762006e-06, "loss": 0.8608, "step": 5803 }, { "epoch": 0.11, "learning_rate": 4.917612038221129e-06, "loss": 1.0082, "step": 5804 }, { "epoch": 0.11, "learning_rate": 4.917573138652962e-06, "loss": 0.8659, "step": 5805 }, { "epoch": 0.11, "learning_rate": 4.917534230057651e-06, "loss": 1.1407, "step": 5806 }, { "epoch": 0.11, "learning_rate": 4.917495312435343e-06, "loss": 0.943, "step": 5807 }, { "epoch": 0.11, "learning_rate": 4.91745638578618e-06, "loss": 0.9365, "step": 5808 }, { "epoch": 0.11, "learning_rate": 4.917417450110309e-06, "loss": 1.0052, "step": 5809 }, { "epoch": 0.11, "learning_rate": 4.917378505407876e-06, "loss": 0.9045, "step": 5810 }, { "epoch": 0.11, "learning_rate": 4.917339551679026e-06, "loss": 0.9844, "step": 5811 }, { "epoch": 0.11, "learning_rate": 4.917300588923903e-06, "loss": 1.2267, "step": 5812 }, { "epoch": 0.11, "learning_rate": 4.917261617142654e-06, "loss": 1.0741, "step": 5813 }, { "epoch": 0.11, "learning_rate": 4.9172226363354255e-06, "loss": 1.0047, "step": 5814 }, { "epoch": 0.11, "learning_rate": 4.917183646502361e-06, "loss": 0.8525, "step": 5815 }, { "epoch": 0.11, "learning_rate": 4.917144647643607e-06, "loss": 0.8607, "step": 5816 }, { "epoch": 0.11, "learning_rate": 4.917105639759309e-06, "loss": 1.0193, "step": 5817 }, { "epoch": 0.11, "learning_rate": 4.917066622849612e-06, "loss": 1.138, "step": 5818 }, { "epoch": 0.11, "learning_rate": 4.917027596914663e-06, "loss": 1.0776, "step": 5819 }, { "epoch": 0.11, "learning_rate": 4.916988561954606e-06, "loss": 0.7509, "step": 5820 }, { "epoch": 0.11, "learning_rate": 4.9169495179695895e-06, "loss": 0.9254, "step": 5821 }, { "epoch": 0.11, "learning_rate": 4.916910464959756e-06, "loss": 1.022, "step": 5822 }, { "epoch": 0.11, "learning_rate": 4.9168714029252544e-06, "loss": 0.8958, "step": 5823 }, { "epoch": 0.11, "learning_rate": 4.916832331866229e-06, "loss": 1.034, "step": 5824 }, { "epoch": 0.11, "learning_rate": 4.916793251782825e-06, "loss": 1.0025, "step": 5825 }, { "epoch": 0.11, "learning_rate": 4.916754162675189e-06, "loss": 0.9583, "step": 5826 }, { "epoch": 0.11, "learning_rate": 4.916715064543468e-06, "loss": 0.9438, "step": 5827 }, { "epoch": 0.11, "learning_rate": 4.916675957387806e-06, "loss": 0.9048, "step": 5828 }, { "epoch": 0.11, "learning_rate": 4.916636841208351e-06, "loss": 1.1205, "step": 5829 }, { "epoch": 0.11, "learning_rate": 4.916597716005247e-06, "loss": 0.9871, "step": 5830 }, { "epoch": 0.11, "learning_rate": 4.916558581778642e-06, "loss": 1.2367, "step": 5831 }, { "epoch": 0.11, "learning_rate": 4.916519438528681e-06, "loss": 1.0976, "step": 5832 }, { "epoch": 0.11, "learning_rate": 4.91648028625551e-06, "loss": 0.8555, "step": 5833 }, { "epoch": 0.11, "learning_rate": 4.916441124959277e-06, "loss": 0.9846, "step": 5834 }, { "epoch": 0.11, "learning_rate": 4.916401954640127e-06, "loss": 1.0209, "step": 5835 }, { "epoch": 0.11, "learning_rate": 4.916362775298205e-06, "loss": 0.8429, "step": 5836 }, { "epoch": 0.11, "learning_rate": 4.916323586933659e-06, "loss": 0.9656, "step": 5837 }, { "epoch": 0.11, "learning_rate": 4.916284389546635e-06, "loss": 0.7693, "step": 5838 }, { "epoch": 0.11, "learning_rate": 4.916245183137279e-06, "loss": 0.9711, "step": 5839 }, { "epoch": 0.11, "learning_rate": 4.9162059677057375e-06, "loss": 0.8517, "step": 5840 }, { "epoch": 0.11, "learning_rate": 4.916166743252157e-06, "loss": 1.0734, "step": 5841 }, { "epoch": 0.11, "learning_rate": 4.916127509776684e-06, "loss": 1.139, "step": 5842 }, { "epoch": 0.11, "learning_rate": 4.916088267279465e-06, "loss": 1.22, "step": 5843 }, { "epoch": 0.11, "learning_rate": 4.916049015760646e-06, "loss": 1.2394, "step": 5844 }, { "epoch": 0.11, "learning_rate": 4.916009755220375e-06, "loss": 1.0526, "step": 5845 }, { "epoch": 0.11, "learning_rate": 4.915970485658797e-06, "loss": 0.9927, "step": 5846 }, { "epoch": 0.11, "learning_rate": 4.91593120707606e-06, "loss": 0.9044, "step": 5847 }, { "epoch": 0.11, "learning_rate": 4.915891919472309e-06, "loss": 0.8616, "step": 5848 }, { "epoch": 0.11, "learning_rate": 4.915852622847692e-06, "loss": 0.9074, "step": 5849 }, { "epoch": 0.11, "learning_rate": 4.915813317202356e-06, "loss": 0.9919, "step": 5850 }, { "epoch": 0.11, "learning_rate": 4.915774002536446e-06, "loss": 0.9605, "step": 5851 }, { "epoch": 0.11, "learning_rate": 4.91573467885011e-06, "loss": 0.8694, "step": 5852 }, { "epoch": 0.11, "learning_rate": 4.915695346143496e-06, "loss": 0.8087, "step": 5853 }, { "epoch": 0.11, "learning_rate": 4.915656004416749e-06, "loss": 0.9085, "step": 5854 }, { "epoch": 0.11, "learning_rate": 4.915616653670017e-06, "loss": 0.8698, "step": 5855 }, { "epoch": 0.11, "learning_rate": 4.915577293903445e-06, "loss": 0.951, "step": 5856 }, { "epoch": 0.11, "learning_rate": 4.915537925117183e-06, "loss": 0.8761, "step": 5857 }, { "epoch": 0.11, "learning_rate": 4.915498547311376e-06, "loss": 0.9236, "step": 5858 }, { "epoch": 0.11, "learning_rate": 4.915459160486171e-06, "loss": 0.773, "step": 5859 }, { "epoch": 0.11, "learning_rate": 4.915419764641716e-06, "loss": 1.0804, "step": 5860 }, { "epoch": 0.11, "learning_rate": 4.915380359778157e-06, "loss": 0.9598, "step": 5861 }, { "epoch": 0.11, "learning_rate": 4.9153409458956424e-06, "loss": 1.1043, "step": 5862 }, { "epoch": 0.11, "learning_rate": 4.915301522994319e-06, "loss": 1.094, "step": 5863 }, { "epoch": 0.11, "learning_rate": 4.915262091074333e-06, "loss": 1.0277, "step": 5864 }, { "epoch": 0.11, "learning_rate": 4.915222650135833e-06, "loss": 1.0908, "step": 5865 }, { "epoch": 0.11, "learning_rate": 4.915183200178965e-06, "loss": 1.0719, "step": 5866 }, { "epoch": 0.11, "learning_rate": 4.915143741203878e-06, "loss": 1.1271, "step": 5867 }, { "epoch": 0.11, "learning_rate": 4.915104273210718e-06, "loss": 1.0101, "step": 5868 }, { "epoch": 0.11, "learning_rate": 4.9150647961996325e-06, "loss": 1.0803, "step": 5869 }, { "epoch": 0.11, "learning_rate": 4.9150253101707695e-06, "loss": 1.0371, "step": 5870 }, { "epoch": 0.11, "learning_rate": 4.914985815124276e-06, "loss": 0.9682, "step": 5871 }, { "epoch": 0.11, "learning_rate": 4.914946311060299e-06, "loss": 0.9205, "step": 5872 }, { "epoch": 0.11, "learning_rate": 4.9149067979789864e-06, "loss": 0.8524, "step": 5873 }, { "epoch": 0.11, "learning_rate": 4.914867275880487e-06, "loss": 0.9923, "step": 5874 }, { "epoch": 0.11, "learning_rate": 4.914827744764946e-06, "loss": 1.2068, "step": 5875 }, { "epoch": 0.11, "learning_rate": 4.9147882046325125e-06, "loss": 1.0939, "step": 5876 }, { "epoch": 0.11, "learning_rate": 4.914748655483334e-06, "loss": 0.8593, "step": 5877 }, { "epoch": 0.11, "learning_rate": 4.914709097317559e-06, "loss": 1.1298, "step": 5878 }, { "epoch": 0.11, "learning_rate": 4.914669530135333e-06, "loss": 0.8122, "step": 5879 }, { "epoch": 0.11, "learning_rate": 4.914629953936805e-06, "loss": 1.1761, "step": 5880 }, { "epoch": 0.11, "learning_rate": 4.914590368722123e-06, "loss": 1.1066, "step": 5881 }, { "epoch": 0.11, "learning_rate": 4.914550774491435e-06, "loss": 1.0271, "step": 5882 }, { "epoch": 0.11, "learning_rate": 4.9145111712448875e-06, "loss": 0.8169, "step": 5883 }, { "epoch": 0.11, "learning_rate": 4.914471558982631e-06, "loss": 1.0903, "step": 5884 }, { "epoch": 0.11, "learning_rate": 4.91443193770481e-06, "loss": 0.9899, "step": 5885 }, { "epoch": 0.11, "learning_rate": 4.914392307411575e-06, "loss": 0.8795, "step": 5886 }, { "epoch": 0.11, "learning_rate": 4.914352668103073e-06, "loss": 0.9463, "step": 5887 }, { "epoch": 0.11, "learning_rate": 4.914313019779453e-06, "loss": 1.085, "step": 5888 }, { "epoch": 0.11, "learning_rate": 4.914273362440861e-06, "loss": 1.068, "step": 5889 }, { "epoch": 0.11, "learning_rate": 4.914233696087447e-06, "loss": 0.9059, "step": 5890 }, { "epoch": 0.11, "learning_rate": 4.914194020719358e-06, "loss": 1.0632, "step": 5891 }, { "epoch": 0.11, "learning_rate": 4.914154336336743e-06, "loss": 1.1021, "step": 5892 }, { "epoch": 0.11, "learning_rate": 4.914114642939749e-06, "loss": 1.0953, "step": 5893 }, { "epoch": 0.11, "learning_rate": 4.914074940528525e-06, "loss": 1.2538, "step": 5894 }, { "epoch": 0.11, "learning_rate": 4.91403522910322e-06, "loss": 0.8777, "step": 5895 }, { "epoch": 0.11, "learning_rate": 4.913995508663981e-06, "loss": 0.9499, "step": 5896 }, { "epoch": 0.11, "learning_rate": 4.913955779210957e-06, "loss": 0.8823, "step": 5897 }, { "epoch": 0.11, "learning_rate": 4.913916040744296e-06, "loss": 0.8328, "step": 5898 }, { "epoch": 0.11, "learning_rate": 4.913876293264146e-06, "loss": 1.3137, "step": 5899 }, { "epoch": 0.11, "learning_rate": 4.913836536770657e-06, "loss": 1.0079, "step": 5900 }, { "epoch": 0.11, "learning_rate": 4.913796771263975e-06, "loss": 0.83, "step": 5901 }, { "epoch": 0.11, "learning_rate": 4.91375699674425e-06, "loss": 1.059, "step": 5902 }, { "epoch": 0.11, "learning_rate": 4.913717213211632e-06, "loss": 0.9451, "step": 5903 }, { "epoch": 0.11, "learning_rate": 4.913677420666267e-06, "loss": 0.9122, "step": 5904 }, { "epoch": 0.11, "learning_rate": 4.913637619108304e-06, "loss": 1.1246, "step": 5905 }, { "epoch": 0.11, "learning_rate": 4.9135978085378925e-06, "loss": 1.1497, "step": 5906 }, { "epoch": 0.11, "learning_rate": 4.913557988955181e-06, "loss": 1.0358, "step": 5907 }, { "epoch": 0.11, "learning_rate": 4.913518160360318e-06, "loss": 0.97, "step": 5908 }, { "epoch": 0.11, "learning_rate": 4.913478322753452e-06, "loss": 0.9423, "step": 5909 }, { "epoch": 0.11, "learning_rate": 4.913438476134732e-06, "loss": 1.0627, "step": 5910 }, { "epoch": 0.11, "learning_rate": 4.913398620504306e-06, "loss": 0.6923, "step": 5911 }, { "epoch": 0.11, "learning_rate": 4.913358755862325e-06, "loss": 1.12, "step": 5912 }, { "epoch": 0.11, "learning_rate": 4.913318882208935e-06, "loss": 1.0341, "step": 5913 }, { "epoch": 0.11, "learning_rate": 4.913278999544288e-06, "loss": 0.8393, "step": 5914 }, { "epoch": 0.11, "learning_rate": 4.913239107868529e-06, "loss": 1.0361, "step": 5915 }, { "epoch": 0.11, "learning_rate": 4.9131992071818106e-06, "loss": 0.96, "step": 5916 }, { "epoch": 0.11, "learning_rate": 4.91315929748428e-06, "loss": 1.2738, "step": 5917 }, { "epoch": 0.11, "learning_rate": 4.9131193787760865e-06, "loss": 1.0034, "step": 5918 }, { "epoch": 0.11, "learning_rate": 4.913079451057379e-06, "loss": 1.1173, "step": 5919 }, { "epoch": 0.11, "learning_rate": 4.913039514328308e-06, "loss": 1.0814, "step": 5920 }, { "epoch": 0.11, "learning_rate": 4.91299956858902e-06, "loss": 0.8211, "step": 5921 }, { "epoch": 0.11, "learning_rate": 4.9129596138396665e-06, "loss": 0.7653, "step": 5922 }, { "epoch": 0.11, "learning_rate": 4.912919650080395e-06, "loss": 0.7952, "step": 5923 }, { "epoch": 0.11, "learning_rate": 4.9128796773113565e-06, "loss": 1.0655, "step": 5924 }, { "epoch": 0.11, "learning_rate": 4.9128396955326985e-06, "loss": 1.3275, "step": 5925 }, { "epoch": 0.11, "learning_rate": 4.912799704744572e-06, "loss": 1.0203, "step": 5926 }, { "epoch": 0.11, "learning_rate": 4.9127597049471244e-06, "loss": 1.0721, "step": 5927 }, { "epoch": 0.11, "learning_rate": 4.9127196961405065e-06, "loss": 0.9091, "step": 5928 }, { "epoch": 0.11, "learning_rate": 4.9126796783248665e-06, "loss": 0.9064, "step": 5929 }, { "epoch": 0.11, "learning_rate": 4.912639651500355e-06, "loss": 1.061, "step": 5930 }, { "epoch": 0.11, "learning_rate": 4.912599615667122e-06, "loss": 1.1957, "step": 5931 }, { "epoch": 0.11, "learning_rate": 4.912559570825315e-06, "loss": 1.1376, "step": 5932 }, { "epoch": 0.11, "learning_rate": 4.912519516975084e-06, "loss": 0.8853, "step": 5933 }, { "epoch": 0.11, "learning_rate": 4.91247945411658e-06, "loss": 0.8423, "step": 5934 }, { "epoch": 0.11, "learning_rate": 4.9124393822499515e-06, "loss": 0.8718, "step": 5935 }, { "epoch": 0.11, "learning_rate": 4.912399301375349e-06, "loss": 1.1682, "step": 5936 }, { "epoch": 0.11, "learning_rate": 4.91235921149292e-06, "loss": 1.3424, "step": 5937 }, { "epoch": 0.11, "learning_rate": 4.912319112602817e-06, "loss": 1.0707, "step": 5938 }, { "epoch": 0.11, "learning_rate": 4.912279004705187e-06, "loss": 1.0315, "step": 5939 }, { "epoch": 0.11, "learning_rate": 4.912238887800182e-06, "loss": 1.0089, "step": 5940 }, { "epoch": 0.11, "learning_rate": 4.912198761887952e-06, "loss": 0.9741, "step": 5941 }, { "epoch": 0.11, "learning_rate": 4.912158626968644e-06, "loss": 0.9735, "step": 5942 }, { "epoch": 0.11, "learning_rate": 4.91211848304241e-06, "loss": 1.0198, "step": 5943 }, { "epoch": 0.11, "learning_rate": 4.9120783301094e-06, "loss": 0.9988, "step": 5944 }, { "epoch": 0.11, "learning_rate": 4.912038168169764e-06, "loss": 0.9356, "step": 5945 }, { "epoch": 0.11, "learning_rate": 4.9119979972236506e-06, "loss": 0.8731, "step": 5946 }, { "epoch": 0.11, "learning_rate": 4.911957817271211e-06, "loss": 0.9044, "step": 5947 }, { "epoch": 0.11, "learning_rate": 4.9119176283125945e-06, "loss": 1.0016, "step": 5948 }, { "epoch": 0.11, "learning_rate": 4.911877430347952e-06, "loss": 1.1541, "step": 5949 }, { "epoch": 0.11, "learning_rate": 4.911837223377432e-06, "loss": 1.1429, "step": 5950 }, { "epoch": 0.11, "learning_rate": 4.911797007401187e-06, "loss": 0.8992, "step": 5951 }, { "epoch": 0.11, "learning_rate": 4.9117567824193654e-06, "loss": 0.9321, "step": 5952 }, { "epoch": 0.11, "learning_rate": 4.911716548432118e-06, "loss": 0.9599, "step": 5953 }, { "epoch": 0.11, "learning_rate": 4.9116763054395955e-06, "loss": 1.0707, "step": 5954 }, { "epoch": 0.11, "learning_rate": 4.911636053441947e-06, "loss": 0.8986, "step": 5955 }, { "epoch": 0.11, "learning_rate": 4.9115957924393235e-06, "loss": 1.1602, "step": 5956 }, { "epoch": 0.11, "learning_rate": 4.911555522431875e-06, "loss": 0.7862, "step": 5957 }, { "epoch": 0.11, "learning_rate": 4.911515243419752e-06, "loss": 0.6967, "step": 5958 }, { "epoch": 0.11, "learning_rate": 4.911474955403106e-06, "loss": 0.9269, "step": 5959 }, { "epoch": 0.11, "learning_rate": 4.911434658382086e-06, "loss": 1.0559, "step": 5960 }, { "epoch": 0.11, "learning_rate": 4.911394352356842e-06, "loss": 0.7309, "step": 5961 }, { "epoch": 0.11, "learning_rate": 4.9113540373275274e-06, "loss": 1.3157, "step": 5962 }, { "epoch": 0.11, "learning_rate": 4.911313713294289e-06, "loss": 1.0394, "step": 5963 }, { "epoch": 0.11, "learning_rate": 4.91127338025728e-06, "loss": 1.0632, "step": 5964 }, { "epoch": 0.11, "learning_rate": 4.911233038216649e-06, "loss": 0.9029, "step": 5965 }, { "epoch": 0.11, "learning_rate": 4.911192687172549e-06, "loss": 0.8192, "step": 5966 }, { "epoch": 0.11, "learning_rate": 4.91115232712513e-06, "loss": 0.8239, "step": 5967 }, { "epoch": 0.11, "learning_rate": 4.9111119580745404e-06, "loss": 1.1741, "step": 5968 }, { "epoch": 0.11, "learning_rate": 4.911071580020933e-06, "loss": 1.0437, "step": 5969 }, { "epoch": 0.11, "learning_rate": 4.911031192964459e-06, "loss": 1.02, "step": 5970 }, { "epoch": 0.11, "learning_rate": 4.910990796905268e-06, "loss": 1.0417, "step": 5971 }, { "epoch": 0.11, "learning_rate": 4.910950391843512e-06, "loss": 0.8513, "step": 5972 }, { "epoch": 0.11, "learning_rate": 4.91090997777934e-06, "loss": 1.0438, "step": 5973 }, { "epoch": 0.11, "learning_rate": 4.910869554712905e-06, "loss": 1.0442, "step": 5974 }, { "epoch": 0.11, "learning_rate": 4.910829122644357e-06, "loss": 1.4626, "step": 5975 }, { "epoch": 0.11, "learning_rate": 4.910788681573846e-06, "loss": 0.8962, "step": 5976 }, { "epoch": 0.11, "learning_rate": 4.910748231501524e-06, "loss": 0.5996, "step": 5977 }, { "epoch": 0.11, "learning_rate": 4.910707772427543e-06, "loss": 0.8547, "step": 5978 }, { "epoch": 0.11, "learning_rate": 4.910667304352053e-06, "loss": 0.8315, "step": 5979 }, { "epoch": 0.11, "learning_rate": 4.910626827275205e-06, "loss": 1.007, "step": 5980 }, { "epoch": 0.11, "learning_rate": 4.91058634119715e-06, "loss": 1.1948, "step": 5981 }, { "epoch": 0.11, "learning_rate": 4.91054584611804e-06, "loss": 0.974, "step": 5982 }, { "epoch": 0.11, "learning_rate": 4.910505342038026e-06, "loss": 0.8149, "step": 5983 }, { "epoch": 0.11, "learning_rate": 4.910464828957258e-06, "loss": 1.1315, "step": 5984 }, { "epoch": 0.11, "learning_rate": 4.910424306875888e-06, "loss": 0.8282, "step": 5985 }, { "epoch": 0.11, "learning_rate": 4.9103837757940685e-06, "loss": 0.8992, "step": 5986 }, { "epoch": 0.11, "learning_rate": 4.9103432357119495e-06, "loss": 1.2824, "step": 5987 }, { "epoch": 0.11, "learning_rate": 4.9103026866296835e-06, "loss": 1.0026, "step": 5988 }, { "epoch": 0.11, "learning_rate": 4.9102621285474205e-06, "loss": 0.869, "step": 5989 }, { "epoch": 0.11, "learning_rate": 4.910221561465312e-06, "loss": 0.9943, "step": 5990 }, { "epoch": 0.11, "learning_rate": 4.910180985383511e-06, "loss": 0.9193, "step": 5991 }, { "epoch": 0.11, "learning_rate": 4.910140400302168e-06, "loss": 1.0377, "step": 5992 }, { "epoch": 0.11, "learning_rate": 4.910099806221434e-06, "loss": 1.1375, "step": 5993 }, { "epoch": 0.11, "learning_rate": 4.910059203141462e-06, "loss": 1.0577, "step": 5994 }, { "epoch": 0.11, "learning_rate": 4.910018591062403e-06, "loss": 0.9609, "step": 5995 }, { "epoch": 0.11, "learning_rate": 4.909977969984408e-06, "loss": 0.9948, "step": 5996 }, { "epoch": 0.11, "learning_rate": 4.909937339907629e-06, "loss": 0.8507, "step": 5997 }, { "epoch": 0.11, "learning_rate": 4.909896700832218e-06, "loss": 0.9592, "step": 5998 }, { "epoch": 0.11, "learning_rate": 4.909856052758327e-06, "loss": 1.0965, "step": 5999 }, { "epoch": 0.11, "learning_rate": 4.909815395686107e-06, "loss": 1.0577, "step": 6000 }, { "epoch": 0.11, "learning_rate": 4.90977472961571e-06, "loss": 0.9689, "step": 6001 }, { "epoch": 0.11, "learning_rate": 4.909734054547288e-06, "loss": 0.9722, "step": 6002 }, { "epoch": 0.11, "learning_rate": 4.909693370480994e-06, "loss": 1.0267, "step": 6003 }, { "epoch": 0.11, "learning_rate": 4.909652677416977e-06, "loss": 0.9753, "step": 6004 }, { "epoch": 0.11, "learning_rate": 4.9096119753553925e-06, "loss": 0.8714, "step": 6005 }, { "epoch": 0.11, "learning_rate": 4.90957126429639e-06, "loss": 1.1601, "step": 6006 }, { "epoch": 0.11, "learning_rate": 4.909530544240122e-06, "loss": 0.9431, "step": 6007 }, { "epoch": 0.11, "learning_rate": 4.909489815186741e-06, "loss": 0.8962, "step": 6008 }, { "epoch": 0.11, "learning_rate": 4.9094490771363986e-06, "loss": 1.0406, "step": 6009 }, { "epoch": 0.11, "learning_rate": 4.909408330089248e-06, "loss": 0.7971, "step": 6010 }, { "epoch": 0.11, "learning_rate": 4.90936757404544e-06, "loss": 0.9932, "step": 6011 }, { "epoch": 0.11, "learning_rate": 4.909326809005129e-06, "loss": 0.9518, "step": 6012 }, { "epoch": 0.11, "learning_rate": 4.909286034968463e-06, "loss": 1.178, "step": 6013 }, { "epoch": 0.11, "learning_rate": 4.909245251935598e-06, "loss": 1.0135, "step": 6014 }, { "epoch": 0.11, "learning_rate": 4.909204459906686e-06, "loss": 0.8608, "step": 6015 }, { "epoch": 0.11, "learning_rate": 4.909163658881877e-06, "loss": 0.9772, "step": 6016 }, { "epoch": 0.11, "learning_rate": 4.909122848861325e-06, "loss": 0.9608, "step": 6017 }, { "epoch": 0.11, "learning_rate": 4.909082029845182e-06, "loss": 1.0402, "step": 6018 }, { "epoch": 0.11, "learning_rate": 4.909041201833602e-06, "loss": 1.0493, "step": 6019 }, { "epoch": 0.11, "learning_rate": 4.909000364826735e-06, "loss": 1.2413, "step": 6020 }, { "epoch": 0.11, "learning_rate": 4.908959518824734e-06, "loss": 1.1204, "step": 6021 }, { "epoch": 0.11, "learning_rate": 4.908918663827753e-06, "loss": 1.0137, "step": 6022 }, { "epoch": 0.11, "learning_rate": 4.908877799835943e-06, "loss": 0.9861, "step": 6023 }, { "epoch": 0.11, "learning_rate": 4.908836926849457e-06, "loss": 0.9195, "step": 6024 }, { "epoch": 0.11, "learning_rate": 4.908796044868448e-06, "loss": 1.3367, "step": 6025 }, { "epoch": 0.11, "learning_rate": 4.908755153893069e-06, "loss": 0.8844, "step": 6026 }, { "epoch": 0.11, "learning_rate": 4.908714253923471e-06, "loss": 0.9499, "step": 6027 }, { "epoch": 0.11, "learning_rate": 4.908673344959809e-06, "loss": 0.9462, "step": 6028 }, { "epoch": 0.11, "learning_rate": 4.9086324270022335e-06, "loss": 0.8384, "step": 6029 }, { "epoch": 0.11, "learning_rate": 4.908591500050899e-06, "loss": 0.9147, "step": 6030 }, { "epoch": 0.11, "learning_rate": 4.908550564105958e-06, "loss": 1.1225, "step": 6031 }, { "epoch": 0.11, "learning_rate": 4.908509619167562e-06, "loss": 1.039, "step": 6032 }, { "epoch": 0.11, "learning_rate": 4.9084686652358655e-06, "loss": 0.8604, "step": 6033 }, { "epoch": 0.11, "learning_rate": 4.9084277023110205e-06, "loss": 0.7827, "step": 6034 }, { "epoch": 0.11, "learning_rate": 4.908386730393181e-06, "loss": 0.8332, "step": 6035 }, { "epoch": 0.11, "learning_rate": 4.908345749482499e-06, "loss": 0.9902, "step": 6036 }, { "epoch": 0.11, "learning_rate": 4.9083047595791275e-06, "loss": 1.136, "step": 6037 }, { "epoch": 0.11, "learning_rate": 4.90826376068322e-06, "loss": 1.1876, "step": 6038 }, { "epoch": 0.11, "learning_rate": 4.90822275279493e-06, "loss": 0.8813, "step": 6039 }, { "epoch": 0.11, "learning_rate": 4.908181735914409e-06, "loss": 0.9578, "step": 6040 }, { "epoch": 0.11, "learning_rate": 4.908140710041812e-06, "loss": 0.7936, "step": 6041 }, { "epoch": 0.11, "learning_rate": 4.908099675177291e-06, "loss": 0.8703, "step": 6042 }, { "epoch": 0.11, "learning_rate": 4.908058631321e-06, "loss": 1.1697, "step": 6043 }, { "epoch": 0.11, "learning_rate": 4.908017578473092e-06, "loss": 1.0533, "step": 6044 }, { "epoch": 0.11, "learning_rate": 4.90797651663372e-06, "loss": 0.968, "step": 6045 }, { "epoch": 0.11, "learning_rate": 4.907935445803038e-06, "loss": 0.988, "step": 6046 }, { "epoch": 0.11, "learning_rate": 4.9078943659811986e-06, "loss": 0.8633, "step": 6047 }, { "epoch": 0.11, "learning_rate": 4.907853277168355e-06, "loss": 0.9116, "step": 6048 }, { "epoch": 0.11, "learning_rate": 4.907812179364661e-06, "loss": 0.9186, "step": 6049 }, { "epoch": 0.11, "learning_rate": 4.907771072570271e-06, "loss": 1.1305, "step": 6050 }, { "epoch": 0.11, "learning_rate": 4.907729956785338e-06, "loss": 1.1494, "step": 6051 }, { "epoch": 0.11, "learning_rate": 4.907688832010013e-06, "loss": 1.0488, "step": 6052 }, { "epoch": 0.11, "learning_rate": 4.907647698244454e-06, "loss": 0.899, "step": 6053 }, { "epoch": 0.11, "learning_rate": 4.90760655548881e-06, "loss": 0.8047, "step": 6054 }, { "epoch": 0.11, "learning_rate": 4.9075654037432394e-06, "loss": 0.8619, "step": 6055 }, { "epoch": 0.11, "learning_rate": 4.907524243007893e-06, "loss": 1.2668, "step": 6056 }, { "epoch": 0.11, "learning_rate": 4.907483073282923e-06, "loss": 1.0618, "step": 6057 }, { "epoch": 0.11, "learning_rate": 4.9074418945684865e-06, "loss": 1.1449, "step": 6058 }, { "epoch": 0.11, "learning_rate": 4.9074007068647355e-06, "loss": 0.8472, "step": 6059 }, { "epoch": 0.11, "learning_rate": 4.907359510171824e-06, "loss": 0.9294, "step": 6060 }, { "epoch": 0.11, "learning_rate": 4.907318304489907e-06, "loss": 0.9331, "step": 6061 }, { "epoch": 0.11, "learning_rate": 4.907277089819136e-06, "loss": 0.9857, "step": 6062 }, { "epoch": 0.11, "learning_rate": 4.907235866159666e-06, "loss": 0.9763, "step": 6063 }, { "epoch": 0.11, "learning_rate": 4.907194633511652e-06, "loss": 1.0005, "step": 6064 }, { "epoch": 0.11, "learning_rate": 4.907153391875245e-06, "loss": 1.0129, "step": 6065 }, { "epoch": 0.11, "learning_rate": 4.907112141250604e-06, "loss": 1.0077, "step": 6066 }, { "epoch": 0.11, "learning_rate": 4.907070881637878e-06, "loss": 0.8466, "step": 6067 }, { "epoch": 0.11, "learning_rate": 4.907029613037224e-06, "loss": 1.0857, "step": 6068 }, { "epoch": 0.11, "learning_rate": 4.906988335448795e-06, "loss": 0.9074, "step": 6069 }, { "epoch": 0.11, "learning_rate": 4.9069470488727454e-06, "loss": 1.1938, "step": 6070 }, { "epoch": 0.11, "learning_rate": 4.906905753309229e-06, "loss": 0.7395, "step": 6071 }, { "epoch": 0.11, "learning_rate": 4.9068644487584005e-06, "loss": 1.0286, "step": 6072 }, { "epoch": 0.11, "learning_rate": 4.906823135220414e-06, "loss": 0.8385, "step": 6073 }, { "epoch": 0.11, "learning_rate": 4.906781812695423e-06, "loss": 0.9026, "step": 6074 }, { "epoch": 0.11, "learning_rate": 4.906740481183584e-06, "loss": 1.0723, "step": 6075 }, { "epoch": 0.11, "learning_rate": 4.9066991406850496e-06, "loss": 0.9467, "step": 6076 }, { "epoch": 0.11, "learning_rate": 4.906657791199973e-06, "loss": 0.7832, "step": 6077 }, { "epoch": 0.11, "learning_rate": 4.906616432728512e-06, "loss": 0.8807, "step": 6078 }, { "epoch": 0.11, "learning_rate": 4.906575065270818e-06, "loss": 0.8091, "step": 6079 }, { "epoch": 0.11, "learning_rate": 4.906533688827046e-06, "loss": 1.034, "step": 6080 }, { "epoch": 0.11, "learning_rate": 4.906492303397351e-06, "loss": 1.0691, "step": 6081 }, { "epoch": 0.11, "learning_rate": 4.906450908981888e-06, "loss": 0.9563, "step": 6082 }, { "epoch": 0.11, "learning_rate": 4.9064095055808116e-06, "loss": 0.8493, "step": 6083 }, { "epoch": 0.11, "learning_rate": 4.906368093194275e-06, "loss": 1.0043, "step": 6084 }, { "epoch": 0.11, "learning_rate": 4.906326671822433e-06, "loss": 0.8337, "step": 6085 }, { "epoch": 0.11, "learning_rate": 4.906285241465443e-06, "loss": 0.9626, "step": 6086 }, { "epoch": 0.11, "learning_rate": 4.906243802123457e-06, "loss": 1.0928, "step": 6087 }, { "epoch": 0.11, "learning_rate": 4.9062023537966295e-06, "loss": 1.0459, "step": 6088 }, { "epoch": 0.11, "learning_rate": 4.906160896485117e-06, "loss": 0.9341, "step": 6089 }, { "epoch": 0.11, "learning_rate": 4.906119430189074e-06, "loss": 0.9046, "step": 6090 }, { "epoch": 0.11, "learning_rate": 4.9060779549086535e-06, "loss": 1.1154, "step": 6091 }, { "epoch": 0.11, "learning_rate": 4.906036470644012e-06, "loss": 0.886, "step": 6092 }, { "epoch": 0.11, "learning_rate": 4.905994977395304e-06, "loss": 1.3126, "step": 6093 }, { "epoch": 0.11, "learning_rate": 4.905953475162685e-06, "loss": 1.1526, "step": 6094 }, { "epoch": 0.11, "learning_rate": 4.90591196394631e-06, "loss": 1.0175, "step": 6095 }, { "epoch": 0.12, "learning_rate": 4.905870443746332e-06, "loss": 0.9758, "step": 6096 }, { "epoch": 0.12, "learning_rate": 4.905828914562909e-06, "loss": 0.7854, "step": 6097 }, { "epoch": 0.12, "learning_rate": 4.905787376396194e-06, "loss": 1.0782, "step": 6098 }, { "epoch": 0.12, "learning_rate": 4.905745829246343e-06, "loss": 0.9782, "step": 6099 }, { "epoch": 0.12, "learning_rate": 4.90570427311351e-06, "loss": 1.2065, "step": 6100 }, { "epoch": 0.12, "learning_rate": 4.905662707997852e-06, "loss": 0.8894, "step": 6101 }, { "epoch": 0.12, "learning_rate": 4.905621133899522e-06, "loss": 1.0355, "step": 6102 }, { "epoch": 0.12, "learning_rate": 4.9055795508186775e-06, "loss": 0.9001, "step": 6103 }, { "epoch": 0.12, "learning_rate": 4.905537958755473e-06, "loss": 0.8093, "step": 6104 }, { "epoch": 0.12, "learning_rate": 4.905496357710062e-06, "loss": 0.883, "step": 6105 }, { "epoch": 0.12, "learning_rate": 4.905454747682603e-06, "loss": 1.16, "step": 6106 }, { "epoch": 0.12, "learning_rate": 4.905413128673249e-06, "loss": 0.8463, "step": 6107 }, { "epoch": 0.12, "learning_rate": 4.905371500682156e-06, "loss": 0.8519, "step": 6108 }, { "epoch": 0.12, "learning_rate": 4.90532986370948e-06, "loss": 1.1613, "step": 6109 }, { "epoch": 0.12, "learning_rate": 4.905288217755375e-06, "loss": 0.9279, "step": 6110 }, { "epoch": 0.12, "learning_rate": 4.905246562819998e-06, "loss": 0.9901, "step": 6111 }, { "epoch": 0.12, "learning_rate": 4.905204898903505e-06, "loss": 1.0025, "step": 6112 }, { "epoch": 0.12, "learning_rate": 4.90516322600605e-06, "loss": 1.1774, "step": 6113 }, { "epoch": 0.12, "learning_rate": 4.905121544127789e-06, "loss": 1.0081, "step": 6114 }, { "epoch": 0.12, "learning_rate": 4.905079853268879e-06, "loss": 0.8354, "step": 6115 }, { "epoch": 0.12, "learning_rate": 4.905038153429473e-06, "loss": 0.9103, "step": 6116 }, { "epoch": 0.12, "learning_rate": 4.90499644460973e-06, "loss": 0.887, "step": 6117 }, { "epoch": 0.12, "learning_rate": 4.904954726809802e-06, "loss": 1.1741, "step": 6118 }, { "epoch": 0.12, "learning_rate": 4.9049130000298486e-06, "loss": 1.1548, "step": 6119 }, { "epoch": 0.12, "learning_rate": 4.9048712642700224e-06, "loss": 0.9148, "step": 6120 }, { "epoch": 0.12, "learning_rate": 4.9048295195304816e-06, "loss": 0.8117, "step": 6121 }, { "epoch": 0.12, "learning_rate": 4.904787765811381e-06, "loss": 0.9262, "step": 6122 }, { "epoch": 0.12, "learning_rate": 4.9047460031128755e-06, "loss": 0.8351, "step": 6123 }, { "epoch": 0.12, "learning_rate": 4.904704231435124e-06, "loss": 0.9437, "step": 6124 }, { "epoch": 0.12, "learning_rate": 4.904662450778279e-06, "loss": 1.2763, "step": 6125 }, { "epoch": 0.12, "learning_rate": 4.904620661142499e-06, "loss": 0.8611, "step": 6126 }, { "epoch": 0.12, "learning_rate": 4.904578862527939e-06, "loss": 1.0675, "step": 6127 }, { "epoch": 0.12, "learning_rate": 4.904537054934755e-06, "loss": 0.8955, "step": 6128 }, { "epoch": 0.12, "learning_rate": 4.904495238363104e-06, "loss": 0.7527, "step": 6129 }, { "epoch": 0.12, "learning_rate": 4.904453412813141e-06, "loss": 1.0233, "step": 6130 }, { "epoch": 0.12, "learning_rate": 4.904411578285023e-06, "loss": 1.0865, "step": 6131 }, { "epoch": 0.12, "learning_rate": 4.904369734778906e-06, "loss": 1.0348, "step": 6132 }, { "epoch": 0.12, "learning_rate": 4.904327882294945e-06, "loss": 0.9658, "step": 6133 }, { "epoch": 0.12, "learning_rate": 4.904286020833299e-06, "loss": 0.9041, "step": 6134 }, { "epoch": 0.12, "learning_rate": 4.904244150394121e-06, "loss": 0.8151, "step": 6135 }, { "epoch": 0.12, "learning_rate": 4.9042022709775704e-06, "loss": 1.0689, "step": 6136 }, { "epoch": 0.12, "learning_rate": 4.904160382583801e-06, "loss": 1.2474, "step": 6137 }, { "epoch": 0.12, "learning_rate": 4.904118485212972e-06, "loss": 1.1447, "step": 6138 }, { "epoch": 0.12, "learning_rate": 4.904076578865238e-06, "loss": 0.8635, "step": 6139 }, { "epoch": 0.12, "learning_rate": 4.904034663540754e-06, "loss": 0.9211, "step": 6140 }, { "epoch": 0.12, "learning_rate": 4.90399273923968e-06, "loss": 1.033, "step": 6141 }, { "epoch": 0.12, "learning_rate": 4.903950805962171e-06, "loss": 1.0417, "step": 6142 }, { "epoch": 0.12, "learning_rate": 4.903908863708382e-06, "loss": 1.0018, "step": 6143 }, { "epoch": 0.12, "learning_rate": 4.903866912478472e-06, "loss": 1.1843, "step": 6144 }, { "epoch": 0.12, "learning_rate": 4.903824952272597e-06, "loss": 0.8294, "step": 6145 }, { "epoch": 0.12, "learning_rate": 4.903782983090912e-06, "loss": 1.0033, "step": 6146 }, { "epoch": 0.12, "learning_rate": 4.903741004933576e-06, "loss": 0.9076, "step": 6147 }, { "epoch": 0.12, "learning_rate": 4.903699017800745e-06, "loss": 0.9692, "step": 6148 }, { "epoch": 0.12, "learning_rate": 4.903657021692575e-06, "loss": 1.2968, "step": 6149 }, { "epoch": 0.12, "learning_rate": 4.9036150166092236e-06, "loss": 1.148, "step": 6150 }, { "epoch": 0.12, "learning_rate": 4.903573002550848e-06, "loss": 0.8159, "step": 6151 }, { "epoch": 0.12, "learning_rate": 4.903530979517604e-06, "loss": 0.8534, "step": 6152 }, { "epoch": 0.12, "learning_rate": 4.903488947509648e-06, "loss": 0.7484, "step": 6153 }, { "epoch": 0.12, "learning_rate": 4.903446906527139e-06, "loss": 1.0103, "step": 6154 }, { "epoch": 0.12, "learning_rate": 4.903404856570233e-06, "loss": 1.1248, "step": 6155 }, { "epoch": 0.12, "learning_rate": 4.903362797639087e-06, "loss": 1.312, "step": 6156 }, { "epoch": 0.12, "learning_rate": 4.903320729733858e-06, "loss": 1.0726, "step": 6157 }, { "epoch": 0.12, "learning_rate": 4.903278652854703e-06, "loss": 0.7881, "step": 6158 }, { "epoch": 0.12, "learning_rate": 4.903236567001778e-06, "loss": 0.9245, "step": 6159 }, { "epoch": 0.12, "learning_rate": 4.903194472175243e-06, "loss": 0.9283, "step": 6160 }, { "epoch": 0.12, "learning_rate": 4.9031523683752525e-06, "loss": 0.9022, "step": 6161 }, { "epoch": 0.12, "learning_rate": 4.903110255601965e-06, "loss": 1.0336, "step": 6162 }, { "epoch": 0.12, "learning_rate": 4.903068133855538e-06, "loss": 1.0639, "step": 6163 }, { "epoch": 0.12, "learning_rate": 4.903026003136127e-06, "loss": 1.041, "step": 6164 }, { "epoch": 0.12, "learning_rate": 4.902983863443893e-06, "loss": 0.9117, "step": 6165 }, { "epoch": 0.12, "learning_rate": 4.902941714778989e-06, "loss": 0.9232, "step": 6166 }, { "epoch": 0.12, "learning_rate": 4.902899557141575e-06, "loss": 0.758, "step": 6167 }, { "epoch": 0.12, "learning_rate": 4.902857390531807e-06, "loss": 1.0707, "step": 6168 }, { "epoch": 0.12, "learning_rate": 4.9028152149498435e-06, "loss": 1.1163, "step": 6169 }, { "epoch": 0.12, "learning_rate": 4.902773030395842e-06, "loss": 1.0856, "step": 6170 }, { "epoch": 0.12, "learning_rate": 4.90273083686996e-06, "loss": 1.1012, "step": 6171 }, { "epoch": 0.12, "learning_rate": 4.902688634372354e-06, "loss": 0.9304, "step": 6172 }, { "epoch": 0.12, "learning_rate": 4.902646422903182e-06, "loss": 0.9332, "step": 6173 }, { "epoch": 0.12, "learning_rate": 4.902604202462603e-06, "loss": 1.2582, "step": 6174 }, { "epoch": 0.12, "learning_rate": 4.902561973050772e-06, "loss": 0.8472, "step": 6175 }, { "epoch": 0.12, "learning_rate": 4.90251973466785e-06, "loss": 0.9471, "step": 6176 }, { "epoch": 0.12, "learning_rate": 4.902477487313993e-06, "loss": 1.2432, "step": 6177 }, { "epoch": 0.12, "learning_rate": 4.902435230989357e-06, "loss": 0.9527, "step": 6178 }, { "epoch": 0.12, "learning_rate": 4.9023929656941025e-06, "loss": 1.0411, "step": 6179 }, { "epoch": 0.12, "learning_rate": 4.902350691428387e-06, "loss": 1.1545, "step": 6180 }, { "epoch": 0.12, "learning_rate": 4.902308408192367e-06, "loss": 1.2146, "step": 6181 }, { "epoch": 0.12, "learning_rate": 4.902266115986201e-06, "loss": 0.9734, "step": 6182 }, { "epoch": 0.12, "learning_rate": 4.902223814810047e-06, "loss": 0.9054, "step": 6183 }, { "epoch": 0.12, "learning_rate": 4.902181504664062e-06, "loss": 0.9846, "step": 6184 }, { "epoch": 0.12, "learning_rate": 4.902139185548406e-06, "loss": 0.9698, "step": 6185 }, { "epoch": 0.12, "learning_rate": 4.902096857463236e-06, "loss": 0.9449, "step": 6186 }, { "epoch": 0.12, "learning_rate": 4.90205452040871e-06, "loss": 1.131, "step": 6187 }, { "epoch": 0.12, "learning_rate": 4.902012174384986e-06, "loss": 0.9132, "step": 6188 }, { "epoch": 0.12, "learning_rate": 4.901969819392222e-06, "loss": 1.0027, "step": 6189 }, { "epoch": 0.12, "learning_rate": 4.901927455430576e-06, "loss": 1.005, "step": 6190 }, { "epoch": 0.12, "learning_rate": 4.901885082500207e-06, "loss": 1.0064, "step": 6191 }, { "epoch": 0.12, "learning_rate": 4.901842700601273e-06, "loss": 0.7381, "step": 6192 }, { "epoch": 0.12, "learning_rate": 4.901800309733932e-06, "loss": 0.9871, "step": 6193 }, { "epoch": 0.12, "learning_rate": 4.901757909898341e-06, "loss": 0.9341, "step": 6194 }, { "epoch": 0.12, "learning_rate": 4.90171550109466e-06, "loss": 1.0439, "step": 6195 }, { "epoch": 0.12, "learning_rate": 4.901673083323048e-06, "loss": 0.9111, "step": 6196 }, { "epoch": 0.12, "learning_rate": 4.901630656583662e-06, "loss": 0.906, "step": 6197 }, { "epoch": 0.12, "learning_rate": 4.901588220876661e-06, "loss": 0.9174, "step": 6198 }, { "epoch": 0.12, "learning_rate": 4.9015457762022025e-06, "loss": 0.9299, "step": 6199 }, { "epoch": 0.12, "learning_rate": 4.901503322560446e-06, "loss": 1.1078, "step": 6200 }, { "epoch": 0.12, "learning_rate": 4.901460859951549e-06, "loss": 1.1857, "step": 6201 }, { "epoch": 0.12, "learning_rate": 4.901418388375671e-06, "loss": 0.7971, "step": 6202 }, { "epoch": 0.12, "learning_rate": 4.9013759078329715e-06, "loss": 0.9535, "step": 6203 }, { "epoch": 0.12, "learning_rate": 4.901333418323608e-06, "loss": 1.0434, "step": 6204 }, { "epoch": 0.12, "learning_rate": 4.901290919847738e-06, "loss": 0.9991, "step": 6205 }, { "epoch": 0.12, "learning_rate": 4.901248412405522e-06, "loss": 1.1623, "step": 6206 }, { "epoch": 0.12, "learning_rate": 4.9012058959971175e-06, "loss": 1.0395, "step": 6207 }, { "epoch": 0.12, "learning_rate": 4.901163370622685e-06, "loss": 0.7812, "step": 6208 }, { "epoch": 0.12, "learning_rate": 4.901120836282381e-06, "loss": 0.8662, "step": 6209 }, { "epoch": 0.12, "learning_rate": 4.9010782929763656e-06, "loss": 1.025, "step": 6210 }, { "epoch": 0.12, "learning_rate": 4.901035740704797e-06, "loss": 0.8737, "step": 6211 }, { "epoch": 0.12, "learning_rate": 4.900993179467836e-06, "loss": 1.2091, "step": 6212 }, { "epoch": 0.12, "learning_rate": 4.900950609265639e-06, "loss": 1.1353, "step": 6213 }, { "epoch": 0.12, "learning_rate": 4.9009080300983664e-06, "loss": 0.8811, "step": 6214 }, { "epoch": 0.12, "learning_rate": 4.900865441966177e-06, "loss": 0.9004, "step": 6215 }, { "epoch": 0.12, "learning_rate": 4.900822844869229e-06, "loss": 0.8281, "step": 6216 }, { "epoch": 0.12, "learning_rate": 4.900780238807683e-06, "loss": 0.9893, "step": 6217 }, { "epoch": 0.12, "learning_rate": 4.900737623781696e-06, "loss": 1.0979, "step": 6218 }, { "epoch": 0.12, "learning_rate": 4.900694999791429e-06, "loss": 1.0435, "step": 6219 }, { "epoch": 0.12, "learning_rate": 4.90065236683704e-06, "loss": 0.7142, "step": 6220 }, { "epoch": 0.12, "learning_rate": 4.90060972491869e-06, "loss": 0.7802, "step": 6221 }, { "epoch": 0.12, "learning_rate": 4.900567074036536e-06, "loss": 0.8657, "step": 6222 }, { "epoch": 0.12, "learning_rate": 4.900524414190738e-06, "loss": 0.8656, "step": 6223 }, { "epoch": 0.12, "learning_rate": 4.9004817453814554e-06, "loss": 1.0613, "step": 6224 }, { "epoch": 0.12, "learning_rate": 4.900439067608847e-06, "loss": 1.0226, "step": 6225 }, { "epoch": 0.12, "learning_rate": 4.900396380873074e-06, "loss": 1.0831, "step": 6226 }, { "epoch": 0.12, "learning_rate": 4.900353685174294e-06, "loss": 0.8929, "step": 6227 }, { "epoch": 0.12, "learning_rate": 4.900310980512667e-06, "loss": 0.9396, "step": 6228 }, { "epoch": 0.12, "learning_rate": 4.900268266888353e-06, "loss": 0.9268, "step": 6229 }, { "epoch": 0.12, "learning_rate": 4.90022554430151e-06, "loss": 0.9702, "step": 6230 }, { "epoch": 0.12, "learning_rate": 4.900182812752298e-06, "loss": 1.1062, "step": 6231 }, { "epoch": 0.12, "learning_rate": 4.900140072240878e-06, "loss": 0.9426, "step": 6232 }, { "epoch": 0.12, "learning_rate": 4.900097322767408e-06, "loss": 0.9462, "step": 6233 }, { "epoch": 0.12, "learning_rate": 4.900054564332049e-06, "loss": 1.0128, "step": 6234 }, { "epoch": 0.12, "learning_rate": 4.900011796934959e-06, "loss": 0.7929, "step": 6235 }, { "epoch": 0.12, "learning_rate": 4.899969020576299e-06, "loss": 1.093, "step": 6236 }, { "epoch": 0.12, "learning_rate": 4.899926235256227e-06, "loss": 1.2272, "step": 6237 }, { "epoch": 0.12, "learning_rate": 4.899883440974905e-06, "loss": 1.1097, "step": 6238 }, { "epoch": 0.12, "learning_rate": 4.899840637732492e-06, "loss": 0.8657, "step": 6239 }, { "epoch": 0.12, "learning_rate": 4.8997978255291475e-06, "loss": 1.0016, "step": 6240 }, { "epoch": 0.12, "learning_rate": 4.899755004365031e-06, "loss": 1.0071, "step": 6241 }, { "epoch": 0.12, "learning_rate": 4.899712174240304e-06, "loss": 1.0034, "step": 6242 }, { "epoch": 0.12, "learning_rate": 4.899669335155124e-06, "loss": 1.006, "step": 6243 }, { "epoch": 0.12, "learning_rate": 4.899626487109653e-06, "loss": 1.1736, "step": 6244 }, { "epoch": 0.12, "learning_rate": 4.899583630104051e-06, "loss": 0.9936, "step": 6245 }, { "epoch": 0.12, "learning_rate": 4.899540764138476e-06, "loss": 0.9203, "step": 6246 }, { "epoch": 0.12, "learning_rate": 4.89949788921309e-06, "loss": 1.1188, "step": 6247 }, { "epoch": 0.12, "learning_rate": 4.899455005328052e-06, "loss": 1.004, "step": 6248 }, { "epoch": 0.12, "learning_rate": 4.899412112483524e-06, "loss": 1.2518, "step": 6249 }, { "epoch": 0.12, "learning_rate": 4.8993692106796634e-06, "loss": 1.0386, "step": 6250 }, { "epoch": 0.12, "learning_rate": 4.8993262999166316e-06, "loss": 0.9883, "step": 6251 }, { "epoch": 0.12, "learning_rate": 4.899283380194589e-06, "loss": 1.1118, "step": 6252 }, { "epoch": 0.12, "learning_rate": 4.899240451513696e-06, "loss": 0.8078, "step": 6253 }, { "epoch": 0.12, "learning_rate": 4.899197513874114e-06, "loss": 0.8674, "step": 6254 }, { "epoch": 0.12, "learning_rate": 4.899154567276e-06, "loss": 0.8428, "step": 6255 }, { "epoch": 0.12, "learning_rate": 4.899111611719517e-06, "loss": 1.1508, "step": 6256 }, { "epoch": 0.12, "learning_rate": 4.899068647204826e-06, "loss": 0.8455, "step": 6257 }, { "epoch": 0.12, "learning_rate": 4.899025673732085e-06, "loss": 0.9497, "step": 6258 }, { "epoch": 0.12, "learning_rate": 4.898982691301456e-06, "loss": 1.0266, "step": 6259 }, { "epoch": 0.12, "learning_rate": 4.898939699913099e-06, "loss": 0.8409, "step": 6260 }, { "epoch": 0.12, "learning_rate": 4.898896699567175e-06, "loss": 0.8585, "step": 6261 }, { "epoch": 0.12, "learning_rate": 4.898853690263844e-06, "loss": 1.2357, "step": 6262 }, { "epoch": 0.12, "learning_rate": 4.898810672003267e-06, "loss": 0.955, "step": 6263 }, { "epoch": 0.12, "learning_rate": 4.898767644785605e-06, "loss": 0.971, "step": 6264 }, { "epoch": 0.12, "learning_rate": 4.898724608611017e-06, "loss": 0.9695, "step": 6265 }, { "epoch": 0.12, "learning_rate": 4.898681563479667e-06, "loss": 0.811, "step": 6266 }, { "epoch": 0.12, "learning_rate": 4.898638509391712e-06, "loss": 0.95, "step": 6267 }, { "epoch": 0.12, "learning_rate": 4.898595446347314e-06, "loss": 0.8926, "step": 6268 }, { "epoch": 0.12, "learning_rate": 4.898552374346635e-06, "loss": 1.0629, "step": 6269 }, { "epoch": 0.12, "learning_rate": 4.8985092933898346e-06, "loss": 0.821, "step": 6270 }, { "epoch": 0.12, "learning_rate": 4.898466203477074e-06, "loss": 0.8679, "step": 6271 }, { "epoch": 0.12, "learning_rate": 4.898423104608514e-06, "loss": 1.0909, "step": 6272 }, { "epoch": 0.12, "learning_rate": 4.898379996784316e-06, "loss": 1.0581, "step": 6273 }, { "epoch": 0.12, "learning_rate": 4.89833688000464e-06, "loss": 0.946, "step": 6274 }, { "epoch": 0.12, "learning_rate": 4.898293754269649e-06, "loss": 1.2068, "step": 6275 }, { "epoch": 0.12, "learning_rate": 4.898250619579502e-06, "loss": 0.8813, "step": 6276 }, { "epoch": 0.12, "learning_rate": 4.8982074759343604e-06, "loss": 0.7313, "step": 6277 }, { "epoch": 0.12, "learning_rate": 4.898164323334386e-06, "loss": 1.0333, "step": 6278 }, { "epoch": 0.12, "learning_rate": 4.8981211617797385e-06, "loss": 0.9519, "step": 6279 }, { "epoch": 0.12, "learning_rate": 4.898077991270581e-06, "loss": 1.0302, "step": 6280 }, { "epoch": 0.12, "learning_rate": 4.898034811807074e-06, "loss": 1.1567, "step": 6281 }, { "epoch": 0.12, "learning_rate": 4.897991623389378e-06, "loss": 1.1677, "step": 6282 }, { "epoch": 0.12, "learning_rate": 4.897948426017655e-06, "loss": 0.9623, "step": 6283 }, { "epoch": 0.12, "learning_rate": 4.897905219692066e-06, "loss": 1.0078, "step": 6284 }, { "epoch": 0.12, "learning_rate": 4.897862004412773e-06, "loss": 0.8992, "step": 6285 }, { "epoch": 0.12, "learning_rate": 4.897818780179936e-06, "loss": 0.9606, "step": 6286 }, { "epoch": 0.12, "learning_rate": 4.897775546993718e-06, "loss": 1.0179, "step": 6287 }, { "epoch": 0.12, "learning_rate": 4.897732304854279e-06, "loss": 1.0, "step": 6288 }, { "epoch": 0.12, "learning_rate": 4.897689053761781e-06, "loss": 0.9141, "step": 6289 }, { "epoch": 0.12, "learning_rate": 4.897645793716386e-06, "loss": 0.923, "step": 6290 }, { "epoch": 0.12, "learning_rate": 4.897602524718255e-06, "loss": 1.1304, "step": 6291 }, { "epoch": 0.12, "learning_rate": 4.89755924676755e-06, "loss": 1.0861, "step": 6292 }, { "epoch": 0.12, "learning_rate": 4.897515959864432e-06, "loss": 0.9473, "step": 6293 }, { "epoch": 0.12, "learning_rate": 4.8974726640090625e-06, "loss": 1.2574, "step": 6294 }, { "epoch": 0.12, "learning_rate": 4.897429359201604e-06, "loss": 0.9684, "step": 6295 }, { "epoch": 0.12, "learning_rate": 4.897386045442218e-06, "loss": 0.9237, "step": 6296 }, { "epoch": 0.12, "learning_rate": 4.897342722731065e-06, "loss": 1.0036, "step": 6297 }, { "epoch": 0.12, "learning_rate": 4.897299391068309e-06, "loss": 0.9437, "step": 6298 }, { "epoch": 0.12, "learning_rate": 4.89725605045411e-06, "loss": 0.9826, "step": 6299 }, { "epoch": 0.12, "learning_rate": 4.897212700888631e-06, "loss": 1.0319, "step": 6300 }, { "epoch": 0.12, "learning_rate": 4.897169342372032e-06, "loss": 0.9214, "step": 6301 }, { "epoch": 0.12, "learning_rate": 4.8971259749044775e-06, "loss": 1.0208, "step": 6302 }, { "epoch": 0.12, "learning_rate": 4.897082598486127e-06, "loss": 1.0099, "step": 6303 }, { "epoch": 0.12, "learning_rate": 4.897039213117144e-06, "loss": 0.879, "step": 6304 }, { "epoch": 0.12, "learning_rate": 4.8969958187976905e-06, "loss": 0.8528, "step": 6305 }, { "epoch": 0.12, "learning_rate": 4.896952415527928e-06, "loss": 1.0634, "step": 6306 }, { "epoch": 0.12, "learning_rate": 4.896909003308019e-06, "loss": 0.7674, "step": 6307 }, { "epoch": 0.12, "learning_rate": 4.8968655821381235e-06, "loss": 0.9787, "step": 6308 }, { "epoch": 0.12, "learning_rate": 4.896822152018408e-06, "loss": 0.9574, "step": 6309 }, { "epoch": 0.12, "learning_rate": 4.89677871294903e-06, "loss": 0.803, "step": 6310 }, { "epoch": 0.12, "learning_rate": 4.896735264930155e-06, "loss": 0.9712, "step": 6311 }, { "epoch": 0.12, "learning_rate": 4.896691807961943e-06, "loss": 1.2487, "step": 6312 }, { "epoch": 0.12, "learning_rate": 4.896648342044557e-06, "loss": 1.1682, "step": 6313 }, { "epoch": 0.12, "learning_rate": 4.896604867178161e-06, "loss": 0.9584, "step": 6314 }, { "epoch": 0.12, "learning_rate": 4.8965613833629155e-06, "loss": 0.9819, "step": 6315 }, { "epoch": 0.12, "learning_rate": 4.896517890598983e-06, "loss": 1.2058, "step": 6316 }, { "epoch": 0.12, "learning_rate": 4.896474388886526e-06, "loss": 0.9211, "step": 6317 }, { "epoch": 0.12, "learning_rate": 4.896430878225708e-06, "loss": 1.0995, "step": 6318 }, { "epoch": 0.12, "learning_rate": 4.89638735861669e-06, "loss": 1.1842, "step": 6319 }, { "epoch": 0.12, "learning_rate": 4.8963438300596345e-06, "loss": 0.9, "step": 6320 }, { "epoch": 0.12, "learning_rate": 4.896300292554706e-06, "loss": 1.0609, "step": 6321 }, { "epoch": 0.12, "learning_rate": 4.896256746102064e-06, "loss": 0.8939, "step": 6322 }, { "epoch": 0.12, "learning_rate": 4.896213190701874e-06, "loss": 0.9697, "step": 6323 }, { "epoch": 0.12, "learning_rate": 4.8961696263542965e-06, "loss": 0.891, "step": 6324 }, { "epoch": 0.12, "learning_rate": 4.8961260530594956e-06, "loss": 1.0717, "step": 6325 }, { "epoch": 0.12, "learning_rate": 4.896082470817634e-06, "loss": 1.0361, "step": 6326 }, { "epoch": 0.12, "learning_rate": 4.896038879628872e-06, "loss": 0.9236, "step": 6327 }, { "epoch": 0.12, "learning_rate": 4.895995279493376e-06, "loss": 1.1405, "step": 6328 }, { "epoch": 0.12, "learning_rate": 4.895951670411308e-06, "loss": 0.9573, "step": 6329 }, { "epoch": 0.12, "learning_rate": 4.8959080523828275e-06, "loss": 1.0971, "step": 6330 }, { "epoch": 0.12, "learning_rate": 4.895864425408101e-06, "loss": 0.9543, "step": 6331 }, { "epoch": 0.12, "learning_rate": 4.895820789487291e-06, "loss": 0.7398, "step": 6332 }, { "epoch": 0.12, "learning_rate": 4.895777144620558e-06, "loss": 0.7811, "step": 6333 }, { "epoch": 0.12, "learning_rate": 4.8957334908080674e-06, "loss": 0.9512, "step": 6334 }, { "epoch": 0.12, "learning_rate": 4.895689828049981e-06, "loss": 0.8257, "step": 6335 }, { "epoch": 0.12, "learning_rate": 4.895646156346463e-06, "loss": 0.9171, "step": 6336 }, { "epoch": 0.12, "learning_rate": 4.895602475697676e-06, "loss": 1.2698, "step": 6337 }, { "epoch": 0.12, "learning_rate": 4.895558786103781e-06, "loss": 1.0852, "step": 6338 }, { "epoch": 0.12, "learning_rate": 4.895515087564945e-06, "loss": 0.9882, "step": 6339 }, { "epoch": 0.12, "learning_rate": 4.895471380081328e-06, "loss": 0.996, "step": 6340 }, { "epoch": 0.12, "learning_rate": 4.8954276636530936e-06, "loss": 0.8663, "step": 6341 }, { "epoch": 0.12, "learning_rate": 4.8953839382804074e-06, "loss": 0.9656, "step": 6342 }, { "epoch": 0.12, "learning_rate": 4.89534020396343e-06, "loss": 0.9596, "step": 6343 }, { "epoch": 0.12, "learning_rate": 4.8952964607023265e-06, "loss": 1.1038, "step": 6344 }, { "epoch": 0.12, "learning_rate": 4.895252708497259e-06, "loss": 0.7975, "step": 6345 }, { "epoch": 0.12, "learning_rate": 4.895208947348391e-06, "loss": 0.9924, "step": 6346 }, { "epoch": 0.12, "learning_rate": 4.8951651772558865e-06, "loss": 0.9086, "step": 6347 }, { "epoch": 0.12, "learning_rate": 4.895121398219908e-06, "loss": 0.8932, "step": 6348 }, { "epoch": 0.12, "learning_rate": 4.895077610240621e-06, "loss": 0.7887, "step": 6349 }, { "epoch": 0.12, "learning_rate": 4.8950338133181865e-06, "loss": 1.0362, "step": 6350 }, { "epoch": 0.12, "learning_rate": 4.89499000745277e-06, "loss": 0.8565, "step": 6351 }, { "epoch": 0.12, "learning_rate": 4.894946192644534e-06, "loss": 0.8455, "step": 6352 }, { "epoch": 0.12, "learning_rate": 4.894902368893642e-06, "loss": 1.0395, "step": 6353 }, { "epoch": 0.12, "learning_rate": 4.894858536200258e-06, "loss": 1.0068, "step": 6354 }, { "epoch": 0.12, "learning_rate": 4.894814694564546e-06, "loss": 1.1302, "step": 6355 }, { "epoch": 0.12, "learning_rate": 4.894770843986669e-06, "loss": 1.2915, "step": 6356 }, { "epoch": 0.12, "learning_rate": 4.894726984466791e-06, "loss": 1.0746, "step": 6357 }, { "epoch": 0.12, "learning_rate": 4.894683116005076e-06, "loss": 0.9236, "step": 6358 }, { "epoch": 0.12, "learning_rate": 4.894639238601688e-06, "loss": 0.8449, "step": 6359 }, { "epoch": 0.12, "learning_rate": 4.8945953522567905e-06, "loss": 0.8044, "step": 6360 }, { "epoch": 0.12, "learning_rate": 4.894551456970548e-06, "loss": 0.9156, "step": 6361 }, { "epoch": 0.12, "learning_rate": 4.894507552743122e-06, "loss": 0.9311, "step": 6362 }, { "epoch": 0.12, "learning_rate": 4.894463639574679e-06, "loss": 1.0759, "step": 6363 }, { "epoch": 0.12, "learning_rate": 4.894419717465383e-06, "loss": 0.641, "step": 6364 }, { "epoch": 0.12, "learning_rate": 4.894375786415396e-06, "loss": 1.1729, "step": 6365 }, { "epoch": 0.12, "learning_rate": 4.894331846424885e-06, "loss": 0.7687, "step": 6366 }, { "epoch": 0.12, "learning_rate": 4.89428789749401e-06, "loss": 0.9647, "step": 6367 }, { "epoch": 0.12, "learning_rate": 4.894243939622939e-06, "loss": 1.1227, "step": 6368 }, { "epoch": 0.12, "learning_rate": 4.894199972811834e-06, "loss": 1.2468, "step": 6369 }, { "epoch": 0.12, "learning_rate": 4.89415599706086e-06, "loss": 0.9023, "step": 6370 }, { "epoch": 0.12, "learning_rate": 4.89411201237018e-06, "loss": 0.996, "step": 6371 }, { "epoch": 0.12, "learning_rate": 4.8940680187399605e-06, "loss": 0.8434, "step": 6372 }, { "epoch": 0.12, "learning_rate": 4.894024016170364e-06, "loss": 0.9308, "step": 6373 }, { "epoch": 0.12, "learning_rate": 4.893980004661555e-06, "loss": 1.0933, "step": 6374 }, { "epoch": 0.12, "learning_rate": 4.893935984213697e-06, "loss": 1.0869, "step": 6375 }, { "epoch": 0.12, "learning_rate": 4.893891954826957e-06, "loss": 0.9782, "step": 6376 }, { "epoch": 0.12, "learning_rate": 4.893847916501497e-06, "loss": 1.0027, "step": 6377 }, { "epoch": 0.12, "learning_rate": 4.893803869237483e-06, "loss": 0.9084, "step": 6378 }, { "epoch": 0.12, "learning_rate": 4.893759813035078e-06, "loss": 0.9199, "step": 6379 }, { "epoch": 0.12, "learning_rate": 4.893715747894447e-06, "loss": 0.881, "step": 6380 }, { "epoch": 0.12, "learning_rate": 4.893671673815756e-06, "loss": 1.4336, "step": 6381 }, { "epoch": 0.12, "learning_rate": 4.8936275907991675e-06, "loss": 0.9864, "step": 6382 }, { "epoch": 0.12, "learning_rate": 4.893583498844847e-06, "loss": 0.9012, "step": 6383 }, { "epoch": 0.12, "learning_rate": 4.89353939795296e-06, "loss": 0.7964, "step": 6384 }, { "epoch": 0.12, "learning_rate": 4.893495288123669e-06, "loss": 1.0115, "step": 6385 }, { "epoch": 0.12, "learning_rate": 4.8934511693571405e-06, "loss": 0.7955, "step": 6386 }, { "epoch": 0.12, "learning_rate": 4.8934070416535385e-06, "loss": 0.9474, "step": 6387 }, { "epoch": 0.12, "learning_rate": 4.893362905013028e-06, "loss": 1.1414, "step": 6388 }, { "epoch": 0.12, "learning_rate": 4.893318759435774e-06, "loss": 0.9204, "step": 6389 }, { "epoch": 0.12, "learning_rate": 4.893274604921941e-06, "loss": 0.8619, "step": 6390 }, { "epoch": 0.12, "learning_rate": 4.893230441471695e-06, "loss": 0.981, "step": 6391 }, { "epoch": 0.12, "learning_rate": 4.893186269085199e-06, "loss": 0.9465, "step": 6392 }, { "epoch": 0.12, "learning_rate": 4.893142087762619e-06, "loss": 0.9581, "step": 6393 }, { "epoch": 0.12, "learning_rate": 4.89309789750412e-06, "loss": 1.1663, "step": 6394 }, { "epoch": 0.12, "learning_rate": 4.893053698309867e-06, "loss": 0.712, "step": 6395 }, { "epoch": 0.12, "learning_rate": 4.893009490180024e-06, "loss": 0.9543, "step": 6396 }, { "epoch": 0.12, "learning_rate": 4.892965273114757e-06, "loss": 1.0358, "step": 6397 }, { "epoch": 0.12, "learning_rate": 4.892921047114232e-06, "loss": 1.0424, "step": 6398 }, { "epoch": 0.12, "learning_rate": 4.892876812178612e-06, "loss": 1.0821, "step": 6399 }, { "epoch": 0.12, "learning_rate": 4.892832568308064e-06, "loss": 1.0845, "step": 6400 }, { "epoch": 0.12, "learning_rate": 4.892788315502752e-06, "loss": 0.9794, "step": 6401 }, { "epoch": 0.12, "learning_rate": 4.892744053762843e-06, "loss": 1.1111, "step": 6402 }, { "epoch": 0.12, "learning_rate": 4.8926997830885e-06, "loss": 0.9071, "step": 6403 }, { "epoch": 0.12, "learning_rate": 4.89265550347989e-06, "loss": 0.9243, "step": 6404 }, { "epoch": 0.12, "learning_rate": 4.892611214937177e-06, "loss": 1.1006, "step": 6405 }, { "epoch": 0.12, "learning_rate": 4.892566917460528e-06, "loss": 1.1984, "step": 6406 }, { "epoch": 0.12, "learning_rate": 4.892522611050106e-06, "loss": 1.1718, "step": 6407 }, { "epoch": 0.12, "learning_rate": 4.89247829570608e-06, "loss": 0.8344, "step": 6408 }, { "epoch": 0.12, "learning_rate": 4.892433971428613e-06, "loss": 0.9796, "step": 6409 }, { "epoch": 0.12, "learning_rate": 4.892389638217869e-06, "loss": 1.0153, "step": 6410 }, { "epoch": 0.12, "learning_rate": 4.892345296074017e-06, "loss": 0.928, "step": 6411 }, { "epoch": 0.12, "learning_rate": 4.892300944997221e-06, "loss": 1.0994, "step": 6412 }, { "epoch": 0.12, "learning_rate": 4.892256584987646e-06, "loss": 0.9071, "step": 6413 }, { "epoch": 0.12, "learning_rate": 4.892212216045459e-06, "loss": 1.0662, "step": 6414 }, { "epoch": 0.12, "learning_rate": 4.8921678381708245e-06, "loss": 0.8535, "step": 6415 }, { "epoch": 0.12, "learning_rate": 4.892123451363908e-06, "loss": 1.1122, "step": 6416 }, { "epoch": 0.12, "learning_rate": 4.8920790556248775e-06, "loss": 0.9501, "step": 6417 }, { "epoch": 0.12, "learning_rate": 4.8920346509538955e-06, "loss": 1.149, "step": 6418 }, { "epoch": 0.12, "learning_rate": 4.891990237351131e-06, "loss": 1.0543, "step": 6419 }, { "epoch": 0.12, "learning_rate": 4.8919458148167465e-06, "loss": 1.1511, "step": 6420 }, { "epoch": 0.12, "learning_rate": 4.891901383350911e-06, "loss": 1.0044, "step": 6421 }, { "epoch": 0.12, "learning_rate": 4.891856942953789e-06, "loss": 0.7673, "step": 6422 }, { "epoch": 0.12, "learning_rate": 4.8918124936255455e-06, "loss": 0.9687, "step": 6423 }, { "epoch": 0.12, "learning_rate": 4.891768035366349e-06, "loss": 1.1149, "step": 6424 }, { "epoch": 0.12, "learning_rate": 4.8917235681763625e-06, "loss": 1.2315, "step": 6425 }, { "epoch": 0.12, "learning_rate": 4.891679092055754e-06, "loss": 0.9256, "step": 6426 }, { "epoch": 0.12, "learning_rate": 4.89163460700469e-06, "loss": 0.9312, "step": 6427 }, { "epoch": 0.12, "learning_rate": 4.891590113023335e-06, "loss": 0.892, "step": 6428 }, { "epoch": 0.12, "learning_rate": 4.8915456101118555e-06, "loss": 0.7871, "step": 6429 }, { "epoch": 0.12, "learning_rate": 4.891501098270418e-06, "loss": 0.8974, "step": 6430 }, { "epoch": 0.12, "learning_rate": 4.8914565774991896e-06, "loss": 1.152, "step": 6431 }, { "epoch": 0.12, "learning_rate": 4.891412047798335e-06, "loss": 1.1575, "step": 6432 }, { "epoch": 0.12, "learning_rate": 4.891367509168021e-06, "loss": 0.9602, "step": 6433 }, { "epoch": 0.12, "learning_rate": 4.891322961608414e-06, "loss": 0.8771, "step": 6434 }, { "epoch": 0.12, "learning_rate": 4.891278405119682e-06, "loss": 0.7537, "step": 6435 }, { "epoch": 0.12, "learning_rate": 4.891233839701987e-06, "loss": 1.0286, "step": 6436 }, { "epoch": 0.12, "learning_rate": 4.891189265355501e-06, "loss": 0.9834, "step": 6437 }, { "epoch": 0.12, "learning_rate": 4.891144682080386e-06, "loss": 0.9363, "step": 6438 }, { "epoch": 0.12, "learning_rate": 4.89110008987681e-06, "loss": 1.0983, "step": 6439 }, { "epoch": 0.12, "learning_rate": 4.89105548874494e-06, "loss": 1.0023, "step": 6440 }, { "epoch": 0.12, "learning_rate": 4.891010878684942e-06, "loss": 1.1294, "step": 6441 }, { "epoch": 0.12, "learning_rate": 4.890966259696982e-06, "loss": 0.8749, "step": 6442 }, { "epoch": 0.12, "learning_rate": 4.890921631781228e-06, "loss": 1.032, "step": 6443 }, { "epoch": 0.12, "learning_rate": 4.890876994937846e-06, "loss": 1.0759, "step": 6444 }, { "epoch": 0.12, "learning_rate": 4.890832349167003e-06, "loss": 0.8638, "step": 6445 }, { "epoch": 0.12, "learning_rate": 4.890787694468864e-06, "loss": 1.0113, "step": 6446 }, { "epoch": 0.12, "learning_rate": 4.890743030843598e-06, "loss": 0.9336, "step": 6447 }, { "epoch": 0.12, "learning_rate": 4.890698358291371e-06, "loss": 0.7623, "step": 6448 }, { "epoch": 0.12, "learning_rate": 4.890653676812349e-06, "loss": 1.0316, "step": 6449 }, { "epoch": 0.12, "learning_rate": 4.8906089864067e-06, "loss": 1.0911, "step": 6450 }, { "epoch": 0.12, "learning_rate": 4.89056428707459e-06, "loss": 0.9252, "step": 6451 }, { "epoch": 0.12, "learning_rate": 4.890519578816186e-06, "loss": 0.9792, "step": 6452 }, { "epoch": 0.12, "learning_rate": 4.890474861631656e-06, "loss": 1.2813, "step": 6453 }, { "epoch": 0.12, "learning_rate": 4.890430135521166e-06, "loss": 0.9459, "step": 6454 }, { "epoch": 0.12, "learning_rate": 4.8903854004848825e-06, "loss": 0.9489, "step": 6455 }, { "epoch": 0.12, "learning_rate": 4.890340656522974e-06, "loss": 1.0942, "step": 6456 }, { "epoch": 0.12, "learning_rate": 4.890295903635606e-06, "loss": 1.2144, "step": 6457 }, { "epoch": 0.12, "learning_rate": 4.890251141822947e-06, "loss": 0.8526, "step": 6458 }, { "epoch": 0.12, "learning_rate": 4.890206371085163e-06, "loss": 0.8841, "step": 6459 }, { "epoch": 0.12, "learning_rate": 4.8901615914224224e-06, "loss": 0.7565, "step": 6460 }, { "epoch": 0.12, "learning_rate": 4.890116802834891e-06, "loss": 0.8994, "step": 6461 }, { "epoch": 0.12, "learning_rate": 4.8900720053227365e-06, "loss": 1.2017, "step": 6462 }, { "epoch": 0.12, "learning_rate": 4.890027198886127e-06, "loss": 1.1563, "step": 6463 }, { "epoch": 0.12, "learning_rate": 4.88998238352523e-06, "loss": 0.8889, "step": 6464 }, { "epoch": 0.12, "learning_rate": 4.889937559240211e-06, "loss": 0.9899, "step": 6465 }, { "epoch": 0.12, "learning_rate": 4.889892726031239e-06, "loss": 0.9568, "step": 6466 }, { "epoch": 0.12, "learning_rate": 4.8898478838984795e-06, "loss": 0.9473, "step": 6467 }, { "epoch": 0.12, "learning_rate": 4.889803032842103e-06, "loss": 1.1891, "step": 6468 }, { "epoch": 0.12, "learning_rate": 4.889758172862274e-06, "loss": 1.0681, "step": 6469 }, { "epoch": 0.12, "learning_rate": 4.889713303959162e-06, "loss": 0.7698, "step": 6470 }, { "epoch": 0.12, "learning_rate": 4.889668426132934e-06, "loss": 0.8103, "step": 6471 }, { "epoch": 0.12, "learning_rate": 4.8896235393837564e-06, "loss": 1.0975, "step": 6472 }, { "epoch": 0.12, "learning_rate": 4.8895786437117985e-06, "loss": 1.0049, "step": 6473 }, { "epoch": 0.12, "learning_rate": 4.889533739117227e-06, "loss": 0.9362, "step": 6474 }, { "epoch": 0.12, "learning_rate": 4.88948882560021e-06, "loss": 1.0545, "step": 6475 }, { "epoch": 0.12, "learning_rate": 4.889443903160914e-06, "loss": 0.9108, "step": 6476 }, { "epoch": 0.12, "learning_rate": 4.889398971799509e-06, "loss": 0.8675, "step": 6477 }, { "epoch": 0.12, "learning_rate": 4.8893540315161615e-06, "loss": 0.9868, "step": 6478 }, { "epoch": 0.12, "learning_rate": 4.889309082311039e-06, "loss": 1.0137, "step": 6479 }, { "epoch": 0.12, "learning_rate": 4.889264124184308e-06, "loss": 0.9871, "step": 6480 }, { "epoch": 0.12, "learning_rate": 4.88921915713614e-06, "loss": 1.26, "step": 6481 }, { "epoch": 0.12, "learning_rate": 4.8891741811667e-06, "loss": 1.0562, "step": 6482 }, { "epoch": 0.12, "learning_rate": 4.889129196276158e-06, "loss": 0.8864, "step": 6483 }, { "epoch": 0.12, "learning_rate": 4.88908420246468e-06, "loss": 0.903, "step": 6484 }, { "epoch": 0.12, "learning_rate": 4.889039199732435e-06, "loss": 1.0542, "step": 6485 }, { "epoch": 0.12, "learning_rate": 4.888994188079591e-06, "loss": 0.9811, "step": 6486 }, { "epoch": 0.12, "learning_rate": 4.888949167506316e-06, "loss": 1.0343, "step": 6487 }, { "epoch": 0.12, "learning_rate": 4.888904138012777e-06, "loss": 1.0453, "step": 6488 }, { "epoch": 0.12, "learning_rate": 4.888859099599144e-06, "loss": 1.1268, "step": 6489 }, { "epoch": 0.12, "learning_rate": 4.888814052265585e-06, "loss": 1.0351, "step": 6490 }, { "epoch": 0.12, "learning_rate": 4.888768996012266e-06, "loss": 1.0465, "step": 6491 }, { "epoch": 0.12, "learning_rate": 4.8887239308393585e-06, "loss": 0.9557, "step": 6492 }, { "epoch": 0.12, "learning_rate": 4.888678856747028e-06, "loss": 1.2227, "step": 6493 }, { "epoch": 0.12, "learning_rate": 4.8886337737354445e-06, "loss": 0.9699, "step": 6494 }, { "epoch": 0.12, "learning_rate": 4.888588681804775e-06, "loss": 1.0886, "step": 6495 }, { "epoch": 0.12, "learning_rate": 4.88854358095519e-06, "loss": 0.8897, "step": 6496 }, { "epoch": 0.12, "learning_rate": 4.8884984711868546e-06, "loss": 0.9681, "step": 6497 }, { "epoch": 0.12, "learning_rate": 4.88845335249994e-06, "loss": 0.8743, "step": 6498 }, { "epoch": 0.12, "learning_rate": 4.888408224894614e-06, "loss": 1.1598, "step": 6499 }, { "epoch": 0.12, "learning_rate": 4.888363088371046e-06, "loss": 1.0575, "step": 6500 }, { "epoch": 0.12, "learning_rate": 4.888317942929401e-06, "loss": 1.009, "step": 6501 }, { "epoch": 0.12, "learning_rate": 4.888272788569852e-06, "loss": 1.0588, "step": 6502 }, { "epoch": 0.12, "learning_rate": 4.888227625292564e-06, "loss": 0.9273, "step": 6503 }, { "epoch": 0.12, "learning_rate": 4.8881824530977085e-06, "loss": 0.8921, "step": 6504 }, { "epoch": 0.12, "learning_rate": 4.8881372719854526e-06, "loss": 1.0225, "step": 6505 }, { "epoch": 0.12, "learning_rate": 4.888092081955966e-06, "loss": 1.0278, "step": 6506 }, { "epoch": 0.12, "learning_rate": 4.888046883009416e-06, "loss": 1.0773, "step": 6507 }, { "epoch": 0.12, "learning_rate": 4.8880016751459724e-06, "loss": 0.877, "step": 6508 }, { "epoch": 0.12, "learning_rate": 4.887956458365804e-06, "loss": 0.8475, "step": 6509 }, { "epoch": 0.12, "learning_rate": 4.8879112326690784e-06, "loss": 1.1196, "step": 6510 }, { "epoch": 0.12, "learning_rate": 4.887865998055966e-06, "loss": 0.8867, "step": 6511 }, { "epoch": 0.12, "learning_rate": 4.887820754526636e-06, "loss": 1.0098, "step": 6512 }, { "epoch": 0.12, "learning_rate": 4.887775502081255e-06, "loss": 0.9457, "step": 6513 }, { "epoch": 0.12, "learning_rate": 4.887730240719995e-06, "loss": 1.0827, "step": 6514 }, { "epoch": 0.12, "learning_rate": 4.887684970443023e-06, "loss": 1.0514, "step": 6515 }, { "epoch": 0.12, "learning_rate": 4.887639691250509e-06, "loss": 1.0361, "step": 6516 }, { "epoch": 0.12, "learning_rate": 4.887594403142621e-06, "loss": 0.8538, "step": 6517 }, { "epoch": 0.12, "learning_rate": 4.887549106119528e-06, "loss": 1.0652, "step": 6518 }, { "epoch": 0.12, "learning_rate": 4.8875038001814e-06, "loss": 1.0832, "step": 6519 }, { "epoch": 0.12, "learning_rate": 4.887458485328407e-06, "loss": 0.9067, "step": 6520 }, { "epoch": 0.12, "learning_rate": 4.887413161560717e-06, "loss": 0.8937, "step": 6521 }, { "epoch": 0.12, "learning_rate": 4.887367828878498e-06, "loss": 0.9566, "step": 6522 }, { "epoch": 0.12, "learning_rate": 4.887322487281923e-06, "loss": 0.8972, "step": 6523 }, { "epoch": 0.12, "learning_rate": 4.887277136771158e-06, "loss": 1.0464, "step": 6524 }, { "epoch": 0.12, "learning_rate": 4.887231777346373e-06, "loss": 1.0766, "step": 6525 }, { "epoch": 0.12, "learning_rate": 4.887186409007738e-06, "loss": 1.1454, "step": 6526 }, { "epoch": 0.12, "learning_rate": 4.8871410317554226e-06, "loss": 0.9216, "step": 6527 }, { "epoch": 0.12, "learning_rate": 4.8870956455895954e-06, "loss": 0.972, "step": 6528 }, { "epoch": 0.12, "learning_rate": 4.887050250510425e-06, "loss": 0.9973, "step": 6529 }, { "epoch": 0.12, "learning_rate": 4.887004846518084e-06, "loss": 0.9304, "step": 6530 }, { "epoch": 0.12, "learning_rate": 4.88695943361274e-06, "loss": 1.0577, "step": 6531 }, { "epoch": 0.12, "learning_rate": 4.886914011794562e-06, "loss": 1.071, "step": 6532 }, { "epoch": 0.12, "learning_rate": 4.886868581063721e-06, "loss": 0.9496, "step": 6533 }, { "epoch": 0.12, "learning_rate": 4.8868231414203845e-06, "loss": 1.0114, "step": 6534 }, { "epoch": 0.12, "learning_rate": 4.886777692864724e-06, "loss": 0.8778, "step": 6535 }, { "epoch": 0.12, "learning_rate": 4.886732235396909e-06, "loss": 0.9469, "step": 6536 }, { "epoch": 0.12, "learning_rate": 4.88668676901711e-06, "loss": 1.0555, "step": 6537 }, { "epoch": 0.12, "learning_rate": 4.8866412937254944e-06, "loss": 0.9755, "step": 6538 }, { "epoch": 0.12, "learning_rate": 4.886595809522234e-06, "loss": 0.8032, "step": 6539 }, { "epoch": 0.12, "learning_rate": 4.886550316407498e-06, "loss": 1.0474, "step": 6540 }, { "epoch": 0.12, "learning_rate": 4.886504814381457e-06, "loss": 1.1515, "step": 6541 }, { "epoch": 0.12, "learning_rate": 4.886459303444279e-06, "loss": 0.9853, "step": 6542 }, { "epoch": 0.12, "learning_rate": 4.886413783596136e-06, "loss": 1.1973, "step": 6543 }, { "epoch": 0.12, "learning_rate": 4.886368254837196e-06, "loss": 1.097, "step": 6544 }, { "epoch": 0.12, "learning_rate": 4.886322717167631e-06, "loss": 0.9115, "step": 6545 }, { "epoch": 0.12, "learning_rate": 4.88627717058761e-06, "loss": 0.6656, "step": 6546 }, { "epoch": 0.12, "learning_rate": 4.886231615097304e-06, "loss": 0.9536, "step": 6547 }, { "epoch": 0.12, "learning_rate": 4.88618605069688e-06, "loss": 0.7578, "step": 6548 }, { "epoch": 0.12, "learning_rate": 4.886140477386512e-06, "loss": 1.0099, "step": 6549 }, { "epoch": 0.12, "learning_rate": 4.886094895166369e-06, "loss": 1.0057, "step": 6550 }, { "epoch": 0.12, "learning_rate": 4.88604930403662e-06, "loss": 1.1782, "step": 6551 }, { "epoch": 0.12, "learning_rate": 4.886003703997436e-06, "loss": 0.7256, "step": 6552 }, { "epoch": 0.12, "learning_rate": 4.885958095048989e-06, "loss": 0.83, "step": 6553 }, { "epoch": 0.12, "learning_rate": 4.885912477191446e-06, "loss": 0.757, "step": 6554 }, { "epoch": 0.12, "learning_rate": 4.885866850424978e-06, "loss": 0.835, "step": 6555 }, { "epoch": 0.12, "learning_rate": 4.885821214749759e-06, "loss": 1.1762, "step": 6556 }, { "epoch": 0.12, "learning_rate": 4.885775570165955e-06, "loss": 1.0834, "step": 6557 }, { "epoch": 0.12, "learning_rate": 4.885729916673738e-06, "loss": 0.9126, "step": 6558 }, { "epoch": 0.12, "learning_rate": 4.8856842542732794e-06, "loss": 0.9779, "step": 6559 }, { "epoch": 0.12, "learning_rate": 4.885638582964749e-06, "loss": 0.8872, "step": 6560 }, { "epoch": 0.12, "learning_rate": 4.8855929027483165e-06, "loss": 0.8622, "step": 6561 }, { "epoch": 0.12, "learning_rate": 4.885547213624154e-06, "loss": 0.9724, "step": 6562 }, { "epoch": 0.12, "learning_rate": 4.8855015155924315e-06, "loss": 0.9803, "step": 6563 }, { "epoch": 0.12, "learning_rate": 4.885455808653319e-06, "loss": 1.0676, "step": 6564 }, { "epoch": 0.12, "learning_rate": 4.885410092806987e-06, "loss": 0.9123, "step": 6565 }, { "epoch": 0.12, "learning_rate": 4.885364368053608e-06, "loss": 0.8766, "step": 6566 }, { "epoch": 0.12, "learning_rate": 4.885318634393351e-06, "loss": 0.9373, "step": 6567 }, { "epoch": 0.12, "learning_rate": 4.885272891826388e-06, "loss": 1.0134, "step": 6568 }, { "epoch": 0.12, "learning_rate": 4.885227140352888e-06, "loss": 1.043, "step": 6569 }, { "epoch": 0.12, "learning_rate": 4.885181379973024e-06, "loss": 1.1057, "step": 6570 }, { "epoch": 0.12, "learning_rate": 4.885135610686965e-06, "loss": 0.8857, "step": 6571 }, { "epoch": 0.12, "learning_rate": 4.885089832494884e-06, "loss": 0.9445, "step": 6572 }, { "epoch": 0.12, "learning_rate": 4.8850440453969495e-06, "loss": 0.7905, "step": 6573 }, { "epoch": 0.12, "learning_rate": 4.884998249393335e-06, "loss": 1.0939, "step": 6574 }, { "epoch": 0.12, "learning_rate": 4.884952444484209e-06, "loss": 0.9589, "step": 6575 }, { "epoch": 0.12, "learning_rate": 4.884906630669743e-06, "loss": 1.013, "step": 6576 }, { "epoch": 0.12, "learning_rate": 4.88486080795011e-06, "loss": 0.8062, "step": 6577 }, { "epoch": 0.12, "learning_rate": 4.88481497632548e-06, "loss": 1.009, "step": 6578 }, { "epoch": 0.12, "learning_rate": 4.8847691357960235e-06, "loss": 1.041, "step": 6579 }, { "epoch": 0.12, "learning_rate": 4.884723286361912e-06, "loss": 1.1054, "step": 6580 }, { "epoch": 0.12, "learning_rate": 4.884677428023318e-06, "loss": 1.1045, "step": 6581 }, { "epoch": 0.12, "learning_rate": 4.88463156078041e-06, "loss": 1.0413, "step": 6582 }, { "epoch": 0.12, "learning_rate": 4.884585684633362e-06, "loss": 0.8824, "step": 6583 }, { "epoch": 0.12, "learning_rate": 4.884539799582344e-06, "loss": 0.9061, "step": 6584 }, { "epoch": 0.12, "learning_rate": 4.884493905627527e-06, "loss": 0.6635, "step": 6585 }, { "epoch": 0.12, "learning_rate": 4.8844480027690835e-06, "loss": 1.0413, "step": 6586 }, { "epoch": 0.12, "learning_rate": 4.884402091007183e-06, "loss": 1.045, "step": 6587 }, { "epoch": 0.12, "learning_rate": 4.884356170341999e-06, "loss": 1.0533, "step": 6588 }, { "epoch": 0.12, "learning_rate": 4.8843102407737035e-06, "loss": 1.049, "step": 6589 }, { "epoch": 0.12, "learning_rate": 4.884264302302465e-06, "loss": 0.9345, "step": 6590 }, { "epoch": 0.12, "learning_rate": 4.8842183549284574e-06, "loss": 0.8073, "step": 6591 }, { "epoch": 0.12, "learning_rate": 4.884172398651851e-06, "loss": 0.7879, "step": 6592 }, { "epoch": 0.12, "learning_rate": 4.884126433472818e-06, "loss": 1.0034, "step": 6593 }, { "epoch": 0.12, "learning_rate": 4.884080459391531e-06, "loss": 1.0276, "step": 6594 }, { "epoch": 0.12, "learning_rate": 4.884034476408159e-06, "loss": 1.1567, "step": 6595 }, { "epoch": 0.12, "learning_rate": 4.883988484522877e-06, "loss": 0.8615, "step": 6596 }, { "epoch": 0.12, "learning_rate": 4.883942483735854e-06, "loss": 0.8857, "step": 6597 }, { "epoch": 0.12, "learning_rate": 4.883896474047263e-06, "loss": 0.8959, "step": 6598 }, { "epoch": 0.12, "learning_rate": 4.883850455457276e-06, "loss": 1.0733, "step": 6599 }, { "epoch": 0.12, "learning_rate": 4.883804427966065e-06, "loss": 1.1468, "step": 6600 }, { "epoch": 0.12, "learning_rate": 4.8837583915738005e-06, "loss": 1.1122, "step": 6601 }, { "epoch": 0.12, "learning_rate": 4.883712346280656e-06, "loss": 1.0288, "step": 6602 }, { "epoch": 0.12, "learning_rate": 4.883666292086802e-06, "loss": 0.9356, "step": 6603 }, { "epoch": 0.12, "learning_rate": 4.88362022899241e-06, "loss": 1.0545, "step": 6604 }, { "epoch": 0.12, "learning_rate": 4.883574156997655e-06, "loss": 1.1046, "step": 6605 }, { "epoch": 0.12, "learning_rate": 4.883528076102707e-06, "loss": 1.2604, "step": 6606 }, { "epoch": 0.12, "learning_rate": 4.883481986307738e-06, "loss": 1.1281, "step": 6607 }, { "epoch": 0.12, "learning_rate": 4.88343588761292e-06, "loss": 1.0955, "step": 6608 }, { "epoch": 0.12, "learning_rate": 4.883389780018426e-06, "loss": 0.7708, "step": 6609 }, { "epoch": 0.12, "learning_rate": 4.883343663524427e-06, "loss": 0.7559, "step": 6610 }, { "epoch": 0.12, "learning_rate": 4.883297538131097e-06, "loss": 1.0166, "step": 6611 }, { "epoch": 0.12, "learning_rate": 4.883251403838606e-06, "loss": 1.1445, "step": 6612 }, { "epoch": 0.12, "learning_rate": 4.883205260647127e-06, "loss": 0.9985, "step": 6613 }, { "epoch": 0.12, "learning_rate": 4.883159108556834e-06, "loss": 0.9333, "step": 6614 }, { "epoch": 0.12, "learning_rate": 4.883112947567896e-06, "loss": 0.921, "step": 6615 }, { "epoch": 0.12, "learning_rate": 4.883066777680489e-06, "loss": 0.8939, "step": 6616 }, { "epoch": 0.12, "learning_rate": 4.883020598894783e-06, "loss": 0.9327, "step": 6617 }, { "epoch": 0.12, "learning_rate": 4.882974411210952e-06, "loss": 0.9747, "step": 6618 }, { "epoch": 0.12, "learning_rate": 4.882928214629167e-06, "loss": 0.9397, "step": 6619 }, { "epoch": 0.12, "learning_rate": 4.882882009149601e-06, "loss": 0.725, "step": 6620 }, { "epoch": 0.12, "learning_rate": 4.882835794772426e-06, "loss": 0.8909, "step": 6621 }, { "epoch": 0.12, "learning_rate": 4.882789571497816e-06, "loss": 0.9435, "step": 6622 }, { "epoch": 0.12, "learning_rate": 4.882743339325943e-06, "loss": 0.9534, "step": 6623 }, { "epoch": 0.12, "learning_rate": 4.88269709825698e-06, "loss": 1.0638, "step": 6624 }, { "epoch": 0.12, "learning_rate": 4.8826508482910976e-06, "loss": 0.9618, "step": 6625 }, { "epoch": 0.13, "learning_rate": 4.882604589428471e-06, "loss": 0.7755, "step": 6626 }, { "epoch": 0.13, "learning_rate": 4.882558321669271e-06, "loss": 0.792, "step": 6627 }, { "epoch": 0.13, "learning_rate": 4.882512045013672e-06, "loss": 0.8156, "step": 6628 }, { "epoch": 0.13, "learning_rate": 4.882465759461846e-06, "loss": 0.9672, "step": 6629 }, { "epoch": 0.13, "learning_rate": 4.882419465013966e-06, "loss": 0.8958, "step": 6630 }, { "epoch": 0.13, "learning_rate": 4.882373161670204e-06, "loss": 1.2505, "step": 6631 }, { "epoch": 0.13, "learning_rate": 4.882326849430734e-06, "loss": 1.013, "step": 6632 }, { "epoch": 0.13, "learning_rate": 4.882280528295729e-06, "loss": 0.9013, "step": 6633 }, { "epoch": 0.13, "learning_rate": 4.882234198265361e-06, "loss": 0.983, "step": 6634 }, { "epoch": 0.13, "learning_rate": 4.882187859339804e-06, "loss": 0.976, "step": 6635 }, { "epoch": 0.13, "learning_rate": 4.882141511519231e-06, "loss": 0.9768, "step": 6636 }, { "epoch": 0.13, "learning_rate": 4.882095154803814e-06, "loss": 1.1339, "step": 6637 }, { "epoch": 0.13, "learning_rate": 4.8820487891937265e-06, "loss": 1.0405, "step": 6638 }, { "epoch": 0.13, "learning_rate": 4.882002414689142e-06, "loss": 0.772, "step": 6639 }, { "epoch": 0.13, "learning_rate": 4.8819560312902344e-06, "loss": 0.8884, "step": 6640 }, { "epoch": 0.13, "learning_rate": 4.881909638997176e-06, "loss": 0.9258, "step": 6641 }, { "epoch": 0.13, "learning_rate": 4.881863237810138e-06, "loss": 0.9927, "step": 6642 }, { "epoch": 0.13, "learning_rate": 4.881816827729298e-06, "loss": 1.0782, "step": 6643 }, { "epoch": 0.13, "learning_rate": 4.881770408754826e-06, "loss": 1.0735, "step": 6644 }, { "epoch": 0.13, "learning_rate": 4.881723980886896e-06, "loss": 1.0349, "step": 6645 }, { "epoch": 0.13, "learning_rate": 4.881677544125682e-06, "loss": 0.7103, "step": 6646 }, { "epoch": 0.13, "learning_rate": 4.881631098471357e-06, "loss": 1.085, "step": 6647 }, { "epoch": 0.13, "learning_rate": 4.881584643924095e-06, "loss": 0.8381, "step": 6648 }, { "epoch": 0.13, "learning_rate": 4.881538180484068e-06, "loss": 0.9816, "step": 6649 }, { "epoch": 0.13, "learning_rate": 4.881491708151451e-06, "loss": 1.3784, "step": 6650 }, { "epoch": 0.13, "learning_rate": 4.881445226926418e-06, "loss": 0.869, "step": 6651 }, { "epoch": 0.13, "learning_rate": 4.88139873680914e-06, "loss": 0.8338, "step": 6652 }, { "epoch": 0.13, "learning_rate": 4.881352237799792e-06, "loss": 1.0879, "step": 6653 }, { "epoch": 0.13, "learning_rate": 4.881305729898549e-06, "loss": 0.8742, "step": 6654 }, { "epoch": 0.13, "learning_rate": 4.881259213105583e-06, "loss": 1.1557, "step": 6655 }, { "epoch": 0.13, "learning_rate": 4.881212687421068e-06, "loss": 0.9697, "step": 6656 }, { "epoch": 0.13, "learning_rate": 4.881166152845178e-06, "loss": 0.7266, "step": 6657 }, { "epoch": 0.13, "learning_rate": 4.881119609378087e-06, "loss": 0.8822, "step": 6658 }, { "epoch": 0.13, "learning_rate": 4.881073057019967e-06, "loss": 0.9777, "step": 6659 }, { "epoch": 0.13, "learning_rate": 4.881026495770994e-06, "loss": 0.8809, "step": 6660 }, { "epoch": 0.13, "learning_rate": 4.880979925631341e-06, "loss": 1.0081, "step": 6661 }, { "epoch": 0.13, "learning_rate": 4.880933346601182e-06, "loss": 1.1427, "step": 6662 }, { "epoch": 0.13, "learning_rate": 4.880886758680691e-06, "loss": 1.1107, "step": 6663 }, { "epoch": 0.13, "learning_rate": 4.880840161870042e-06, "loss": 0.9755, "step": 6664 }, { "epoch": 0.13, "learning_rate": 4.880793556169409e-06, "loss": 1.05, "step": 6665 }, { "epoch": 0.13, "learning_rate": 4.880746941578965e-06, "loss": 0.7348, "step": 6666 }, { "epoch": 0.13, "learning_rate": 4.880700318098885e-06, "loss": 0.8513, "step": 6667 }, { "epoch": 0.13, "learning_rate": 4.880653685729344e-06, "loss": 1.2599, "step": 6668 }, { "epoch": 0.13, "learning_rate": 4.880607044470514e-06, "loss": 1.1871, "step": 6669 }, { "epoch": 0.13, "learning_rate": 4.880560394322571e-06, "loss": 0.9469, "step": 6670 }, { "epoch": 0.13, "learning_rate": 4.880513735285688e-06, "loss": 1.0247, "step": 6671 }, { "epoch": 0.13, "learning_rate": 4.88046706736004e-06, "loss": 0.9313, "step": 6672 }, { "epoch": 0.13, "learning_rate": 4.880420390545801e-06, "loss": 1.0492, "step": 6673 }, { "epoch": 0.13, "learning_rate": 4.880373704843145e-06, "loss": 1.049, "step": 6674 }, { "epoch": 0.13, "learning_rate": 4.880327010252247e-06, "loss": 1.1808, "step": 6675 }, { "epoch": 0.13, "learning_rate": 4.880280306773281e-06, "loss": 0.9818, "step": 6676 }, { "epoch": 0.13, "learning_rate": 4.880233594406421e-06, "loss": 0.7548, "step": 6677 }, { "epoch": 0.13, "learning_rate": 4.880186873151841e-06, "loss": 0.8391, "step": 6678 }, { "epoch": 0.13, "learning_rate": 4.880140143009717e-06, "loss": 0.8036, "step": 6679 }, { "epoch": 0.13, "learning_rate": 4.880093403980223e-06, "loss": 1.1648, "step": 6680 }, { "epoch": 0.13, "learning_rate": 4.880046656063533e-06, "loss": 1.0486, "step": 6681 }, { "epoch": 0.13, "learning_rate": 4.879999899259821e-06, "loss": 1.0363, "step": 6682 }, { "epoch": 0.13, "learning_rate": 4.879953133569263e-06, "loss": 0.7516, "step": 6683 }, { "epoch": 0.13, "learning_rate": 4.879906358992033e-06, "loss": 0.8926, "step": 6684 }, { "epoch": 0.13, "learning_rate": 4.8798595755283055e-06, "loss": 1.0035, "step": 6685 }, { "epoch": 0.13, "learning_rate": 4.879812783178255e-06, "loss": 0.864, "step": 6686 }, { "epoch": 0.13, "learning_rate": 4.879765981942057e-06, "loss": 1.1784, "step": 6687 }, { "epoch": 0.13, "learning_rate": 4.879719171819886e-06, "loss": 1.0297, "step": 6688 }, { "epoch": 0.13, "learning_rate": 4.879672352811916e-06, "loss": 0.9078, "step": 6689 }, { "epoch": 0.13, "learning_rate": 4.879625524918323e-06, "loss": 1.1129, "step": 6690 }, { "epoch": 0.13, "learning_rate": 4.879578688139281e-06, "loss": 0.9395, "step": 6691 }, { "epoch": 0.13, "learning_rate": 4.879531842474965e-06, "loss": 0.8721, "step": 6692 }, { "epoch": 0.13, "learning_rate": 4.87948498792555e-06, "loss": 1.1877, "step": 6693 }, { "epoch": 0.13, "learning_rate": 4.8794381244912105e-06, "loss": 1.179, "step": 6694 }, { "epoch": 0.13, "learning_rate": 4.8793912521721224e-06, "loss": 1.0462, "step": 6695 }, { "epoch": 0.13, "learning_rate": 4.879344370968461e-06, "loss": 0.9955, "step": 6696 }, { "epoch": 0.13, "learning_rate": 4.8792974808804e-06, "loss": 0.8464, "step": 6697 }, { "epoch": 0.13, "learning_rate": 4.879250581908115e-06, "loss": 0.7999, "step": 6698 }, { "epoch": 0.13, "learning_rate": 4.879203674051782e-06, "loss": 0.8058, "step": 6699 }, { "epoch": 0.13, "learning_rate": 4.879156757311575e-06, "loss": 1.0399, "step": 6700 }, { "epoch": 0.13, "learning_rate": 4.87910983168767e-06, "loss": 0.9254, "step": 6701 }, { "epoch": 0.13, "learning_rate": 4.879062897180241e-06, "loss": 0.9495, "step": 6702 }, { "epoch": 0.13, "learning_rate": 4.879015953789464e-06, "loss": 0.9172, "step": 6703 }, { "epoch": 0.13, "learning_rate": 4.878969001515515e-06, "loss": 0.9089, "step": 6704 }, { "epoch": 0.13, "learning_rate": 4.878922040358569e-06, "loss": 0.9387, "step": 6705 }, { "epoch": 0.13, "learning_rate": 4.878875070318801e-06, "loss": 1.1091, "step": 6706 }, { "epoch": 0.13, "learning_rate": 4.878828091396386e-06, "loss": 0.938, "step": 6707 }, { "epoch": 0.13, "learning_rate": 4.8787811035915e-06, "loss": 0.9135, "step": 6708 }, { "epoch": 0.13, "learning_rate": 4.878734106904318e-06, "loss": 1.0436, "step": 6709 }, { "epoch": 0.13, "learning_rate": 4.878687101335016e-06, "loss": 0.8549, "step": 6710 }, { "epoch": 0.13, "learning_rate": 4.878640086883769e-06, "loss": 1.0016, "step": 6711 }, { "epoch": 0.13, "learning_rate": 4.878593063550754e-06, "loss": 1.0126, "step": 6712 }, { "epoch": 0.13, "learning_rate": 4.878546031336144e-06, "loss": 1.0394, "step": 6713 }, { "epoch": 0.13, "learning_rate": 4.878498990240117e-06, "loss": 0.8812, "step": 6714 }, { "epoch": 0.13, "learning_rate": 4.8784519402628476e-06, "loss": 0.8661, "step": 6715 }, { "epoch": 0.13, "learning_rate": 4.878404881404511e-06, "loss": 0.9557, "step": 6716 }, { "epoch": 0.13, "learning_rate": 4.878357813665283e-06, "loss": 1.0349, "step": 6717 }, { "epoch": 0.13, "learning_rate": 4.878310737045341e-06, "loss": 0.9723, "step": 6718 }, { "epoch": 0.13, "learning_rate": 4.878263651544859e-06, "loss": 1.1305, "step": 6719 }, { "epoch": 0.13, "learning_rate": 4.8782165571640135e-06, "loss": 0.9723, "step": 6720 }, { "epoch": 0.13, "learning_rate": 4.878169453902981e-06, "loss": 0.8571, "step": 6721 }, { "epoch": 0.13, "learning_rate": 4.878122341761936e-06, "loss": 0.9265, "step": 6722 }, { "epoch": 0.13, "learning_rate": 4.878075220741055e-06, "loss": 0.8721, "step": 6723 }, { "epoch": 0.13, "learning_rate": 4.878028090840515e-06, "loss": 1.0449, "step": 6724 }, { "epoch": 0.13, "learning_rate": 4.87798095206049e-06, "loss": 1.0222, "step": 6725 }, { "epoch": 0.13, "learning_rate": 4.877933804401158e-06, "loss": 0.8803, "step": 6726 }, { "epoch": 0.13, "learning_rate": 4.877886647862693e-06, "loss": 0.8934, "step": 6727 }, { "epoch": 0.13, "learning_rate": 4.8778394824452725e-06, "loss": 1.054, "step": 6728 }, { "epoch": 0.13, "learning_rate": 4.8777923081490725e-06, "loss": 0.8897, "step": 6729 }, { "epoch": 0.13, "learning_rate": 4.877745124974269e-06, "loss": 1.1664, "step": 6730 }, { "epoch": 0.13, "learning_rate": 4.877697932921038e-06, "loss": 1.2156, "step": 6731 }, { "epoch": 0.13, "learning_rate": 4.8776507319895556e-06, "loss": 1.0564, "step": 6732 }, { "epoch": 0.13, "learning_rate": 4.877603522179998e-06, "loss": 0.7313, "step": 6733 }, { "epoch": 0.13, "learning_rate": 4.877556303492542e-06, "loss": 0.832, "step": 6734 }, { "epoch": 0.13, "learning_rate": 4.877509075927364e-06, "loss": 0.8304, "step": 6735 }, { "epoch": 0.13, "learning_rate": 4.8774618394846405e-06, "loss": 1.0034, "step": 6736 }, { "epoch": 0.13, "learning_rate": 4.877414594164547e-06, "loss": 0.9161, "step": 6737 }, { "epoch": 0.13, "learning_rate": 4.877367339967259e-06, "loss": 1.2986, "step": 6738 }, { "epoch": 0.13, "learning_rate": 4.877320076892955e-06, "loss": 0.9984, "step": 6739 }, { "epoch": 0.13, "learning_rate": 4.877272804941812e-06, "loss": 0.9273, "step": 6740 }, { "epoch": 0.13, "learning_rate": 4.877225524114003e-06, "loss": 0.9686, "step": 6741 }, { "epoch": 0.13, "learning_rate": 4.877178234409708e-06, "loss": 0.8831, "step": 6742 }, { "epoch": 0.13, "learning_rate": 4.877130935829103e-06, "loss": 1.1307, "step": 6743 }, { "epoch": 0.13, "learning_rate": 4.877083628372363e-06, "loss": 1.0789, "step": 6744 }, { "epoch": 0.13, "learning_rate": 4.877036312039666e-06, "loss": 0.9279, "step": 6745 }, { "epoch": 0.13, "learning_rate": 4.876988986831188e-06, "loss": 0.8453, "step": 6746 }, { "epoch": 0.13, "learning_rate": 4.876941652747107e-06, "loss": 1.0349, "step": 6747 }, { "epoch": 0.13, "learning_rate": 4.876894309787598e-06, "loss": 0.8907, "step": 6748 }, { "epoch": 0.13, "learning_rate": 4.876846957952838e-06, "loss": 0.9062, "step": 6749 }, { "epoch": 0.13, "learning_rate": 4.876799597243005e-06, "loss": 1.2352, "step": 6750 }, { "epoch": 0.13, "learning_rate": 4.876752227658275e-06, "loss": 0.9943, "step": 6751 }, { "epoch": 0.13, "learning_rate": 4.876704849198825e-06, "loss": 0.8734, "step": 6752 }, { "epoch": 0.13, "learning_rate": 4.8766574618648325e-06, "loss": 0.9622, "step": 6753 }, { "epoch": 0.13, "learning_rate": 4.876610065656473e-06, "loss": 1.0222, "step": 6754 }, { "epoch": 0.13, "learning_rate": 4.876562660573925e-06, "loss": 0.8565, "step": 6755 }, { "epoch": 0.13, "learning_rate": 4.8765152466173645e-06, "loss": 1.1497, "step": 6756 }, { "epoch": 0.13, "learning_rate": 4.876467823786969e-06, "loss": 1.204, "step": 6757 }, { "epoch": 0.13, "learning_rate": 4.876420392082916e-06, "loss": 0.7742, "step": 6758 }, { "epoch": 0.13, "learning_rate": 4.876372951505382e-06, "loss": 0.9737, "step": 6759 }, { "epoch": 0.13, "learning_rate": 4.8763255020545445e-06, "loss": 0.9312, "step": 6760 }, { "epoch": 0.13, "learning_rate": 4.876278043730579e-06, "loss": 0.9956, "step": 6761 }, { "epoch": 0.13, "learning_rate": 4.8762305765336654e-06, "loss": 1.1507, "step": 6762 }, { "epoch": 0.13, "learning_rate": 4.876183100463979e-06, "loss": 1.1465, "step": 6763 }, { "epoch": 0.13, "learning_rate": 4.8761356155216985e-06, "loss": 0.8251, "step": 6764 }, { "epoch": 0.13, "learning_rate": 4.876088121707e-06, "loss": 0.9418, "step": 6765 }, { "epoch": 0.13, "learning_rate": 4.876040619020062e-06, "loss": 0.7779, "step": 6766 }, { "epoch": 0.13, "learning_rate": 4.8759931074610604e-06, "loss": 0.9405, "step": 6767 }, { "epoch": 0.13, "learning_rate": 4.875945587030173e-06, "loss": 0.9958, "step": 6768 }, { "epoch": 0.13, "learning_rate": 4.875898057727579e-06, "loss": 1.0519, "step": 6769 }, { "epoch": 0.13, "learning_rate": 4.875850519553453e-06, "loss": 0.9649, "step": 6770 }, { "epoch": 0.13, "learning_rate": 4.875802972507975e-06, "loss": 0.9703, "step": 6771 }, { "epoch": 0.13, "learning_rate": 4.875755416591321e-06, "loss": 1.0359, "step": 6772 }, { "epoch": 0.13, "learning_rate": 4.8757078518036695e-06, "loss": 0.8705, "step": 6773 }, { "epoch": 0.13, "learning_rate": 4.875660278145197e-06, "loss": 1.0353, "step": 6774 }, { "epoch": 0.13, "learning_rate": 4.875612695616083e-06, "loss": 1.1502, "step": 6775 }, { "epoch": 0.13, "learning_rate": 4.875565104216504e-06, "loss": 1.0172, "step": 6776 }, { "epoch": 0.13, "learning_rate": 4.875517503946637e-06, "loss": 0.8801, "step": 6777 }, { "epoch": 0.13, "learning_rate": 4.875469894806661e-06, "loss": 0.837, "step": 6778 }, { "epoch": 0.13, "learning_rate": 4.875422276796753e-06, "loss": 0.9324, "step": 6779 }, { "epoch": 0.13, "learning_rate": 4.875374649917091e-06, "loss": 0.8413, "step": 6780 }, { "epoch": 0.13, "learning_rate": 4.875327014167853e-06, "loss": 1.2331, "step": 6781 }, { "epoch": 0.13, "learning_rate": 4.875279369549216e-06, "loss": 0.9012, "step": 6782 }, { "epoch": 0.13, "learning_rate": 4.87523171606136e-06, "loss": 0.9844, "step": 6783 }, { "epoch": 0.13, "learning_rate": 4.87518405370446e-06, "loss": 0.9735, "step": 6784 }, { "epoch": 0.13, "learning_rate": 4.875136382478697e-06, "loss": 0.7554, "step": 6785 }, { "epoch": 0.13, "learning_rate": 4.875088702384247e-06, "loss": 0.9512, "step": 6786 }, { "epoch": 0.13, "learning_rate": 4.875041013421289e-06, "loss": 1.1345, "step": 6787 }, { "epoch": 0.13, "learning_rate": 4.8749933155899994e-06, "loss": 0.9555, "step": 6788 }, { "epoch": 0.13, "learning_rate": 4.8749456088905585e-06, "loss": 0.8797, "step": 6789 }, { "epoch": 0.13, "learning_rate": 4.8748978933231435e-06, "loss": 1.0682, "step": 6790 }, { "epoch": 0.13, "learning_rate": 4.874850168887934e-06, "loss": 0.7932, "step": 6791 }, { "epoch": 0.13, "learning_rate": 4.874802435585105e-06, "loss": 1.0727, "step": 6792 }, { "epoch": 0.13, "learning_rate": 4.874754693414837e-06, "loss": 0.8538, "step": 6793 }, { "epoch": 0.13, "learning_rate": 4.8747069423773075e-06, "loss": 0.8265, "step": 6794 }, { "epoch": 0.13, "learning_rate": 4.874659182472695e-06, "loss": 0.8429, "step": 6795 }, { "epoch": 0.13, "learning_rate": 4.874611413701179e-06, "loss": 0.887, "step": 6796 }, { "epoch": 0.13, "learning_rate": 4.874563636062936e-06, "loss": 0.9708, "step": 6797 }, { "epoch": 0.13, "learning_rate": 4.874515849558145e-06, "loss": 0.9684, "step": 6798 }, { "epoch": 0.13, "learning_rate": 4.874468054186984e-06, "loss": 0.9049, "step": 6799 }, { "epoch": 0.13, "learning_rate": 4.8744202499496336e-06, "loss": 1.3153, "step": 6800 }, { "epoch": 0.13, "learning_rate": 4.87437243684627e-06, "loss": 1.1735, "step": 6801 }, { "epoch": 0.13, "learning_rate": 4.874324614877072e-06, "loss": 1.1351, "step": 6802 }, { "epoch": 0.13, "learning_rate": 4.87427678404222e-06, "loss": 0.9714, "step": 6803 }, { "epoch": 0.13, "learning_rate": 4.87422894434189e-06, "loss": 0.9412, "step": 6804 }, { "epoch": 0.13, "learning_rate": 4.874181095776263e-06, "loss": 0.8686, "step": 6805 }, { "epoch": 0.13, "learning_rate": 4.874133238345516e-06, "loss": 1.1402, "step": 6806 }, { "epoch": 0.13, "learning_rate": 4.874085372049828e-06, "loss": 1.0468, "step": 6807 }, { "epoch": 0.13, "learning_rate": 4.8740374968893786e-06, "loss": 0.8043, "step": 6808 }, { "epoch": 0.13, "learning_rate": 4.873989612864346e-06, "loss": 0.8292, "step": 6809 }, { "epoch": 0.13, "learning_rate": 4.873941719974908e-06, "loss": 0.8054, "step": 6810 }, { "epoch": 0.13, "learning_rate": 4.873893818221246e-06, "loss": 1.0376, "step": 6811 }, { "epoch": 0.13, "learning_rate": 4.873845907603536e-06, "loss": 1.2803, "step": 6812 }, { "epoch": 0.13, "learning_rate": 4.873797988121959e-06, "loss": 0.9572, "step": 6813 }, { "epoch": 0.13, "learning_rate": 4.873750059776692e-06, "loss": 0.8204, "step": 6814 }, { "epoch": 0.13, "learning_rate": 4.8737021225679156e-06, "loss": 1.0209, "step": 6815 }, { "epoch": 0.13, "learning_rate": 4.873654176495809e-06, "loss": 0.7865, "step": 6816 }, { "epoch": 0.13, "learning_rate": 4.873606221560549e-06, "loss": 1.0341, "step": 6817 }, { "epoch": 0.13, "learning_rate": 4.873558257762318e-06, "loss": 1.13, "step": 6818 }, { "epoch": 0.13, "learning_rate": 4.8735102851012915e-06, "loss": 1.1415, "step": 6819 }, { "epoch": 0.13, "learning_rate": 4.873462303577652e-06, "loss": 0.9945, "step": 6820 }, { "epoch": 0.13, "learning_rate": 4.8734143131915755e-06, "loss": 0.8731, "step": 6821 }, { "epoch": 0.13, "learning_rate": 4.873366313943243e-06, "loss": 1.0094, "step": 6822 }, { "epoch": 0.13, "learning_rate": 4.873318305832834e-06, "loss": 1.0255, "step": 6823 }, { "epoch": 0.13, "learning_rate": 4.873270288860527e-06, "loss": 0.8885, "step": 6824 }, { "epoch": 0.13, "learning_rate": 4.873222263026502e-06, "loss": 1.0267, "step": 6825 }, { "epoch": 0.13, "learning_rate": 4.873174228330937e-06, "loss": 0.9417, "step": 6826 }, { "epoch": 0.13, "learning_rate": 4.873126184774013e-06, "loss": 0.9993, "step": 6827 }, { "epoch": 0.13, "learning_rate": 4.873078132355908e-06, "loss": 0.8948, "step": 6828 }, { "epoch": 0.13, "learning_rate": 4.873030071076802e-06, "loss": 0.9337, "step": 6829 }, { "epoch": 0.13, "learning_rate": 4.872982000936875e-06, "loss": 1.0922, "step": 6830 }, { "epoch": 0.13, "learning_rate": 4.872933921936305e-06, "loss": 1.0594, "step": 6831 }, { "epoch": 0.13, "learning_rate": 4.872885834075273e-06, "loss": 1.014, "step": 6832 }, { "epoch": 0.13, "learning_rate": 4.872837737353958e-06, "loss": 0.9406, "step": 6833 }, { "epoch": 0.13, "learning_rate": 4.87278963177254e-06, "loss": 0.9914, "step": 6834 }, { "epoch": 0.13, "learning_rate": 4.872741517331199e-06, "loss": 0.9949, "step": 6835 }, { "epoch": 0.13, "learning_rate": 4.872693394030112e-06, "loss": 0.9845, "step": 6836 }, { "epoch": 0.13, "learning_rate": 4.872645261869462e-06, "loss": 1.2223, "step": 6837 }, { "epoch": 0.13, "learning_rate": 4.872597120849427e-06, "loss": 0.999, "step": 6838 }, { "epoch": 0.13, "learning_rate": 4.872548970970186e-06, "loss": 0.8965, "step": 6839 }, { "epoch": 0.13, "learning_rate": 4.872500812231921e-06, "loss": 0.9444, "step": 6840 }, { "epoch": 0.13, "learning_rate": 4.8724526446348115e-06, "loss": 0.8394, "step": 6841 }, { "epoch": 0.13, "learning_rate": 4.8724044681790355e-06, "loss": 0.9489, "step": 6842 }, { "epoch": 0.13, "learning_rate": 4.872356282864774e-06, "loss": 1.0306, "step": 6843 }, { "epoch": 0.13, "learning_rate": 4.872308088692207e-06, "loss": 0.8503, "step": 6844 }, { "epoch": 0.13, "learning_rate": 4.872259885661514e-06, "loss": 0.9272, "step": 6845 }, { "epoch": 0.13, "learning_rate": 4.872211673772876e-06, "loss": 0.8437, "step": 6846 }, { "epoch": 0.13, "learning_rate": 4.872163453026472e-06, "loss": 0.8546, "step": 6847 }, { "epoch": 0.13, "learning_rate": 4.872115223422482e-06, "loss": 0.8206, "step": 6848 }, { "epoch": 0.13, "learning_rate": 4.872066984961088e-06, "loss": 0.9729, "step": 6849 }, { "epoch": 0.13, "learning_rate": 4.8720187376424675e-06, "loss": 1.0898, "step": 6850 }, { "epoch": 0.13, "learning_rate": 4.871970481466801e-06, "loss": 0.8902, "step": 6851 }, { "epoch": 0.13, "learning_rate": 4.87192221643427e-06, "loss": 0.8286, "step": 6852 }, { "epoch": 0.13, "learning_rate": 4.871873942545055e-06, "loss": 1.0314, "step": 6853 }, { "epoch": 0.13, "learning_rate": 4.871825659799335e-06, "loss": 0.9518, "step": 6854 }, { "epoch": 0.13, "learning_rate": 4.87177736819729e-06, "loss": 0.9619, "step": 6855 }, { "epoch": 0.13, "learning_rate": 4.8717290677391014e-06, "loss": 1.0777, "step": 6856 }, { "epoch": 0.13, "learning_rate": 4.87168075842495e-06, "loss": 0.8427, "step": 6857 }, { "epoch": 0.13, "learning_rate": 4.8716324402550145e-06, "loss": 0.8509, "step": 6858 }, { "epoch": 0.13, "learning_rate": 4.871584113229476e-06, "loss": 0.9949, "step": 6859 }, { "epoch": 0.13, "learning_rate": 4.871535777348516e-06, "loss": 0.8965, "step": 6860 }, { "epoch": 0.13, "learning_rate": 4.871487432612313e-06, "loss": 1.0401, "step": 6861 }, { "epoch": 0.13, "learning_rate": 4.87143907902105e-06, "loss": 1.1284, "step": 6862 }, { "epoch": 0.13, "learning_rate": 4.871390716574905e-06, "loss": 0.9063, "step": 6863 }, { "epoch": 0.13, "learning_rate": 4.87134234527406e-06, "loss": 1.0052, "step": 6864 }, { "epoch": 0.13, "learning_rate": 4.871293965118697e-06, "loss": 0.9501, "step": 6865 }, { "epoch": 0.13, "learning_rate": 4.871245576108993e-06, "loss": 0.8429, "step": 6866 }, { "epoch": 0.13, "learning_rate": 4.871197178245131e-06, "loss": 0.8614, "step": 6867 }, { "epoch": 0.13, "learning_rate": 4.871148771527292e-06, "loss": 1.0208, "step": 6868 }, { "epoch": 0.13, "learning_rate": 4.871100355955656e-06, "loss": 1.1042, "step": 6869 }, { "epoch": 0.13, "learning_rate": 4.871051931530404e-06, "loss": 0.9968, "step": 6870 }, { "epoch": 0.13, "learning_rate": 4.871003498251716e-06, "loss": 0.9419, "step": 6871 }, { "epoch": 0.13, "learning_rate": 4.870955056119775e-06, "loss": 1.1522, "step": 6872 }, { "epoch": 0.13, "learning_rate": 4.87090660513476e-06, "loss": 0.9282, "step": 6873 }, { "epoch": 0.13, "learning_rate": 4.870858145296852e-06, "loss": 0.9116, "step": 6874 }, { "epoch": 0.13, "learning_rate": 4.870809676606233e-06, "loss": 0.9879, "step": 6875 }, { "epoch": 0.13, "learning_rate": 4.870761199063083e-06, "loss": 0.9897, "step": 6876 }, { "epoch": 0.13, "learning_rate": 4.870712712667583e-06, "loss": 0.9357, "step": 6877 }, { "epoch": 0.13, "learning_rate": 4.870664217419916e-06, "loss": 1.0474, "step": 6878 }, { "epoch": 0.13, "learning_rate": 4.87061571332026e-06, "loss": 0.7551, "step": 6879 }, { "epoch": 0.13, "learning_rate": 4.870567200368797e-06, "loss": 0.8384, "step": 6880 }, { "epoch": 0.13, "learning_rate": 4.870518678565711e-06, "loss": 1.3048, "step": 6881 }, { "epoch": 0.13, "learning_rate": 4.870470147911179e-06, "loss": 0.9641, "step": 6882 }, { "epoch": 0.13, "learning_rate": 4.870421608405385e-06, "loss": 0.9877, "step": 6883 }, { "epoch": 0.13, "learning_rate": 4.87037306004851e-06, "loss": 0.9992, "step": 6884 }, { "epoch": 0.13, "learning_rate": 4.8703245028407335e-06, "loss": 0.8251, "step": 6885 }, { "epoch": 0.13, "learning_rate": 4.870275936782238e-06, "loss": 1.0444, "step": 6886 }, { "epoch": 0.13, "learning_rate": 4.8702273618732054e-06, "loss": 1.0636, "step": 6887 }, { "epoch": 0.13, "learning_rate": 4.870178778113817e-06, "loss": 0.9989, "step": 6888 }, { "epoch": 0.13, "learning_rate": 4.870130185504252e-06, "loss": 0.9971, "step": 6889 }, { "epoch": 0.13, "learning_rate": 4.870081584044695e-06, "loss": 0.9447, "step": 6890 }, { "epoch": 0.13, "learning_rate": 4.8700329737353254e-06, "loss": 0.8374, "step": 6891 }, { "epoch": 0.13, "learning_rate": 4.869984354576326e-06, "loss": 0.9808, "step": 6892 }, { "epoch": 0.13, "learning_rate": 4.869935726567877e-06, "loss": 1.0047, "step": 6893 }, { "epoch": 0.13, "learning_rate": 4.86988708971016e-06, "loss": 0.886, "step": 6894 }, { "epoch": 0.13, "learning_rate": 4.869838444003359e-06, "loss": 0.9753, "step": 6895 }, { "epoch": 0.13, "learning_rate": 4.869789789447653e-06, "loss": 0.7767, "step": 6896 }, { "epoch": 0.13, "learning_rate": 4.8697411260432246e-06, "loss": 0.7956, "step": 6897 }, { "epoch": 0.13, "learning_rate": 4.869692453790256e-06, "loss": 0.9311, "step": 6898 }, { "epoch": 0.13, "learning_rate": 4.869643772688928e-06, "loss": 1.0751, "step": 6899 }, { "epoch": 0.13, "learning_rate": 4.869595082739422e-06, "loss": 1.0894, "step": 6900 }, { "epoch": 0.13, "learning_rate": 4.869546383941922e-06, "loss": 1.2285, "step": 6901 }, { "epoch": 0.13, "learning_rate": 4.869497676296607e-06, "loss": 1.152, "step": 6902 }, { "epoch": 0.13, "learning_rate": 4.869448959803662e-06, "loss": 1.0316, "step": 6903 }, { "epoch": 0.13, "learning_rate": 4.869400234463266e-06, "loss": 0.8948, "step": 6904 }, { "epoch": 0.13, "learning_rate": 4.8693515002756035e-06, "loss": 0.9673, "step": 6905 }, { "epoch": 0.13, "learning_rate": 4.869302757240854e-06, "loss": 0.8956, "step": 6906 }, { "epoch": 0.13, "learning_rate": 4.8692540053592004e-06, "loss": 0.8859, "step": 6907 }, { "epoch": 0.13, "learning_rate": 4.869205244630826e-06, "loss": 0.7968, "step": 6908 }, { "epoch": 0.13, "learning_rate": 4.869156475055911e-06, "loss": 0.7273, "step": 6909 }, { "epoch": 0.13, "learning_rate": 4.869107696634638e-06, "loss": 0.9448, "step": 6910 }, { "epoch": 0.13, "learning_rate": 4.86905890936719e-06, "loss": 0.9584, "step": 6911 }, { "epoch": 0.13, "learning_rate": 4.869010113253749e-06, "loss": 0.994, "step": 6912 }, { "epoch": 0.13, "learning_rate": 4.868961308294497e-06, "loss": 1.197, "step": 6913 }, { "epoch": 0.13, "learning_rate": 4.868912494489616e-06, "loss": 0.952, "step": 6914 }, { "epoch": 0.13, "learning_rate": 4.868863671839288e-06, "loss": 0.7937, "step": 6915 }, { "epoch": 0.13, "learning_rate": 4.868814840343697e-06, "loss": 0.8894, "step": 6916 }, { "epoch": 0.13, "learning_rate": 4.868766000003022e-06, "loss": 1.0528, "step": 6917 }, { "epoch": 0.13, "learning_rate": 4.868717150817448e-06, "loss": 1.2024, "step": 6918 }, { "epoch": 0.13, "learning_rate": 4.868668292787157e-06, "loss": 1.1422, "step": 6919 }, { "epoch": 0.13, "learning_rate": 4.868619425912332e-06, "loss": 0.9883, "step": 6920 }, { "epoch": 0.13, "learning_rate": 4.8685705501931535e-06, "loss": 1.0441, "step": 6921 }, { "epoch": 0.13, "learning_rate": 4.8685216656298065e-06, "loss": 0.9277, "step": 6922 }, { "epoch": 0.13, "learning_rate": 4.8684727722224715e-06, "loss": 0.8661, "step": 6923 }, { "epoch": 0.13, "learning_rate": 4.868423869971331e-06, "loss": 1.1634, "step": 6924 }, { "epoch": 0.13, "learning_rate": 4.86837495887657e-06, "loss": 1.1099, "step": 6925 }, { "epoch": 0.13, "learning_rate": 4.868326038938368e-06, "loss": 0.833, "step": 6926 }, { "epoch": 0.13, "learning_rate": 4.868277110156909e-06, "loss": 0.9078, "step": 6927 }, { "epoch": 0.13, "learning_rate": 4.8682281725323775e-06, "loss": 0.9668, "step": 6928 }, { "epoch": 0.13, "learning_rate": 4.868179226064954e-06, "loss": 0.9236, "step": 6929 }, { "epoch": 0.13, "learning_rate": 4.8681302707548215e-06, "loss": 1.231, "step": 6930 }, { "epoch": 0.13, "learning_rate": 4.868081306602162e-06, "loss": 1.0901, "step": 6931 }, { "epoch": 0.13, "learning_rate": 4.868032333607162e-06, "loss": 0.9453, "step": 6932 }, { "epoch": 0.13, "learning_rate": 4.8679833517700005e-06, "loss": 0.8277, "step": 6933 }, { "epoch": 0.13, "learning_rate": 4.867934361090862e-06, "loss": 0.783, "step": 6934 }, { "epoch": 0.13, "learning_rate": 4.86788536156993e-06, "loss": 1.012, "step": 6935 }, { "epoch": 0.13, "learning_rate": 4.8678363532073844e-06, "loss": 0.8638, "step": 6936 }, { "epoch": 0.13, "learning_rate": 4.867787336003412e-06, "loss": 1.1213, "step": 6937 }, { "epoch": 0.13, "learning_rate": 4.867738309958194e-06, "loss": 1.1237, "step": 6938 }, { "epoch": 0.13, "learning_rate": 4.867689275071915e-06, "loss": 0.924, "step": 6939 }, { "epoch": 0.13, "learning_rate": 4.867640231344756e-06, "loss": 0.7417, "step": 6940 }, { "epoch": 0.13, "learning_rate": 4.8675911787769e-06, "loss": 0.9653, "step": 6941 }, { "epoch": 0.13, "learning_rate": 4.867542117368532e-06, "loss": 1.1074, "step": 6942 }, { "epoch": 0.13, "learning_rate": 4.867493047119834e-06, "loss": 1.0999, "step": 6943 }, { "epoch": 0.13, "learning_rate": 4.86744396803099e-06, "loss": 1.1889, "step": 6944 }, { "epoch": 0.13, "learning_rate": 4.867394880102183e-06, "loss": 0.9363, "step": 6945 }, { "epoch": 0.13, "learning_rate": 4.867345783333595e-06, "loss": 0.8416, "step": 6946 }, { "epoch": 0.13, "learning_rate": 4.867296677725411e-06, "loss": 0.9517, "step": 6947 }, { "epoch": 0.13, "learning_rate": 4.867247563277814e-06, "loss": 0.9534, "step": 6948 }, { "epoch": 0.13, "learning_rate": 4.867198439990988e-06, "loss": 0.944, "step": 6949 }, { "epoch": 0.13, "learning_rate": 4.8671493078651135e-06, "loss": 1.0942, "step": 6950 }, { "epoch": 0.13, "learning_rate": 4.867100166900378e-06, "loss": 1.0923, "step": 6951 }, { "epoch": 0.13, "learning_rate": 4.8670510170969624e-06, "loss": 0.8985, "step": 6952 }, { "epoch": 0.13, "learning_rate": 4.8670018584550506e-06, "loss": 1.1491, "step": 6953 }, { "epoch": 0.13, "learning_rate": 4.866952690974827e-06, "loss": 0.9905, "step": 6954 }, { "epoch": 0.13, "learning_rate": 4.866903514656473e-06, "loss": 1.0969, "step": 6955 }, { "epoch": 0.13, "learning_rate": 4.866854329500176e-06, "loss": 1.1431, "step": 6956 }, { "epoch": 0.13, "learning_rate": 4.866805135506116e-06, "loss": 0.9184, "step": 6957 }, { "epoch": 0.13, "learning_rate": 4.866755932674479e-06, "loss": 0.7328, "step": 6958 }, { "epoch": 0.13, "learning_rate": 4.866706721005448e-06, "loss": 0.9335, "step": 6959 }, { "epoch": 0.13, "learning_rate": 4.8666575004992056e-06, "loss": 0.9015, "step": 6960 }, { "epoch": 0.13, "learning_rate": 4.866608271155937e-06, "loss": 0.8759, "step": 6961 }, { "epoch": 0.13, "learning_rate": 4.866559032975827e-06, "loss": 1.0844, "step": 6962 }, { "epoch": 0.13, "learning_rate": 4.8665097859590574e-06, "loss": 1.0955, "step": 6963 }, { "epoch": 0.13, "learning_rate": 4.866460530105812e-06, "loss": 0.8748, "step": 6964 }, { "epoch": 0.13, "learning_rate": 4.866411265416276e-06, "loss": 0.931, "step": 6965 }, { "epoch": 0.13, "learning_rate": 4.8663619918906335e-06, "loss": 0.8408, "step": 6966 }, { "epoch": 0.13, "learning_rate": 4.8663127095290675e-06, "loss": 0.9606, "step": 6967 }, { "epoch": 0.13, "learning_rate": 4.866263418331763e-06, "loss": 1.0378, "step": 6968 }, { "epoch": 0.13, "learning_rate": 4.866214118298902e-06, "loss": 1.1984, "step": 6969 }, { "epoch": 0.13, "learning_rate": 4.86616480943067e-06, "loss": 0.8114, "step": 6970 }, { "epoch": 0.13, "learning_rate": 4.866115491727253e-06, "loss": 0.8814, "step": 6971 }, { "epoch": 0.13, "learning_rate": 4.866066165188832e-06, "loss": 0.9679, "step": 6972 }, { "epoch": 0.13, "learning_rate": 4.866016829815593e-06, "loss": 0.9789, "step": 6973 }, { "epoch": 0.13, "learning_rate": 4.865967485607719e-06, "loss": 0.948, "step": 6974 }, { "epoch": 0.13, "learning_rate": 4.865918132565396e-06, "loss": 1.3123, "step": 6975 }, { "epoch": 0.13, "learning_rate": 4.865868770688807e-06, "loss": 1.0232, "step": 6976 }, { "epoch": 0.13, "learning_rate": 4.865819399978136e-06, "loss": 0.8406, "step": 6977 }, { "epoch": 0.13, "learning_rate": 4.8657700204335675e-06, "loss": 0.976, "step": 6978 }, { "epoch": 0.13, "learning_rate": 4.865720632055286e-06, "loss": 0.89, "step": 6979 }, { "epoch": 0.13, "learning_rate": 4.865671234843477e-06, "loss": 0.8384, "step": 6980 }, { "epoch": 0.13, "learning_rate": 4.865621828798325e-06, "loss": 1.0936, "step": 6981 }, { "epoch": 0.13, "learning_rate": 4.865572413920013e-06, "loss": 0.925, "step": 6982 }, { "epoch": 0.13, "learning_rate": 4.865522990208726e-06, "loss": 1.0325, "step": 6983 }, { "epoch": 0.13, "learning_rate": 4.865473557664648e-06, "loss": 0.9573, "step": 6984 }, { "epoch": 0.13, "learning_rate": 4.865424116287966e-06, "loss": 1.0362, "step": 6985 }, { "epoch": 0.13, "learning_rate": 4.8653746660788616e-06, "loss": 0.9149, "step": 6986 }, { "epoch": 0.13, "learning_rate": 4.8653252070375205e-06, "loss": 1.0894, "step": 6987 }, { "epoch": 0.13, "learning_rate": 4.865275739164128e-06, "loss": 0.9409, "step": 6988 }, { "epoch": 0.13, "learning_rate": 4.8652262624588684e-06, "loss": 0.9526, "step": 6989 }, { "epoch": 0.13, "learning_rate": 4.865176776921926e-06, "loss": 1.0956, "step": 6990 }, { "epoch": 0.13, "learning_rate": 4.865127282553487e-06, "loss": 0.8383, "step": 6991 }, { "epoch": 0.13, "learning_rate": 4.865077779353735e-06, "loss": 0.9417, "step": 6992 }, { "epoch": 0.13, "learning_rate": 4.865028267322854e-06, "loss": 0.8969, "step": 6993 }, { "epoch": 0.13, "learning_rate": 4.864978746461031e-06, "loss": 1.027, "step": 6994 }, { "epoch": 0.13, "learning_rate": 4.864929216768449e-06, "loss": 1.035, "step": 6995 }, { "epoch": 0.13, "learning_rate": 4.864879678245296e-06, "loss": 1.053, "step": 6996 }, { "epoch": 0.13, "learning_rate": 4.864830130891752e-06, "loss": 1.012, "step": 6997 }, { "epoch": 0.13, "learning_rate": 4.8647805747080065e-06, "loss": 0.9491, "step": 6998 }, { "epoch": 0.13, "learning_rate": 4.864731009694242e-06, "loss": 0.957, "step": 6999 }, { "epoch": 0.13, "learning_rate": 4.864681435850645e-06, "loss": 1.0358, "step": 7000 }, { "epoch": 0.13, "learning_rate": 4.8646318531774e-06, "loss": 0.8172, "step": 7001 }, { "epoch": 0.13, "learning_rate": 4.864582261674692e-06, "loss": 0.9391, "step": 7002 }, { "epoch": 0.13, "learning_rate": 4.8645326613427065e-06, "loss": 1.0745, "step": 7003 }, { "epoch": 0.13, "learning_rate": 4.864483052181628e-06, "loss": 0.7966, "step": 7004 }, { "epoch": 0.13, "learning_rate": 4.864433434191643e-06, "loss": 0.9241, "step": 7005 }, { "epoch": 0.13, "learning_rate": 4.864383807372936e-06, "loss": 1.2325, "step": 7006 }, { "epoch": 0.13, "learning_rate": 4.864334171725692e-06, "loss": 1.0607, "step": 7007 }, { "epoch": 0.13, "learning_rate": 4.864284527250096e-06, "loss": 1.0328, "step": 7008 }, { "epoch": 0.13, "learning_rate": 4.864234873946335e-06, "loss": 0.7176, "step": 7009 }, { "epoch": 0.13, "learning_rate": 4.864185211814594e-06, "loss": 0.8636, "step": 7010 }, { "epoch": 0.13, "learning_rate": 4.864135540855056e-06, "loss": 0.7496, "step": 7011 }, { "epoch": 0.13, "learning_rate": 4.86408586106791e-06, "loss": 1.2164, "step": 7012 }, { "epoch": 0.13, "learning_rate": 4.8640361724533395e-06, "loss": 1.1283, "step": 7013 }, { "epoch": 0.13, "learning_rate": 4.86398647501153e-06, "loss": 0.8799, "step": 7014 }, { "epoch": 0.13, "learning_rate": 4.863936768742669e-06, "loss": 0.9839, "step": 7015 }, { "epoch": 0.13, "learning_rate": 4.863887053646939e-06, "loss": 0.7315, "step": 7016 }, { "epoch": 0.13, "learning_rate": 4.8638373297245275e-06, "loss": 0.945, "step": 7017 }, { "epoch": 0.13, "learning_rate": 4.8637875969756196e-06, "loss": 1.2266, "step": 7018 }, { "epoch": 0.13, "learning_rate": 4.863737855400402e-06, "loss": 1.0921, "step": 7019 }, { "epoch": 0.13, "learning_rate": 4.86368810499906e-06, "loss": 0.7393, "step": 7020 }, { "epoch": 0.13, "learning_rate": 4.863638345771778e-06, "loss": 0.9813, "step": 7021 }, { "epoch": 0.13, "learning_rate": 4.863588577718744e-06, "loss": 1.0942, "step": 7022 }, { "epoch": 0.13, "learning_rate": 4.863538800840142e-06, "loss": 0.9374, "step": 7023 }, { "epoch": 0.13, "learning_rate": 4.863489015136159e-06, "loss": 0.9677, "step": 7024 }, { "epoch": 0.13, "learning_rate": 4.86343922060698e-06, "loss": 1.0363, "step": 7025 }, { "epoch": 0.13, "learning_rate": 4.863389417252792e-06, "loss": 0.93, "step": 7026 }, { "epoch": 0.13, "learning_rate": 4.863339605073779e-06, "loss": 0.7177, "step": 7027 }, { "epoch": 0.13, "learning_rate": 4.86328978407013e-06, "loss": 0.9575, "step": 7028 }, { "epoch": 0.13, "learning_rate": 4.863239954242028e-06, "loss": 0.8399, "step": 7029 }, { "epoch": 0.13, "learning_rate": 4.863190115589662e-06, "loss": 0.9402, "step": 7030 }, { "epoch": 0.13, "learning_rate": 4.863140268113215e-06, "loss": 0.863, "step": 7031 }, { "epoch": 0.13, "learning_rate": 4.8630904118128765e-06, "loss": 0.9171, "step": 7032 }, { "epoch": 0.13, "learning_rate": 4.863040546688829e-06, "loss": 0.8121, "step": 7033 }, { "epoch": 0.13, "learning_rate": 4.862990672741262e-06, "loss": 0.9974, "step": 7034 }, { "epoch": 0.13, "learning_rate": 4.862940789970359e-06, "loss": 0.7972, "step": 7035 }, { "epoch": 0.13, "learning_rate": 4.862890898376309e-06, "loss": 1.0156, "step": 7036 }, { "epoch": 0.13, "learning_rate": 4.862840997959296e-06, "loss": 0.9599, "step": 7037 }, { "epoch": 0.13, "learning_rate": 4.862791088719507e-06, "loss": 0.9719, "step": 7038 }, { "epoch": 0.13, "learning_rate": 4.862741170657129e-06, "loss": 0.7965, "step": 7039 }, { "epoch": 0.13, "learning_rate": 4.862691243772348e-06, "loss": 1.0071, "step": 7040 }, { "epoch": 0.13, "learning_rate": 4.8626413080653505e-06, "loss": 0.9739, "step": 7041 }, { "epoch": 0.13, "learning_rate": 4.862591363536322e-06, "loss": 1.0688, "step": 7042 }, { "epoch": 0.13, "learning_rate": 4.86254141018545e-06, "loss": 1.1717, "step": 7043 }, { "epoch": 0.13, "learning_rate": 4.8624914480129206e-06, "loss": 0.8647, "step": 7044 }, { "epoch": 0.13, "learning_rate": 4.862441477018921e-06, "loss": 0.8184, "step": 7045 }, { "epoch": 0.13, "learning_rate": 4.862391497203637e-06, "loss": 0.7211, "step": 7046 }, { "epoch": 0.13, "learning_rate": 4.862341508567256e-06, "loss": 0.941, "step": 7047 }, { "epoch": 0.13, "learning_rate": 4.862291511109964e-06, "loss": 0.9413, "step": 7048 }, { "epoch": 0.13, "learning_rate": 4.8622415048319486e-06, "loss": 1.1392, "step": 7049 }, { "epoch": 0.13, "learning_rate": 4.862191489733395e-06, "loss": 1.2463, "step": 7050 }, { "epoch": 0.13, "learning_rate": 4.86214146581449e-06, "loss": 0.9224, "step": 7051 }, { "epoch": 0.13, "learning_rate": 4.862091433075423e-06, "loss": 0.9774, "step": 7052 }, { "epoch": 0.13, "learning_rate": 4.862041391516378e-06, "loss": 0.8883, "step": 7053 }, { "epoch": 0.13, "learning_rate": 4.861991341137543e-06, "loss": 0.9519, "step": 7054 }, { "epoch": 0.13, "learning_rate": 4.861941281939105e-06, "loss": 0.9856, "step": 7055 }, { "epoch": 0.13, "learning_rate": 4.86189121392125e-06, "loss": 1.1699, "step": 7056 }, { "epoch": 0.13, "learning_rate": 4.8618411370841665e-06, "loss": 1.0776, "step": 7057 }, { "epoch": 0.13, "learning_rate": 4.86179105142804e-06, "loss": 0.9667, "step": 7058 }, { "epoch": 0.13, "learning_rate": 4.861740956953059e-06, "loss": 0.8817, "step": 7059 }, { "epoch": 0.13, "learning_rate": 4.8616908536594085e-06, "loss": 0.8617, "step": 7060 }, { "epoch": 0.13, "learning_rate": 4.861640741547278e-06, "loss": 0.9924, "step": 7061 }, { "epoch": 0.13, "learning_rate": 4.861590620616852e-06, "loss": 0.9594, "step": 7062 }, { "epoch": 0.13, "learning_rate": 4.86154049086832e-06, "loss": 1.1561, "step": 7063 }, { "epoch": 0.13, "learning_rate": 4.861490352301868e-06, "loss": 0.884, "step": 7064 }, { "epoch": 0.13, "learning_rate": 4.8614402049176834e-06, "loss": 1.0148, "step": 7065 }, { "epoch": 0.13, "learning_rate": 4.861390048715954e-06, "loss": 0.9485, "step": 7066 }, { "epoch": 0.13, "learning_rate": 4.861339883696865e-06, "loss": 0.9146, "step": 7067 }, { "epoch": 0.13, "learning_rate": 4.861289709860607e-06, "loss": 1.0791, "step": 7068 }, { "epoch": 0.13, "learning_rate": 4.861239527207365e-06, "loss": 0.941, "step": 7069 }, { "epoch": 0.13, "learning_rate": 4.861189335737327e-06, "loss": 1.0045, "step": 7070 }, { "epoch": 0.13, "learning_rate": 4.86113913545068e-06, "loss": 0.9269, "step": 7071 }, { "epoch": 0.13, "learning_rate": 4.861088926347613e-06, "loss": 0.9307, "step": 7072 }, { "epoch": 0.13, "learning_rate": 4.861038708428311e-06, "loss": 0.8606, "step": 7073 }, { "epoch": 0.13, "learning_rate": 4.860988481692963e-06, "loss": 0.9528, "step": 7074 }, { "epoch": 0.13, "learning_rate": 4.860938246141757e-06, "loss": 1.1129, "step": 7075 }, { "epoch": 0.13, "learning_rate": 4.86088800177488e-06, "loss": 1.037, "step": 7076 }, { "epoch": 0.13, "learning_rate": 4.860837748592519e-06, "loss": 1.0064, "step": 7077 }, { "epoch": 0.13, "learning_rate": 4.860787486594863e-06, "loss": 0.9094, "step": 7078 }, { "epoch": 0.13, "learning_rate": 4.8607372157820985e-06, "loss": 0.9, "step": 7079 }, { "epoch": 0.13, "learning_rate": 4.860686936154413e-06, "loss": 0.9597, "step": 7080 }, { "epoch": 0.13, "learning_rate": 4.860636647711996e-06, "loss": 1.0758, "step": 7081 }, { "epoch": 0.13, "learning_rate": 4.860586350455033e-06, "loss": 1.01, "step": 7082 }, { "epoch": 0.13, "learning_rate": 4.860536044383714e-06, "loss": 0.7154, "step": 7083 }, { "epoch": 0.13, "learning_rate": 4.860485729498225e-06, "loss": 0.8926, "step": 7084 }, { "epoch": 0.13, "learning_rate": 4.860435405798756e-06, "loss": 0.7578, "step": 7085 }, { "epoch": 0.13, "learning_rate": 4.860385073285492e-06, "loss": 0.9672, "step": 7086 }, { "epoch": 0.13, "learning_rate": 4.860334731958623e-06, "loss": 1.1543, "step": 7087 }, { "epoch": 0.13, "learning_rate": 4.860284381818336e-06, "loss": 0.9393, "step": 7088 }, { "epoch": 0.13, "learning_rate": 4.86023402286482e-06, "loss": 0.9527, "step": 7089 }, { "epoch": 0.13, "learning_rate": 4.860183655098263e-06, "loss": 0.9227, "step": 7090 }, { "epoch": 0.13, "learning_rate": 4.860133278518853e-06, "loss": 0.824, "step": 7091 }, { "epoch": 0.13, "learning_rate": 4.860082893126776e-06, "loss": 1.0455, "step": 7092 }, { "epoch": 0.13, "learning_rate": 4.860032498922222e-06, "loss": 0.8664, "step": 7093 }, { "epoch": 0.13, "learning_rate": 4.859982095905381e-06, "loss": 1.0098, "step": 7094 }, { "epoch": 0.13, "learning_rate": 4.859931684076438e-06, "loss": 0.9794, "step": 7095 }, { "epoch": 0.13, "learning_rate": 4.859881263435582e-06, "loss": 0.783, "step": 7096 }, { "epoch": 0.13, "learning_rate": 4.859830833983002e-06, "loss": 0.8965, "step": 7097 }, { "epoch": 0.13, "learning_rate": 4.859780395718886e-06, "loss": 0.8712, "step": 7098 }, { "epoch": 0.13, "learning_rate": 4.859729948643422e-06, "loss": 1.0459, "step": 7099 }, { "epoch": 0.13, "learning_rate": 4.859679492756799e-06, "loss": 1.1386, "step": 7100 }, { "epoch": 0.13, "learning_rate": 4.859629028059207e-06, "loss": 0.8986, "step": 7101 }, { "epoch": 0.13, "learning_rate": 4.85957855455083e-06, "loss": 0.9854, "step": 7102 }, { "epoch": 0.13, "learning_rate": 4.85952807223186e-06, "loss": 0.8843, "step": 7103 }, { "epoch": 0.13, "learning_rate": 4.859477581102484e-06, "loss": 0.9636, "step": 7104 }, { "epoch": 0.13, "learning_rate": 4.859427081162892e-06, "loss": 0.8566, "step": 7105 }, { "epoch": 0.13, "learning_rate": 4.8593765724132705e-06, "loss": 1.0541, "step": 7106 }, { "epoch": 0.13, "learning_rate": 4.85932605485381e-06, "loss": 1.1338, "step": 7107 }, { "epoch": 0.13, "learning_rate": 4.859275528484698e-06, "loss": 0.8564, "step": 7108 }, { "epoch": 0.13, "learning_rate": 4.859224993306124e-06, "loss": 1.0255, "step": 7109 }, { "epoch": 0.13, "learning_rate": 4.859174449318276e-06, "loss": 0.8914, "step": 7110 }, { "epoch": 0.13, "learning_rate": 4.859123896521343e-06, "loss": 0.8873, "step": 7111 }, { "epoch": 0.13, "learning_rate": 4.859073334915514e-06, "loss": 1.1281, "step": 7112 }, { "epoch": 0.13, "learning_rate": 4.859022764500976e-06, "loss": 1.0974, "step": 7113 }, { "epoch": 0.13, "learning_rate": 4.858972185277921e-06, "loss": 0.9918, "step": 7114 }, { "epoch": 0.13, "learning_rate": 4.858921597246535e-06, "loss": 0.9436, "step": 7115 }, { "epoch": 0.13, "learning_rate": 4.858871000407009e-06, "loss": 0.8492, "step": 7116 }, { "epoch": 0.13, "learning_rate": 4.85882039475953e-06, "loss": 0.7631, "step": 7117 }, { "epoch": 0.13, "learning_rate": 4.858769780304289e-06, "loss": 1.1443, "step": 7118 }, { "epoch": 0.13, "learning_rate": 4.858719157041474e-06, "loss": 0.8741, "step": 7119 }, { "epoch": 0.13, "learning_rate": 4.858668524971273e-06, "loss": 0.9693, "step": 7120 }, { "epoch": 0.13, "learning_rate": 4.858617884093877e-06, "loss": 0.9429, "step": 7121 }, { "epoch": 0.13, "learning_rate": 4.858567234409473e-06, "loss": 1.0335, "step": 7122 }, { "epoch": 0.13, "learning_rate": 4.858516575918253e-06, "loss": 1.0442, "step": 7123 }, { "epoch": 0.13, "learning_rate": 4.858465908620403e-06, "loss": 1.1102, "step": 7124 }, { "epoch": 0.13, "learning_rate": 4.858415232516113e-06, "loss": 1.0771, "step": 7125 }, { "epoch": 0.13, "learning_rate": 4.858364547605575e-06, "loss": 1.0606, "step": 7126 }, { "epoch": 0.13, "learning_rate": 4.858313853888975e-06, "loss": 0.8757, "step": 7127 }, { "epoch": 0.13, "learning_rate": 4.858263151366503e-06, "loss": 0.9259, "step": 7128 }, { "epoch": 0.13, "learning_rate": 4.858212440038349e-06, "loss": 0.8068, "step": 7129 }, { "epoch": 0.13, "learning_rate": 4.858161719904702e-06, "loss": 0.8496, "step": 7130 }, { "epoch": 0.13, "learning_rate": 4.858110990965752e-06, "loss": 0.9385, "step": 7131 }, { "epoch": 0.13, "learning_rate": 4.858060253221687e-06, "loss": 1.074, "step": 7132 }, { "epoch": 0.13, "learning_rate": 4.858009506672698e-06, "loss": 0.9151, "step": 7133 }, { "epoch": 0.13, "learning_rate": 4.857958751318973e-06, "loss": 0.8456, "step": 7134 }, { "epoch": 0.13, "learning_rate": 4.8579079871607024e-06, "loss": 0.91, "step": 7135 }, { "epoch": 0.13, "learning_rate": 4.857857214198077e-06, "loss": 1.0597, "step": 7136 }, { "epoch": 0.13, "learning_rate": 4.857806432431284e-06, "loss": 1.1598, "step": 7137 }, { "epoch": 0.13, "learning_rate": 4.857755641860514e-06, "loss": 0.8896, "step": 7138 }, { "epoch": 0.13, "learning_rate": 4.857704842485958e-06, "loss": 1.0123, "step": 7139 }, { "epoch": 0.13, "learning_rate": 4.8576540343078025e-06, "loss": 0.9772, "step": 7140 }, { "epoch": 0.13, "learning_rate": 4.85760321732624e-06, "loss": 1.0327, "step": 7141 }, { "epoch": 0.13, "learning_rate": 4.857552391541459e-06, "loss": 1.0591, "step": 7142 }, { "epoch": 0.13, "learning_rate": 4.85750155695365e-06, "loss": 1.0973, "step": 7143 }, { "epoch": 0.13, "learning_rate": 4.857450713563002e-06, "loss": 1.0794, "step": 7144 }, { "epoch": 0.13, "learning_rate": 4.857399861369707e-06, "loss": 0.9487, "step": 7145 }, { "epoch": 0.13, "learning_rate": 4.8573490003739514e-06, "loss": 0.9197, "step": 7146 }, { "epoch": 0.13, "learning_rate": 4.857298130575927e-06, "loss": 0.8511, "step": 7147 }, { "epoch": 0.13, "learning_rate": 4.8572472519758246e-06, "loss": 1.085, "step": 7148 }, { "epoch": 0.13, "learning_rate": 4.857196364573833e-06, "loss": 1.1159, "step": 7149 }, { "epoch": 0.13, "learning_rate": 4.857145468370142e-06, "loss": 1.1718, "step": 7150 }, { "epoch": 0.13, "learning_rate": 4.857094563364943e-06, "loss": 0.9665, "step": 7151 }, { "epoch": 0.13, "learning_rate": 4.857043649558424e-06, "loss": 0.8743, "step": 7152 }, { "epoch": 0.13, "learning_rate": 4.856992726950777e-06, "loss": 0.8843, "step": 7153 }, { "epoch": 0.13, "learning_rate": 4.85694179554219e-06, "loss": 0.7327, "step": 7154 }, { "epoch": 0.13, "learning_rate": 4.856890855332856e-06, "loss": 0.9493, "step": 7155 }, { "epoch": 0.14, "learning_rate": 4.856839906322965e-06, "loss": 1.1536, "step": 7156 }, { "epoch": 0.14, "learning_rate": 4.856788948512704e-06, "loss": 0.8793, "step": 7157 }, { "epoch": 0.14, "learning_rate": 4.8567379819022655e-06, "loss": 0.8211, "step": 7158 }, { "epoch": 0.14, "learning_rate": 4.85668700649184e-06, "loss": 0.9132, "step": 7159 }, { "epoch": 0.14, "learning_rate": 4.856636022281618e-06, "loss": 1.1182, "step": 7160 }, { "epoch": 0.14, "learning_rate": 4.856585029271788e-06, "loss": 0.9634, "step": 7161 }, { "epoch": 0.14, "learning_rate": 4.856534027462544e-06, "loss": 1.2101, "step": 7162 }, { "epoch": 0.14, "learning_rate": 4.856483016854072e-06, "loss": 1.1572, "step": 7163 }, { "epoch": 0.14, "learning_rate": 4.8564319974465665e-06, "loss": 0.986, "step": 7164 }, { "epoch": 0.14, "learning_rate": 4.856380969240216e-06, "loss": 0.861, "step": 7165 }, { "epoch": 0.14, "learning_rate": 4.856329932235209e-06, "loss": 1.0116, "step": 7166 }, { "epoch": 0.14, "learning_rate": 4.85627888643174e-06, "loss": 0.9886, "step": 7167 }, { "epoch": 0.14, "learning_rate": 4.8562278318299975e-06, "loss": 1.0457, "step": 7168 }, { "epoch": 0.14, "learning_rate": 4.856176768430173e-06, "loss": 1.2575, "step": 7169 }, { "epoch": 0.14, "learning_rate": 4.856125696232456e-06, "loss": 0.8593, "step": 7170 }, { "epoch": 0.14, "learning_rate": 4.856074615237039e-06, "loss": 0.914, "step": 7171 }, { "epoch": 0.14, "learning_rate": 4.85602352544411e-06, "loss": 0.8206, "step": 7172 }, { "epoch": 0.14, "learning_rate": 4.855972426853862e-06, "loss": 0.8311, "step": 7173 }, { "epoch": 0.14, "learning_rate": 4.855921319466486e-06, "loss": 0.9516, "step": 7174 }, { "epoch": 0.14, "learning_rate": 4.855870203282171e-06, "loss": 1.0677, "step": 7175 }, { "epoch": 0.14, "learning_rate": 4.855819078301109e-06, "loss": 1.1368, "step": 7176 }, { "epoch": 0.14, "learning_rate": 4.855767944523492e-06, "loss": 1.0508, "step": 7177 }, { "epoch": 0.14, "learning_rate": 4.855716801949508e-06, "loss": 1.0095, "step": 7178 }, { "epoch": 0.14, "learning_rate": 4.855665650579351e-06, "loss": 0.6688, "step": 7179 }, { "epoch": 0.14, "learning_rate": 4.85561449041321e-06, "loss": 0.8934, "step": 7180 }, { "epoch": 0.14, "learning_rate": 4.855563321451277e-06, "loss": 1.1765, "step": 7181 }, { "epoch": 0.14, "learning_rate": 4.855512143693743e-06, "loss": 1.106, "step": 7182 }, { "epoch": 0.14, "learning_rate": 4.855460957140798e-06, "loss": 1.1994, "step": 7183 }, { "epoch": 0.14, "learning_rate": 4.855409761792635e-06, "loss": 0.9885, "step": 7184 }, { "epoch": 0.14, "learning_rate": 4.8553585576494435e-06, "loss": 0.8716, "step": 7185 }, { "epoch": 0.14, "learning_rate": 4.8553073447114165e-06, "loss": 0.8926, "step": 7186 }, { "epoch": 0.14, "learning_rate": 4.855256122978743e-06, "loss": 1.1214, "step": 7187 }, { "epoch": 0.14, "learning_rate": 4.855204892451615e-06, "loss": 1.0723, "step": 7188 }, { "epoch": 0.14, "learning_rate": 4.855153653130225e-06, "loss": 0.968, "step": 7189 }, { "epoch": 0.14, "learning_rate": 4.855102405014763e-06, "loss": 0.9305, "step": 7190 }, { "epoch": 0.14, "learning_rate": 4.8550511481054214e-06, "loss": 0.937, "step": 7191 }, { "epoch": 0.14, "learning_rate": 4.85499988240239e-06, "loss": 0.9187, "step": 7192 }, { "epoch": 0.14, "learning_rate": 4.8549486079058625e-06, "loss": 1.0086, "step": 7193 }, { "epoch": 0.14, "learning_rate": 4.854897324616028e-06, "loss": 1.1396, "step": 7194 }, { "epoch": 0.14, "learning_rate": 4.854846032533081e-06, "loss": 1.0268, "step": 7195 }, { "epoch": 0.14, "learning_rate": 4.854794731657209e-06, "loss": 0.9283, "step": 7196 }, { "epoch": 0.14, "learning_rate": 4.854743421988606e-06, "loss": 0.9512, "step": 7197 }, { "epoch": 0.14, "learning_rate": 4.8546921035274645e-06, "loss": 0.7983, "step": 7198 }, { "epoch": 0.14, "learning_rate": 4.854640776273973e-06, "loss": 1.157, "step": 7199 }, { "epoch": 0.14, "learning_rate": 4.854589440228327e-06, "loss": 1.1974, "step": 7200 }, { "epoch": 0.14, "learning_rate": 4.854538095390715e-06, "loss": 1.0056, "step": 7201 }, { "epoch": 0.14, "learning_rate": 4.854486741761329e-06, "loss": 0.9227, "step": 7202 }, { "epoch": 0.14, "learning_rate": 4.8544353793403634e-06, "loss": 0.9933, "step": 7203 }, { "epoch": 0.14, "learning_rate": 4.854384008128008e-06, "loss": 1.079, "step": 7204 }, { "epoch": 0.14, "learning_rate": 4.854332628124455e-06, "loss": 0.9066, "step": 7205 }, { "epoch": 0.14, "learning_rate": 4.854281239329895e-06, "loss": 1.0903, "step": 7206 }, { "epoch": 0.14, "learning_rate": 4.854229841744522e-06, "loss": 0.8667, "step": 7207 }, { "epoch": 0.14, "learning_rate": 4.854178435368527e-06, "loss": 1.0233, "step": 7208 }, { "epoch": 0.14, "learning_rate": 4.854127020202102e-06, "loss": 0.9124, "step": 7209 }, { "epoch": 0.14, "learning_rate": 4.854075596245439e-06, "loss": 0.8483, "step": 7210 }, { "epoch": 0.14, "learning_rate": 4.85402416349873e-06, "loss": 1.0953, "step": 7211 }, { "epoch": 0.14, "learning_rate": 4.853972721962166e-06, "loss": 1.1222, "step": 7212 }, { "epoch": 0.14, "learning_rate": 4.8539212716359405e-06, "loss": 1.2044, "step": 7213 }, { "epoch": 0.14, "learning_rate": 4.853869812520245e-06, "loss": 0.9755, "step": 7214 }, { "epoch": 0.14, "learning_rate": 4.853818344615272e-06, "loss": 0.9541, "step": 7215 }, { "epoch": 0.14, "learning_rate": 4.853766867921214e-06, "loss": 1.0217, "step": 7216 }, { "epoch": 0.14, "learning_rate": 4.853715382438261e-06, "loss": 1.0652, "step": 7217 }, { "epoch": 0.14, "learning_rate": 4.853663888166609e-06, "loss": 0.9521, "step": 7218 }, { "epoch": 0.14, "learning_rate": 4.8536123851064466e-06, "loss": 1.0895, "step": 7219 }, { "epoch": 0.14, "learning_rate": 4.853560873257968e-06, "loss": 0.9075, "step": 7220 }, { "epoch": 0.14, "learning_rate": 4.853509352621366e-06, "loss": 1.0605, "step": 7221 }, { "epoch": 0.14, "learning_rate": 4.853457823196832e-06, "loss": 0.9774, "step": 7222 }, { "epoch": 0.14, "learning_rate": 4.853406284984558e-06, "loss": 0.9319, "step": 7223 }, { "epoch": 0.14, "learning_rate": 4.853354737984738e-06, "loss": 1.0457, "step": 7224 }, { "epoch": 0.14, "learning_rate": 4.853303182197563e-06, "loss": 0.851, "step": 7225 }, { "epoch": 0.14, "learning_rate": 4.8532516176232256e-06, "loss": 0.785, "step": 7226 }, { "epoch": 0.14, "learning_rate": 4.85320004426192e-06, "loss": 0.9596, "step": 7227 }, { "epoch": 0.14, "learning_rate": 4.853148462113837e-06, "loss": 0.8879, "step": 7228 }, { "epoch": 0.14, "learning_rate": 4.85309687117917e-06, "loss": 0.7495, "step": 7229 }, { "epoch": 0.14, "learning_rate": 4.853045271458111e-06, "loss": 0.9393, "step": 7230 }, { "epoch": 0.14, "learning_rate": 4.852993662950853e-06, "loss": 0.9997, "step": 7231 }, { "epoch": 0.14, "learning_rate": 4.8529420456575895e-06, "loss": 0.8181, "step": 7232 }, { "epoch": 0.14, "learning_rate": 4.852890419578512e-06, "loss": 0.955, "step": 7233 }, { "epoch": 0.14, "learning_rate": 4.852838784713815e-06, "loss": 0.8854, "step": 7234 }, { "epoch": 0.14, "learning_rate": 4.852787141063689e-06, "loss": 0.9795, "step": 7235 }, { "epoch": 0.14, "learning_rate": 4.8527354886283275e-06, "loss": 0.6837, "step": 7236 }, { "epoch": 0.14, "learning_rate": 4.852683827407924e-06, "loss": 1.067, "step": 7237 }, { "epoch": 0.14, "learning_rate": 4.852632157402672e-06, "loss": 1.0626, "step": 7238 }, { "epoch": 0.14, "learning_rate": 4.852580478612764e-06, "loss": 1.254, "step": 7239 }, { "epoch": 0.14, "learning_rate": 4.852528791038391e-06, "loss": 0.9014, "step": 7240 }, { "epoch": 0.14, "learning_rate": 4.852477094679748e-06, "loss": 0.8899, "step": 7241 }, { "epoch": 0.14, "learning_rate": 4.852425389537029e-06, "loss": 1.0309, "step": 7242 }, { "epoch": 0.14, "learning_rate": 4.852373675610424e-06, "loss": 1.0963, "step": 7243 }, { "epoch": 0.14, "learning_rate": 4.852321952900129e-06, "loss": 1.0389, "step": 7244 }, { "epoch": 0.14, "learning_rate": 4.852270221406336e-06, "loss": 1.02, "step": 7245 }, { "epoch": 0.14, "learning_rate": 4.852218481129238e-06, "loss": 0.9154, "step": 7246 }, { "epoch": 0.14, "learning_rate": 4.852166732069028e-06, "loss": 0.9119, "step": 7247 }, { "epoch": 0.14, "learning_rate": 4.8521149742259e-06, "loss": 0.8375, "step": 7248 }, { "epoch": 0.14, "learning_rate": 4.852063207600046e-06, "loss": 0.9998, "step": 7249 }, { "epoch": 0.14, "learning_rate": 4.852011432191661e-06, "loss": 1.1245, "step": 7250 }, { "epoch": 0.14, "learning_rate": 4.8519596480009364e-06, "loss": 0.874, "step": 7251 }, { "epoch": 0.14, "learning_rate": 4.851907855028068e-06, "loss": 0.9726, "step": 7252 }, { "epoch": 0.14, "learning_rate": 4.851856053273246e-06, "loss": 1.0214, "step": 7253 }, { "epoch": 0.14, "learning_rate": 4.851804242736667e-06, "loss": 0.938, "step": 7254 }, { "epoch": 0.14, "learning_rate": 4.851752423418523e-06, "loss": 0.9977, "step": 7255 }, { "epoch": 0.14, "learning_rate": 4.851700595319006e-06, "loss": 1.0705, "step": 7256 }, { "epoch": 0.14, "learning_rate": 4.851648758438313e-06, "loss": 1.0331, "step": 7257 }, { "epoch": 0.14, "learning_rate": 4.851596912776635e-06, "loss": 0.9041, "step": 7258 }, { "epoch": 0.14, "learning_rate": 4.851545058334166e-06, "loss": 1.1143, "step": 7259 }, { "epoch": 0.14, "learning_rate": 4.8514931951111e-06, "loss": 0.9285, "step": 7260 }, { "epoch": 0.14, "learning_rate": 4.851441323107631e-06, "loss": 1.0251, "step": 7261 }, { "epoch": 0.14, "learning_rate": 4.8513894423239514e-06, "loss": 1.2021, "step": 7262 }, { "epoch": 0.14, "learning_rate": 4.851337552760256e-06, "loss": 1.0106, "step": 7263 }, { "epoch": 0.14, "learning_rate": 4.851285654416738e-06, "loss": 1.0177, "step": 7264 }, { "epoch": 0.14, "learning_rate": 4.851233747293592e-06, "loss": 0.8859, "step": 7265 }, { "epoch": 0.14, "learning_rate": 4.851181831391011e-06, "loss": 0.9571, "step": 7266 }, { "epoch": 0.14, "learning_rate": 4.851129906709189e-06, "loss": 0.8146, "step": 7267 }, { "epoch": 0.14, "learning_rate": 4.85107797324832e-06, "loss": 1.0051, "step": 7268 }, { "epoch": 0.14, "learning_rate": 4.851026031008598e-06, "loss": 0.9401, "step": 7269 }, { "epoch": 0.14, "learning_rate": 4.850974079990217e-06, "loss": 0.7987, "step": 7270 }, { "epoch": 0.14, "learning_rate": 4.850922120193371e-06, "loss": 0.9626, "step": 7271 }, { "epoch": 0.14, "learning_rate": 4.850870151618253e-06, "loss": 0.9631, "step": 7272 }, { "epoch": 0.14, "learning_rate": 4.85081817426506e-06, "loss": 0.8975, "step": 7273 }, { "epoch": 0.14, "learning_rate": 4.850766188133982e-06, "loss": 0.9439, "step": 7274 }, { "epoch": 0.14, "learning_rate": 4.850714193225215e-06, "loss": 1.1049, "step": 7275 }, { "epoch": 0.14, "learning_rate": 4.850662189538955e-06, "loss": 0.7785, "step": 7276 }, { "epoch": 0.14, "learning_rate": 4.850610177075393e-06, "loss": 0.949, "step": 7277 }, { "epoch": 0.14, "learning_rate": 4.850558155834726e-06, "loss": 0.9417, "step": 7278 }, { "epoch": 0.14, "learning_rate": 4.850506125817146e-06, "loss": 0.7826, "step": 7279 }, { "epoch": 0.14, "learning_rate": 4.850454087022847e-06, "loss": 0.9444, "step": 7280 }, { "epoch": 0.14, "learning_rate": 4.850402039452026e-06, "loss": 0.9842, "step": 7281 }, { "epoch": 0.14, "learning_rate": 4.850349983104876e-06, "loss": 0.9611, "step": 7282 }, { "epoch": 0.14, "learning_rate": 4.850297917981591e-06, "loss": 0.9225, "step": 7283 }, { "epoch": 0.14, "learning_rate": 4.850245844082366e-06, "loss": 1.0095, "step": 7284 }, { "epoch": 0.14, "learning_rate": 4.850193761407394e-06, "loss": 0.843, "step": 7285 }, { "epoch": 0.14, "learning_rate": 4.850141669956872e-06, "loss": 1.2025, "step": 7286 }, { "epoch": 0.14, "learning_rate": 4.850089569730992e-06, "loss": 1.0786, "step": 7287 }, { "epoch": 0.14, "learning_rate": 4.850037460729949e-06, "loss": 0.9301, "step": 7288 }, { "epoch": 0.14, "learning_rate": 4.84998534295394e-06, "loss": 1.0214, "step": 7289 }, { "epoch": 0.14, "learning_rate": 4.8499332164031565e-06, "loss": 0.8944, "step": 7290 }, { "epoch": 0.14, "learning_rate": 4.849881081077794e-06, "loss": 0.9276, "step": 7291 }, { "epoch": 0.14, "learning_rate": 4.849828936978049e-06, "loss": 0.942, "step": 7292 }, { "epoch": 0.14, "learning_rate": 4.849776784104114e-06, "loss": 1.213, "step": 7293 }, { "epoch": 0.14, "learning_rate": 4.849724622456184e-06, "loss": 1.1014, "step": 7294 }, { "epoch": 0.14, "learning_rate": 4.8496724520344555e-06, "loss": 1.0307, "step": 7295 }, { "epoch": 0.14, "learning_rate": 4.849620272839122e-06, "loss": 0.9865, "step": 7296 }, { "epoch": 0.14, "learning_rate": 4.849568084870377e-06, "loss": 0.9084, "step": 7297 }, { "epoch": 0.14, "learning_rate": 4.849515888128419e-06, "loss": 0.7249, "step": 7298 }, { "epoch": 0.14, "learning_rate": 4.849463682613439e-06, "loss": 1.0123, "step": 7299 }, { "epoch": 0.14, "learning_rate": 4.849411468325634e-06, "loss": 1.029, "step": 7300 }, { "epoch": 0.14, "learning_rate": 4.849359245265199e-06, "loss": 0.9035, "step": 7301 }, { "epoch": 0.14, "learning_rate": 4.849307013432328e-06, "loss": 0.9342, "step": 7302 }, { "epoch": 0.14, "learning_rate": 4.849254772827217e-06, "loss": 0.9404, "step": 7303 }, { "epoch": 0.14, "learning_rate": 4.849202523450061e-06, "loss": 0.8813, "step": 7304 }, { "epoch": 0.14, "learning_rate": 4.8491502653010546e-06, "loss": 0.9857, "step": 7305 }, { "epoch": 0.14, "learning_rate": 4.849097998380393e-06, "loss": 1.1024, "step": 7306 }, { "epoch": 0.14, "learning_rate": 4.849045722688271e-06, "loss": 1.0316, "step": 7307 }, { "epoch": 0.14, "learning_rate": 4.848993438224885e-06, "loss": 0.8168, "step": 7308 }, { "epoch": 0.14, "learning_rate": 4.84894114499043e-06, "loss": 0.9171, "step": 7309 }, { "epoch": 0.14, "learning_rate": 4.8488888429850996e-06, "loss": 0.8247, "step": 7310 }, { "epoch": 0.14, "learning_rate": 4.848836532209091e-06, "loss": 0.8755, "step": 7311 }, { "epoch": 0.14, "learning_rate": 4.848784212662598e-06, "loss": 1.2488, "step": 7312 }, { "epoch": 0.14, "learning_rate": 4.848731884345818e-06, "loss": 1.1293, "step": 7313 }, { "epoch": 0.14, "learning_rate": 4.848679547258944e-06, "loss": 1.0115, "step": 7314 }, { "epoch": 0.14, "learning_rate": 4.848627201402174e-06, "loss": 0.8047, "step": 7315 }, { "epoch": 0.14, "learning_rate": 4.848574846775701e-06, "loss": 0.874, "step": 7316 }, { "epoch": 0.14, "learning_rate": 4.848522483379722e-06, "loss": 0.9383, "step": 7317 }, { "epoch": 0.14, "learning_rate": 4.848470111214431e-06, "loss": 0.8248, "step": 7318 }, { "epoch": 0.14, "learning_rate": 4.848417730280026e-06, "loss": 1.0223, "step": 7319 }, { "epoch": 0.14, "learning_rate": 4.848365340576701e-06, "loss": 1.0372, "step": 7320 }, { "epoch": 0.14, "learning_rate": 4.848312942104651e-06, "loss": 0.9531, "step": 7321 }, { "epoch": 0.14, "learning_rate": 4.8482605348640736e-06, "loss": 0.9838, "step": 7322 }, { "epoch": 0.14, "learning_rate": 4.848208118855162e-06, "loss": 0.954, "step": 7323 }, { "epoch": 0.14, "learning_rate": 4.848155694078113e-06, "loss": 0.9316, "step": 7324 }, { "epoch": 0.14, "learning_rate": 4.848103260533125e-06, "loss": 0.8957, "step": 7325 }, { "epoch": 0.14, "learning_rate": 4.84805081822039e-06, "loss": 0.9969, "step": 7326 }, { "epoch": 0.14, "learning_rate": 4.847998367140104e-06, "loss": 0.942, "step": 7327 }, { "epoch": 0.14, "learning_rate": 4.8479459072924665e-06, "loss": 0.981, "step": 7328 }, { "epoch": 0.14, "learning_rate": 4.847893438677669e-06, "loss": 0.9933, "step": 7329 }, { "epoch": 0.14, "learning_rate": 4.8478409612959095e-06, "loss": 1.0311, "step": 7330 }, { "epoch": 0.14, "learning_rate": 4.847788475147386e-06, "loss": 1.2354, "step": 7331 }, { "epoch": 0.14, "learning_rate": 4.84773598023229e-06, "loss": 1.0773, "step": 7332 }, { "epoch": 0.14, "learning_rate": 4.84768347655082e-06, "loss": 1.0139, "step": 7333 }, { "epoch": 0.14, "learning_rate": 4.847630964103173e-06, "loss": 0.948, "step": 7334 }, { "epoch": 0.14, "learning_rate": 4.847578442889543e-06, "loss": 0.9795, "step": 7335 }, { "epoch": 0.14, "learning_rate": 4.847525912910128e-06, "loss": 0.9724, "step": 7336 }, { "epoch": 0.14, "learning_rate": 4.847473374165123e-06, "loss": 1.0245, "step": 7337 }, { "epoch": 0.14, "learning_rate": 4.847420826654724e-06, "loss": 1.0637, "step": 7338 }, { "epoch": 0.14, "learning_rate": 4.847368270379128e-06, "loss": 0.9547, "step": 7339 }, { "epoch": 0.14, "learning_rate": 4.847315705338531e-06, "loss": 1.1406, "step": 7340 }, { "epoch": 0.14, "learning_rate": 4.847263131533129e-06, "loss": 0.9523, "step": 7341 }, { "epoch": 0.14, "learning_rate": 4.847210548963118e-06, "loss": 0.8428, "step": 7342 }, { "epoch": 0.14, "learning_rate": 4.847157957628695e-06, "loss": 1.0203, "step": 7343 }, { "epoch": 0.14, "learning_rate": 4.847105357530056e-06, "loss": 1.0753, "step": 7344 }, { "epoch": 0.14, "learning_rate": 4.8470527486673974e-06, "loss": 0.9259, "step": 7345 }, { "epoch": 0.14, "learning_rate": 4.847000131040917e-06, "loss": 1.1548, "step": 7346 }, { "epoch": 0.14, "learning_rate": 4.846947504650809e-06, "loss": 0.868, "step": 7347 }, { "epoch": 0.14, "learning_rate": 4.84689486949727e-06, "loss": 0.8878, "step": 7348 }, { "epoch": 0.14, "learning_rate": 4.846842225580499e-06, "loss": 1.0572, "step": 7349 }, { "epoch": 0.14, "learning_rate": 4.8467895729006906e-06, "loss": 1.0751, "step": 7350 }, { "epoch": 0.14, "learning_rate": 4.846736911458042e-06, "loss": 0.8252, "step": 7351 }, { "epoch": 0.14, "learning_rate": 4.84668424125275e-06, "loss": 0.8647, "step": 7352 }, { "epoch": 0.14, "learning_rate": 4.846631562285011e-06, "loss": 0.8572, "step": 7353 }, { "epoch": 0.14, "learning_rate": 4.8465788745550214e-06, "loss": 0.7397, "step": 7354 }, { "epoch": 0.14, "learning_rate": 4.846526178062978e-06, "loss": 1.1673, "step": 7355 }, { "epoch": 0.14, "learning_rate": 4.846473472809078e-06, "loss": 1.1401, "step": 7356 }, { "epoch": 0.14, "learning_rate": 4.846420758793518e-06, "loss": 1.067, "step": 7357 }, { "epoch": 0.14, "learning_rate": 4.846368036016495e-06, "loss": 0.9197, "step": 7358 }, { "epoch": 0.14, "learning_rate": 4.846315304478206e-06, "loss": 0.749, "step": 7359 }, { "epoch": 0.14, "learning_rate": 4.846262564178847e-06, "loss": 0.8076, "step": 7360 }, { "epoch": 0.14, "learning_rate": 4.846209815118615e-06, "loss": 0.8395, "step": 7361 }, { "epoch": 0.14, "learning_rate": 4.846157057297709e-06, "loss": 1.0155, "step": 7362 }, { "epoch": 0.14, "learning_rate": 4.846104290716323e-06, "loss": 1.0013, "step": 7363 }, { "epoch": 0.14, "learning_rate": 4.846051515374657e-06, "loss": 0.8678, "step": 7364 }, { "epoch": 0.14, "learning_rate": 4.845998731272905e-06, "loss": 0.8936, "step": 7365 }, { "epoch": 0.14, "learning_rate": 4.845945938411267e-06, "loss": 0.9598, "step": 7366 }, { "epoch": 0.14, "learning_rate": 4.845893136789938e-06, "loss": 0.9431, "step": 7367 }, { "epoch": 0.14, "learning_rate": 4.8458403264091154e-06, "loss": 1.1045, "step": 7368 }, { "epoch": 0.14, "learning_rate": 4.845787507268999e-06, "loss": 1.0765, "step": 7369 }, { "epoch": 0.14, "learning_rate": 4.8457346793697826e-06, "loss": 0.9488, "step": 7370 }, { "epoch": 0.14, "learning_rate": 4.845681842711664e-06, "loss": 0.8812, "step": 7371 }, { "epoch": 0.14, "learning_rate": 4.845628997294843e-06, "loss": 0.9595, "step": 7372 }, { "epoch": 0.14, "learning_rate": 4.845576143119514e-06, "loss": 0.8262, "step": 7373 }, { "epoch": 0.14, "learning_rate": 4.8455232801858765e-06, "loss": 1.1431, "step": 7374 }, { "epoch": 0.14, "learning_rate": 4.845470408494126e-06, "loss": 1.0489, "step": 7375 }, { "epoch": 0.14, "learning_rate": 4.845417528044462e-06, "loss": 0.8936, "step": 7376 }, { "epoch": 0.14, "learning_rate": 4.84536463883708e-06, "loss": 1.0391, "step": 7377 }, { "epoch": 0.14, "learning_rate": 4.845311740872179e-06, "loss": 1.0068, "step": 7378 }, { "epoch": 0.14, "learning_rate": 4.845258834149955e-06, "loss": 0.9686, "step": 7379 }, { "epoch": 0.14, "learning_rate": 4.845205918670607e-06, "loss": 0.877, "step": 7380 }, { "epoch": 0.14, "learning_rate": 4.845152994434332e-06, "loss": 1.1771, "step": 7381 }, { "epoch": 0.14, "learning_rate": 4.8451000614413276e-06, "loss": 1.0582, "step": 7382 }, { "epoch": 0.14, "learning_rate": 4.845047119691792e-06, "loss": 1.0956, "step": 7383 }, { "epoch": 0.14, "learning_rate": 4.844994169185922e-06, "loss": 0.9951, "step": 7384 }, { "epoch": 0.14, "learning_rate": 4.8449412099239154e-06, "loss": 0.9137, "step": 7385 }, { "epoch": 0.14, "learning_rate": 4.84488824190597e-06, "loss": 1.1985, "step": 7386 }, { "epoch": 0.14, "learning_rate": 4.844835265132284e-06, "loss": 1.2614, "step": 7387 }, { "epoch": 0.14, "learning_rate": 4.844782279603056e-06, "loss": 1.0383, "step": 7388 }, { "epoch": 0.14, "learning_rate": 4.844729285318482e-06, "loss": 0.9358, "step": 7389 }, { "epoch": 0.14, "learning_rate": 4.84467628227876e-06, "loss": 0.8433, "step": 7390 }, { "epoch": 0.14, "learning_rate": 4.84462327048409e-06, "loss": 0.8976, "step": 7391 }, { "epoch": 0.14, "learning_rate": 4.844570249934667e-06, "loss": 0.7926, "step": 7392 }, { "epoch": 0.14, "learning_rate": 4.844517220630692e-06, "loss": 1.0651, "step": 7393 }, { "epoch": 0.14, "learning_rate": 4.844464182572361e-06, "loss": 1.1779, "step": 7394 }, { "epoch": 0.14, "learning_rate": 4.844411135759873e-06, "loss": 1.0281, "step": 7395 }, { "epoch": 0.14, "learning_rate": 4.844358080193425e-06, "loss": 0.8238, "step": 7396 }, { "epoch": 0.14, "learning_rate": 4.844305015873216e-06, "loss": 0.9372, "step": 7397 }, { "epoch": 0.14, "learning_rate": 4.844251942799445e-06, "loss": 0.975, "step": 7398 }, { "epoch": 0.14, "learning_rate": 4.844198860972308e-06, "loss": 0.8777, "step": 7399 }, { "epoch": 0.14, "learning_rate": 4.844145770392005e-06, "loss": 1.201, "step": 7400 }, { "epoch": 0.14, "learning_rate": 4.844092671058733e-06, "loss": 0.961, "step": 7401 }, { "epoch": 0.14, "learning_rate": 4.844039562972691e-06, "loss": 1.0074, "step": 7402 }, { "epoch": 0.14, "learning_rate": 4.8439864461340776e-06, "loss": 0.7667, "step": 7403 }, { "epoch": 0.14, "learning_rate": 4.8439333205430905e-06, "loss": 0.824, "step": 7404 }, { "epoch": 0.14, "learning_rate": 4.843880186199927e-06, "loss": 1.0364, "step": 7405 }, { "epoch": 0.14, "learning_rate": 4.843827043104788e-06, "loss": 1.136, "step": 7406 }, { "epoch": 0.14, "learning_rate": 4.843773891257871e-06, "loss": 0.8949, "step": 7407 }, { "epoch": 0.14, "learning_rate": 4.843720730659374e-06, "loss": 0.98, "step": 7408 }, { "epoch": 0.14, "learning_rate": 4.843667561309495e-06, "loss": 1.0944, "step": 7409 }, { "epoch": 0.14, "learning_rate": 4.8436143832084335e-06, "loss": 0.8631, "step": 7410 }, { "epoch": 0.14, "learning_rate": 4.843561196356387e-06, "loss": 0.9843, "step": 7411 }, { "epoch": 0.14, "learning_rate": 4.843508000753557e-06, "loss": 1.1598, "step": 7412 }, { "epoch": 0.14, "learning_rate": 4.843454796400138e-06, "loss": 1.0038, "step": 7413 }, { "epoch": 0.14, "learning_rate": 4.843401583296331e-06, "loss": 1.0201, "step": 7414 }, { "epoch": 0.14, "learning_rate": 4.8433483614423344e-06, "loss": 0.8937, "step": 7415 }, { "epoch": 0.14, "learning_rate": 4.843295130838347e-06, "loss": 0.959, "step": 7416 }, { "epoch": 0.14, "learning_rate": 4.843241891484567e-06, "loss": 0.8439, "step": 7417 }, { "epoch": 0.14, "learning_rate": 4.8431886433811945e-06, "loss": 1.0582, "step": 7418 }, { "epoch": 0.14, "learning_rate": 4.843135386528427e-06, "loss": 1.0906, "step": 7419 }, { "epoch": 0.14, "learning_rate": 4.843082120926463e-06, "loss": 0.849, "step": 7420 }, { "epoch": 0.14, "learning_rate": 4.843028846575504e-06, "loss": 0.9175, "step": 7421 }, { "epoch": 0.14, "learning_rate": 4.842975563475746e-06, "loss": 0.9503, "step": 7422 }, { "epoch": 0.14, "learning_rate": 4.8429222716273895e-06, "loss": 0.9233, "step": 7423 }, { "epoch": 0.14, "learning_rate": 4.842868971030632e-06, "loss": 1.0314, "step": 7424 }, { "epoch": 0.14, "learning_rate": 4.8428156616856744e-06, "loss": 1.2141, "step": 7425 }, { "epoch": 0.14, "learning_rate": 4.8427623435927155e-06, "loss": 0.9898, "step": 7426 }, { "epoch": 0.14, "learning_rate": 4.842709016751953e-06, "loss": 0.9897, "step": 7427 }, { "epoch": 0.14, "learning_rate": 4.842655681163587e-06, "loss": 1.1802, "step": 7428 }, { "epoch": 0.14, "learning_rate": 4.842602336827816e-06, "loss": 0.9228, "step": 7429 }, { "epoch": 0.14, "learning_rate": 4.842548983744841e-06, "loss": 0.8509, "step": 7430 }, { "epoch": 0.14, "learning_rate": 4.84249562191486e-06, "loss": 1.0948, "step": 7431 }, { "epoch": 0.14, "learning_rate": 4.842442251338071e-06, "loss": 0.8519, "step": 7432 }, { "epoch": 0.14, "learning_rate": 4.842388872014675e-06, "loss": 0.8508, "step": 7433 }, { "epoch": 0.14, "learning_rate": 4.84233548394487e-06, "loss": 1.0956, "step": 7434 }, { "epoch": 0.14, "learning_rate": 4.842282087128857e-06, "loss": 0.8931, "step": 7435 }, { "epoch": 0.14, "learning_rate": 4.842228681566834e-06, "loss": 0.9134, "step": 7436 }, { "epoch": 0.14, "learning_rate": 4.842175267259002e-06, "loss": 1.0801, "step": 7437 }, { "epoch": 0.14, "learning_rate": 4.842121844205559e-06, "loss": 0.9702, "step": 7438 }, { "epoch": 0.14, "learning_rate": 4.842068412406704e-06, "loss": 0.796, "step": 7439 }, { "epoch": 0.14, "learning_rate": 4.842014971862638e-06, "loss": 0.8827, "step": 7440 }, { "epoch": 0.14, "learning_rate": 4.8419615225735586e-06, "loss": 0.805, "step": 7441 }, { "epoch": 0.14, "learning_rate": 4.841908064539668e-06, "loss": 0.7749, "step": 7442 }, { "epoch": 0.14, "learning_rate": 4.841854597761164e-06, "loss": 0.8377, "step": 7443 }, { "epoch": 0.14, "learning_rate": 4.841801122238248e-06, "loss": 1.1563, "step": 7444 }, { "epoch": 0.14, "learning_rate": 4.841747637971117e-06, "loss": 1.0547, "step": 7445 }, { "epoch": 0.14, "learning_rate": 4.841694144959972e-06, "loss": 0.7676, "step": 7446 }, { "epoch": 0.14, "learning_rate": 4.841640643205013e-06, "loss": 0.9859, "step": 7447 }, { "epoch": 0.14, "learning_rate": 4.8415871327064406e-06, "loss": 0.8864, "step": 7448 }, { "epoch": 0.14, "learning_rate": 4.841533613464453e-06, "loss": 0.9174, "step": 7449 }, { "epoch": 0.14, "learning_rate": 4.841480085479251e-06, "loss": 1.2018, "step": 7450 }, { "epoch": 0.14, "learning_rate": 4.841426548751034e-06, "loss": 0.8493, "step": 7451 }, { "epoch": 0.14, "learning_rate": 4.8413730032800015e-06, "loss": 0.8748, "step": 7452 }, { "epoch": 0.14, "learning_rate": 4.841319449066354e-06, "loss": 0.798, "step": 7453 }, { "epoch": 0.14, "learning_rate": 4.841265886110292e-06, "loss": 1.0078, "step": 7454 }, { "epoch": 0.14, "learning_rate": 4.8412123144120145e-06, "loss": 1.0679, "step": 7455 }, { "epoch": 0.14, "learning_rate": 4.8411587339717234e-06, "loss": 1.0549, "step": 7456 }, { "epoch": 0.14, "learning_rate": 4.841105144789616e-06, "loss": 1.0424, "step": 7457 }, { "epoch": 0.14, "learning_rate": 4.841051546865894e-06, "loss": 0.9335, "step": 7458 }, { "epoch": 0.14, "learning_rate": 4.8409979402007574e-06, "loss": 1.0008, "step": 7459 }, { "epoch": 0.14, "learning_rate": 4.840944324794407e-06, "loss": 0.877, "step": 7460 }, { "epoch": 0.14, "learning_rate": 4.840890700647041e-06, "loss": 0.8505, "step": 7461 }, { "epoch": 0.14, "learning_rate": 4.840837067758861e-06, "loss": 1.0184, "step": 7462 }, { "epoch": 0.14, "learning_rate": 4.840783426130068e-06, "loss": 0.9453, "step": 7463 }, { "epoch": 0.14, "learning_rate": 4.84072977576086e-06, "loss": 0.7497, "step": 7464 }, { "epoch": 0.14, "learning_rate": 4.840676116651441e-06, "loss": 0.9925, "step": 7465 }, { "epoch": 0.14, "learning_rate": 4.840622448802007e-06, "loss": 0.8383, "step": 7466 }, { "epoch": 0.14, "learning_rate": 4.8405687722127625e-06, "loss": 1.0075, "step": 7467 }, { "epoch": 0.14, "learning_rate": 4.840515086883905e-06, "loss": 1.1477, "step": 7468 }, { "epoch": 0.14, "learning_rate": 4.840461392815635e-06, "loss": 1.0033, "step": 7469 }, { "epoch": 0.14, "learning_rate": 4.840407690008155e-06, "loss": 1.0454, "step": 7470 }, { "epoch": 0.14, "learning_rate": 4.840353978461665e-06, "loss": 1.012, "step": 7471 }, { "epoch": 0.14, "learning_rate": 4.840300258176363e-06, "loss": 1.0862, "step": 7472 }, { "epoch": 0.14, "learning_rate": 4.840246529152454e-06, "loss": 0.8343, "step": 7473 }, { "epoch": 0.14, "learning_rate": 4.8401927913901345e-06, "loss": 0.9599, "step": 7474 }, { "epoch": 0.14, "learning_rate": 4.840139044889608e-06, "loss": 1.0728, "step": 7475 }, { "epoch": 0.14, "learning_rate": 4.840085289651073e-06, "loss": 1.094, "step": 7476 }, { "epoch": 0.14, "learning_rate": 4.840031525674732e-06, "loss": 0.9282, "step": 7477 }, { "epoch": 0.14, "learning_rate": 4.839977752960785e-06, "loss": 0.8439, "step": 7478 }, { "epoch": 0.14, "learning_rate": 4.8399239715094326e-06, "loss": 0.8189, "step": 7479 }, { "epoch": 0.14, "learning_rate": 4.839870181320876e-06, "loss": 1.1357, "step": 7480 }, { "epoch": 0.14, "learning_rate": 4.8398163823953155e-06, "loss": 1.0537, "step": 7481 }, { "epoch": 0.14, "learning_rate": 4.839762574732953e-06, "loss": 1.1086, "step": 7482 }, { "epoch": 0.14, "learning_rate": 4.839708758333989e-06, "loss": 0.8436, "step": 7483 }, { "epoch": 0.14, "learning_rate": 4.839654933198623e-06, "loss": 1.1183, "step": 7484 }, { "epoch": 0.14, "learning_rate": 4.839601099327057e-06, "loss": 0.9479, "step": 7485 }, { "epoch": 0.14, "learning_rate": 4.839547256719494e-06, "loss": 1.0088, "step": 7486 }, { "epoch": 0.14, "learning_rate": 4.839493405376132e-06, "loss": 1.1481, "step": 7487 }, { "epoch": 0.14, "learning_rate": 4.8394395452971734e-06, "loss": 0.9809, "step": 7488 }, { "epoch": 0.14, "learning_rate": 4.83938567648282e-06, "loss": 1.0402, "step": 7489 }, { "epoch": 0.14, "learning_rate": 4.839331798933272e-06, "loss": 0.9463, "step": 7490 }, { "epoch": 0.14, "learning_rate": 4.839277912648731e-06, "loss": 0.806, "step": 7491 }, { "epoch": 0.14, "learning_rate": 4.839224017629397e-06, "loss": 0.9487, "step": 7492 }, { "epoch": 0.14, "learning_rate": 4.839170113875473e-06, "loss": 0.9276, "step": 7493 }, { "epoch": 0.14, "learning_rate": 4.839116201387159e-06, "loss": 1.1291, "step": 7494 }, { "epoch": 0.14, "learning_rate": 4.839062280164657e-06, "loss": 0.796, "step": 7495 }, { "epoch": 0.14, "learning_rate": 4.839008350208168e-06, "loss": 0.9153, "step": 7496 }, { "epoch": 0.14, "learning_rate": 4.838954411517894e-06, "loss": 0.7629, "step": 7497 }, { "epoch": 0.14, "learning_rate": 4.838900464094036e-06, "loss": 1.0413, "step": 7498 }, { "epoch": 0.14, "learning_rate": 4.838846507936795e-06, "loss": 1.0482, "step": 7499 }, { "epoch": 0.14, "learning_rate": 4.838792543046373e-06, "loss": 1.1047, "step": 7500 }, { "epoch": 0.14, "learning_rate": 4.838738569422971e-06, "loss": 0.8541, "step": 7501 }, { "epoch": 0.14, "learning_rate": 4.838684587066792e-06, "loss": 1.0344, "step": 7502 }, { "epoch": 0.14, "learning_rate": 4.838630595978036e-06, "loss": 0.859, "step": 7503 }, { "epoch": 0.14, "learning_rate": 4.838576596156904e-06, "loss": 0.8474, "step": 7504 }, { "epoch": 0.14, "learning_rate": 4.8385225876036e-06, "loss": 0.9578, "step": 7505 }, { "epoch": 0.14, "learning_rate": 4.838468570318324e-06, "loss": 0.958, "step": 7506 }, { "epoch": 0.14, "learning_rate": 4.838414544301277e-06, "loss": 0.9853, "step": 7507 }, { "epoch": 0.14, "learning_rate": 4.8383605095526635e-06, "loss": 1.0128, "step": 7508 }, { "epoch": 0.14, "learning_rate": 4.8383064660726825e-06, "loss": 0.7773, "step": 7509 }, { "epoch": 0.14, "learning_rate": 4.8382524138615375e-06, "loss": 0.8258, "step": 7510 }, { "epoch": 0.14, "learning_rate": 4.8381983529194285e-06, "loss": 1.0053, "step": 7511 }, { "epoch": 0.14, "learning_rate": 4.8381442832465596e-06, "loss": 1.0126, "step": 7512 }, { "epoch": 0.14, "learning_rate": 4.8380902048431314e-06, "loss": 0.9946, "step": 7513 }, { "epoch": 0.14, "learning_rate": 4.838036117709346e-06, "loss": 0.7886, "step": 7514 }, { "epoch": 0.14, "learning_rate": 4.837982021845406e-06, "loss": 0.9159, "step": 7515 }, { "epoch": 0.14, "learning_rate": 4.8379279172515114e-06, "loss": 0.9283, "step": 7516 }, { "epoch": 0.14, "learning_rate": 4.837873803927867e-06, "loss": 0.9094, "step": 7517 }, { "epoch": 0.14, "learning_rate": 4.837819681874673e-06, "loss": 1.067, "step": 7518 }, { "epoch": 0.14, "learning_rate": 4.8377655510921315e-06, "loss": 1.0125, "step": 7519 }, { "epoch": 0.14, "learning_rate": 4.837711411580446e-06, "loss": 1.0626, "step": 7520 }, { "epoch": 0.14, "learning_rate": 4.837657263339817e-06, "loss": 0.8978, "step": 7521 }, { "epoch": 0.14, "learning_rate": 4.8376031063704474e-06, "loss": 0.9229, "step": 7522 }, { "epoch": 0.14, "learning_rate": 4.837548940672541e-06, "loss": 0.9451, "step": 7523 }, { "epoch": 0.14, "learning_rate": 4.8374947662462966e-06, "loss": 0.8122, "step": 7524 }, { "epoch": 0.14, "learning_rate": 4.837440583091919e-06, "loss": 0.948, "step": 7525 }, { "epoch": 0.14, "learning_rate": 4.837386391209611e-06, "loss": 0.9445, "step": 7526 }, { "epoch": 0.14, "learning_rate": 4.837332190599573e-06, "loss": 0.8005, "step": 7527 }, { "epoch": 0.14, "learning_rate": 4.8372779812620075e-06, "loss": 1.0197, "step": 7528 }, { "epoch": 0.14, "learning_rate": 4.837223763197119e-06, "loss": 0.7863, "step": 7529 }, { "epoch": 0.14, "learning_rate": 4.8371695364051075e-06, "loss": 0.8929, "step": 7530 }, { "epoch": 0.14, "learning_rate": 4.8371153008861776e-06, "loss": 1.0658, "step": 7531 }, { "epoch": 0.14, "learning_rate": 4.8370610566405306e-06, "loss": 1.0452, "step": 7532 }, { "epoch": 0.14, "learning_rate": 4.837006803668369e-06, "loss": 0.9754, "step": 7533 }, { "epoch": 0.14, "learning_rate": 4.836952541969896e-06, "loss": 1.044, "step": 7534 }, { "epoch": 0.14, "learning_rate": 4.836898271545313e-06, "loss": 0.7334, "step": 7535 }, { "epoch": 0.14, "learning_rate": 4.8368439923948244e-06, "loss": 0.9879, "step": 7536 }, { "epoch": 0.14, "learning_rate": 4.8367897045186314e-06, "loss": 0.9586, "step": 7537 }, { "epoch": 0.14, "learning_rate": 4.836735407916938e-06, "loss": 1.0203, "step": 7538 }, { "epoch": 0.14, "learning_rate": 4.836681102589945e-06, "loss": 0.9599, "step": 7539 }, { "epoch": 0.14, "learning_rate": 4.836626788537857e-06, "loss": 1.0355, "step": 7540 }, { "epoch": 0.14, "learning_rate": 4.836572465760877e-06, "loss": 0.9581, "step": 7541 }, { "epoch": 0.14, "learning_rate": 4.836518134259207e-06, "loss": 0.8879, "step": 7542 }, { "epoch": 0.14, "learning_rate": 4.8364637940330495e-06, "loss": 1.228, "step": 7543 }, { "epoch": 0.14, "learning_rate": 4.836409445082607e-06, "loss": 1.1976, "step": 7544 }, { "epoch": 0.14, "learning_rate": 4.836355087408085e-06, "loss": 1.0649, "step": 7545 }, { "epoch": 0.14, "learning_rate": 4.836300721009683e-06, "loss": 0.7384, "step": 7546 }, { "epoch": 0.14, "learning_rate": 4.836246345887606e-06, "loss": 0.9019, "step": 7547 }, { "epoch": 0.14, "learning_rate": 4.8361919620420575e-06, "loss": 0.9055, "step": 7548 }, { "epoch": 0.14, "learning_rate": 4.83613756947324e-06, "loss": 1.032, "step": 7549 }, { "epoch": 0.14, "learning_rate": 4.836083168181356e-06, "loss": 1.1919, "step": 7550 }, { "epoch": 0.14, "learning_rate": 4.836028758166609e-06, "loss": 1.0692, "step": 7551 }, { "epoch": 0.14, "learning_rate": 4.835974339429203e-06, "loss": 0.9024, "step": 7552 }, { "epoch": 0.14, "learning_rate": 4.835919911969339e-06, "loss": 0.7321, "step": 7553 }, { "epoch": 0.14, "learning_rate": 4.835865475787222e-06, "loss": 0.7464, "step": 7554 }, { "epoch": 0.14, "learning_rate": 4.835811030883056e-06, "loss": 1.2028, "step": 7555 }, { "epoch": 0.14, "learning_rate": 4.835756577257042e-06, "loss": 1.0759, "step": 7556 }, { "epoch": 0.14, "learning_rate": 4.8357021149093856e-06, "loss": 1.1508, "step": 7557 }, { "epoch": 0.14, "learning_rate": 4.835647643840289e-06, "loss": 0.7575, "step": 7558 }, { "epoch": 0.14, "learning_rate": 4.8355931640499556e-06, "loss": 1.0375, "step": 7559 }, { "epoch": 0.14, "learning_rate": 4.835538675538589e-06, "loss": 1.0018, "step": 7560 }, { "epoch": 0.14, "learning_rate": 4.835484178306392e-06, "loss": 0.8754, "step": 7561 }, { "epoch": 0.14, "learning_rate": 4.835429672353569e-06, "loss": 1.0067, "step": 7562 }, { "epoch": 0.14, "learning_rate": 4.835375157680323e-06, "loss": 1.1284, "step": 7563 }, { "epoch": 0.14, "learning_rate": 4.835320634286858e-06, "loss": 1.0549, "step": 7564 }, { "epoch": 0.14, "learning_rate": 4.835266102173378e-06, "loss": 0.8607, "step": 7565 }, { "epoch": 0.14, "learning_rate": 4.835211561340085e-06, "loss": 0.8762, "step": 7566 }, { "epoch": 0.14, "learning_rate": 4.835157011787184e-06, "loss": 1.009, "step": 7567 }, { "epoch": 0.14, "learning_rate": 4.835102453514878e-06, "loss": 1.0751, "step": 7568 }, { "epoch": 0.14, "learning_rate": 4.835047886523371e-06, "loss": 1.1389, "step": 7569 }, { "epoch": 0.14, "learning_rate": 4.834993310812868e-06, "loss": 0.8907, "step": 7570 }, { "epoch": 0.14, "learning_rate": 4.83493872638357e-06, "loss": 1.0531, "step": 7571 }, { "epoch": 0.14, "learning_rate": 4.8348841332356835e-06, "loss": 0.9509, "step": 7572 }, { "epoch": 0.14, "learning_rate": 4.83482953136941e-06, "loss": 0.9667, "step": 7573 }, { "epoch": 0.14, "learning_rate": 4.834774920784956e-06, "loss": 1.0974, "step": 7574 }, { "epoch": 0.14, "learning_rate": 4.834720301482524e-06, "loss": 0.978, "step": 7575 }, { "epoch": 0.14, "learning_rate": 4.8346656734623165e-06, "loss": 1.0039, "step": 7576 }, { "epoch": 0.14, "learning_rate": 4.83461103672454e-06, "loss": 0.8197, "step": 7577 }, { "epoch": 0.14, "learning_rate": 4.834556391269397e-06, "loss": 0.8237, "step": 7578 }, { "epoch": 0.14, "learning_rate": 4.834501737097093e-06, "loss": 0.9238, "step": 7579 }, { "epoch": 0.14, "learning_rate": 4.834447074207831e-06, "loss": 1.0361, "step": 7580 }, { "epoch": 0.14, "learning_rate": 4.834392402601814e-06, "loss": 0.9982, "step": 7581 }, { "epoch": 0.14, "learning_rate": 4.834337722279248e-06, "loss": 0.6931, "step": 7582 }, { "epoch": 0.14, "learning_rate": 4.8342830332403365e-06, "loss": 0.8698, "step": 7583 }, { "epoch": 0.14, "learning_rate": 4.834228335485284e-06, "loss": 0.9831, "step": 7584 }, { "epoch": 0.14, "learning_rate": 4.834173629014294e-06, "loss": 0.9576, "step": 7585 }, { "epoch": 0.14, "learning_rate": 4.834118913827571e-06, "loss": 1.0096, "step": 7586 }, { "epoch": 0.14, "learning_rate": 4.83406418992532e-06, "loss": 1.1859, "step": 7587 }, { "epoch": 0.14, "learning_rate": 4.834009457307745e-06, "loss": 1.1084, "step": 7588 }, { "epoch": 0.14, "learning_rate": 4.83395471597505e-06, "loss": 0.8055, "step": 7589 }, { "epoch": 0.14, "learning_rate": 4.83389996592744e-06, "loss": 0.8229, "step": 7590 }, { "epoch": 0.14, "learning_rate": 4.8338452071651185e-06, "loss": 0.8597, "step": 7591 }, { "epoch": 0.14, "learning_rate": 4.833790439688292e-06, "loss": 0.8671, "step": 7592 }, { "epoch": 0.14, "learning_rate": 4.833735663497162e-06, "loss": 1.3386, "step": 7593 }, { "epoch": 0.14, "learning_rate": 4.833680878591935e-06, "loss": 1.0831, "step": 7594 }, { "epoch": 0.14, "learning_rate": 4.833626084972815e-06, "loss": 0.8924, "step": 7595 }, { "epoch": 0.14, "learning_rate": 4.8335712826400075e-06, "loss": 0.8829, "step": 7596 }, { "epoch": 0.14, "learning_rate": 4.8335164715937156e-06, "loss": 0.9173, "step": 7597 }, { "epoch": 0.14, "learning_rate": 4.833461651834145e-06, "loss": 0.938, "step": 7598 }, { "epoch": 0.14, "learning_rate": 4.833406823361499e-06, "loss": 1.1247, "step": 7599 }, { "epoch": 0.14, "learning_rate": 4.833351986175985e-06, "loss": 1.2001, "step": 7600 }, { "epoch": 0.14, "learning_rate": 4.833297140277806e-06, "loss": 0.8653, "step": 7601 }, { "epoch": 0.14, "learning_rate": 4.833242285667167e-06, "loss": 1.0145, "step": 7602 }, { "epoch": 0.14, "learning_rate": 4.833187422344272e-06, "loss": 0.9207, "step": 7603 }, { "epoch": 0.14, "learning_rate": 4.833132550309328e-06, "loss": 0.8499, "step": 7604 }, { "epoch": 0.14, "learning_rate": 4.833077669562538e-06, "loss": 1.0759, "step": 7605 }, { "epoch": 0.14, "learning_rate": 4.833022780104107e-06, "loss": 1.0997, "step": 7606 }, { "epoch": 0.14, "learning_rate": 4.832967881934241e-06, "loss": 0.91, "step": 7607 }, { "epoch": 0.14, "learning_rate": 4.832912975053145e-06, "loss": 0.805, "step": 7608 }, { "epoch": 0.14, "learning_rate": 4.832858059461023e-06, "loss": 0.9004, "step": 7609 }, { "epoch": 0.14, "learning_rate": 4.83280313515808e-06, "loss": 1.0444, "step": 7610 }, { "epoch": 0.14, "learning_rate": 4.832748202144521e-06, "loss": 0.9189, "step": 7611 }, { "epoch": 0.14, "learning_rate": 4.832693260420554e-06, "loss": 1.1339, "step": 7612 }, { "epoch": 0.14, "learning_rate": 4.83263830998638e-06, "loss": 0.9536, "step": 7613 }, { "epoch": 0.14, "learning_rate": 4.8325833508422075e-06, "loss": 0.8083, "step": 7614 }, { "epoch": 0.14, "learning_rate": 4.832528382988239e-06, "loss": 0.8835, "step": 7615 }, { "epoch": 0.14, "learning_rate": 4.832473406424681e-06, "loss": 0.7859, "step": 7616 }, { "epoch": 0.14, "learning_rate": 4.83241842115174e-06, "loss": 0.9232, "step": 7617 }, { "epoch": 0.14, "learning_rate": 4.832363427169619e-06, "loss": 1.0298, "step": 7618 }, { "epoch": 0.14, "learning_rate": 4.832308424478526e-06, "loss": 1.1086, "step": 7619 }, { "epoch": 0.14, "learning_rate": 4.832253413078664e-06, "loss": 0.9892, "step": 7620 }, { "epoch": 0.14, "learning_rate": 4.832198392970239e-06, "loss": 0.9163, "step": 7621 }, { "epoch": 0.14, "learning_rate": 4.832143364153456e-06, "loss": 0.7892, "step": 7622 }, { "epoch": 0.14, "learning_rate": 4.832088326628522e-06, "loss": 0.7275, "step": 7623 }, { "epoch": 0.14, "learning_rate": 4.8320332803956416e-06, "loss": 1.017, "step": 7624 }, { "epoch": 0.14, "learning_rate": 4.831978225455021e-06, "loss": 0.9225, "step": 7625 }, { "epoch": 0.14, "learning_rate": 4.831923161806864e-06, "loss": 1.0186, "step": 7626 }, { "epoch": 0.14, "learning_rate": 4.831868089451378e-06, "loss": 0.9797, "step": 7627 }, { "epoch": 0.14, "learning_rate": 4.8318130083887684e-06, "loss": 0.9373, "step": 7628 }, { "epoch": 0.14, "learning_rate": 4.8317579186192405e-06, "loss": 1.0386, "step": 7629 }, { "epoch": 0.14, "learning_rate": 4.831702820143e-06, "loss": 0.9444, "step": 7630 }, { "epoch": 0.14, "learning_rate": 4.831647712960252e-06, "loss": 0.9571, "step": 7631 }, { "epoch": 0.14, "learning_rate": 4.831592597071204e-06, "loss": 1.1738, "step": 7632 }, { "epoch": 0.14, "learning_rate": 4.83153747247606e-06, "loss": 0.9226, "step": 7633 }, { "epoch": 0.14, "learning_rate": 4.8314823391750265e-06, "loss": 0.9553, "step": 7634 }, { "epoch": 0.14, "learning_rate": 4.83142719716831e-06, "loss": 0.928, "step": 7635 }, { "epoch": 0.14, "learning_rate": 4.831372046456115e-06, "loss": 0.9435, "step": 7636 }, { "epoch": 0.14, "learning_rate": 4.831316887038648e-06, "loss": 0.9657, "step": 7637 }, { "epoch": 0.14, "learning_rate": 4.831261718916117e-06, "loss": 0.9692, "step": 7638 }, { "epoch": 0.14, "learning_rate": 4.831206542088725e-06, "loss": 0.8308, "step": 7639 }, { "epoch": 0.14, "learning_rate": 4.831151356556679e-06, "loss": 0.995, "step": 7640 }, { "epoch": 0.14, "learning_rate": 4.831096162320186e-06, "loss": 0.8865, "step": 7641 }, { "epoch": 0.14, "learning_rate": 4.831040959379451e-06, "loss": 0.9809, "step": 7642 }, { "epoch": 0.14, "learning_rate": 4.830985747734681e-06, "loss": 1.1584, "step": 7643 }, { "epoch": 0.14, "learning_rate": 4.830930527386081e-06, "loss": 1.0218, "step": 7644 }, { "epoch": 0.14, "learning_rate": 4.830875298333858e-06, "loss": 0.9601, "step": 7645 }, { "epoch": 0.14, "learning_rate": 4.8308200605782185e-06, "loss": 0.8596, "step": 7646 }, { "epoch": 0.14, "learning_rate": 4.830764814119369e-06, "loss": 1.0219, "step": 7647 }, { "epoch": 0.14, "learning_rate": 4.8307095589575135e-06, "loss": 0.8594, "step": 7648 }, { "epoch": 0.14, "learning_rate": 4.830654295092861e-06, "loss": 1.1865, "step": 7649 }, { "epoch": 0.14, "learning_rate": 4.830599022525617e-06, "loss": 1.164, "step": 7650 }, { "epoch": 0.14, "learning_rate": 4.830543741255987e-06, "loss": 0.8331, "step": 7651 }, { "epoch": 0.14, "learning_rate": 4.830488451284178e-06, "loss": 0.9878, "step": 7652 }, { "epoch": 0.14, "learning_rate": 4.830433152610398e-06, "loss": 0.836, "step": 7653 }, { "epoch": 0.14, "learning_rate": 4.83037784523485e-06, "loss": 0.8264, "step": 7654 }, { "epoch": 0.14, "learning_rate": 4.830322529157744e-06, "loss": 0.9236, "step": 7655 }, { "epoch": 0.14, "learning_rate": 4.830267204379285e-06, "loss": 1.2264, "step": 7656 }, { "epoch": 0.14, "learning_rate": 4.8302118708996794e-06, "loss": 0.8838, "step": 7657 }, { "epoch": 0.14, "learning_rate": 4.830156528719134e-06, "loss": 0.9927, "step": 7658 }, { "epoch": 0.14, "learning_rate": 4.830101177837856e-06, "loss": 0.896, "step": 7659 }, { "epoch": 0.14, "learning_rate": 4.830045818256052e-06, "loss": 0.6944, "step": 7660 }, { "epoch": 0.14, "learning_rate": 4.829990449973927e-06, "loss": 1.1454, "step": 7661 }, { "epoch": 0.14, "learning_rate": 4.82993507299169e-06, "loss": 1.0867, "step": 7662 }, { "epoch": 0.14, "learning_rate": 4.829879687309546e-06, "loss": 0.8849, "step": 7663 }, { "epoch": 0.14, "learning_rate": 4.829824292927704e-06, "loss": 0.9155, "step": 7664 }, { "epoch": 0.14, "learning_rate": 4.829768889846369e-06, "loss": 0.7856, "step": 7665 }, { "epoch": 0.14, "learning_rate": 4.829713478065748e-06, "loss": 0.7881, "step": 7666 }, { "epoch": 0.14, "learning_rate": 4.829658057586049e-06, "loss": 0.9453, "step": 7667 }, { "epoch": 0.14, "learning_rate": 4.829602628407478e-06, "loss": 1.1238, "step": 7668 }, { "epoch": 0.14, "learning_rate": 4.829547190530242e-06, "loss": 0.967, "step": 7669 }, { "epoch": 0.14, "learning_rate": 4.829491743954549e-06, "loss": 0.9785, "step": 7670 }, { "epoch": 0.14, "learning_rate": 4.829436288680604e-06, "loss": 0.7995, "step": 7671 }, { "epoch": 0.14, "learning_rate": 4.829380824708616e-06, "loss": 0.9426, "step": 7672 }, { "epoch": 0.14, "learning_rate": 4.829325352038791e-06, "loss": 1.1268, "step": 7673 }, { "epoch": 0.14, "learning_rate": 4.829269870671337e-06, "loss": 1.0624, "step": 7674 }, { "epoch": 0.14, "learning_rate": 4.829214380606461e-06, "loss": 0.9915, "step": 7675 }, { "epoch": 0.14, "learning_rate": 4.829158881844369e-06, "loss": 1.0119, "step": 7676 }, { "epoch": 0.14, "learning_rate": 4.82910337438527e-06, "loss": 0.9077, "step": 7677 }, { "epoch": 0.14, "learning_rate": 4.82904785822937e-06, "loss": 1.0408, "step": 7678 }, { "epoch": 0.14, "learning_rate": 4.828992333376877e-06, "loss": 0.7836, "step": 7679 }, { "epoch": 0.14, "learning_rate": 4.828936799827998e-06, "loss": 0.8655, "step": 7680 }, { "epoch": 0.14, "learning_rate": 4.82888125758294e-06, "loss": 1.1294, "step": 7681 }, { "epoch": 0.14, "learning_rate": 4.8288257066419105e-06, "loss": 0.769, "step": 7682 }, { "epoch": 0.14, "learning_rate": 4.828770147005118e-06, "loss": 0.8842, "step": 7683 }, { "epoch": 0.14, "learning_rate": 4.828714578672769e-06, "loss": 0.7995, "step": 7684 }, { "epoch": 0.14, "learning_rate": 4.8286590016450705e-06, "loss": 1.0031, "step": 7685 }, { "epoch": 0.15, "learning_rate": 4.828603415922232e-06, "loss": 0.9907, "step": 7686 }, { "epoch": 0.15, "learning_rate": 4.828547821504459e-06, "loss": 1.0268, "step": 7687 }, { "epoch": 0.15, "learning_rate": 4.828492218391959e-06, "loss": 1.0465, "step": 7688 }, { "epoch": 0.15, "learning_rate": 4.828436606584942e-06, "loss": 1.1268, "step": 7689 }, { "epoch": 0.15, "learning_rate": 4.828380986083613e-06, "loss": 0.9616, "step": 7690 }, { "epoch": 0.15, "learning_rate": 4.828325356888182e-06, "loss": 0.7943, "step": 7691 }, { "epoch": 0.15, "learning_rate": 4.828269718998854e-06, "loss": 1.0372, "step": 7692 }, { "epoch": 0.15, "learning_rate": 4.828214072415839e-06, "loss": 1.2158, "step": 7693 }, { "epoch": 0.15, "learning_rate": 4.828158417139344e-06, "loss": 0.9953, "step": 7694 }, { "epoch": 0.15, "learning_rate": 4.8281027531695765e-06, "loss": 0.8237, "step": 7695 }, { "epoch": 0.15, "learning_rate": 4.828047080506745e-06, "loss": 0.9039, "step": 7696 }, { "epoch": 0.15, "learning_rate": 4.827991399151057e-06, "loss": 0.827, "step": 7697 }, { "epoch": 0.15, "learning_rate": 4.82793570910272e-06, "loss": 0.8642, "step": 7698 }, { "epoch": 0.15, "learning_rate": 4.827880010361944e-06, "loss": 1.0276, "step": 7699 }, { "epoch": 0.15, "learning_rate": 4.827824302928934e-06, "loss": 1.1288, "step": 7700 }, { "epoch": 0.15, "learning_rate": 4.8277685868038994e-06, "loss": 0.9076, "step": 7701 }, { "epoch": 0.15, "learning_rate": 4.8277128619870495e-06, "loss": 0.7385, "step": 7702 }, { "epoch": 0.15, "learning_rate": 4.8276571284785904e-06, "loss": 0.993, "step": 7703 }, { "epoch": 0.15, "learning_rate": 4.8276013862787305e-06, "loss": 0.8862, "step": 7704 }, { "epoch": 0.15, "learning_rate": 4.827545635387679e-06, "loss": 0.8948, "step": 7705 }, { "epoch": 0.15, "learning_rate": 4.827489875805643e-06, "loss": 1.1561, "step": 7706 }, { "epoch": 0.15, "learning_rate": 4.827434107532831e-06, "loss": 0.9122, "step": 7707 }, { "epoch": 0.15, "learning_rate": 4.827378330569452e-06, "loss": 0.8936, "step": 7708 }, { "epoch": 0.15, "learning_rate": 4.827322544915714e-06, "loss": 0.8309, "step": 7709 }, { "epoch": 0.15, "learning_rate": 4.8272667505718245e-06, "loss": 0.9144, "step": 7710 }, { "epoch": 0.15, "learning_rate": 4.827210947537992e-06, "loss": 0.98, "step": 7711 }, { "epoch": 0.15, "learning_rate": 4.827155135814426e-06, "loss": 0.9929, "step": 7712 }, { "epoch": 0.15, "learning_rate": 4.827099315401334e-06, "loss": 1.1435, "step": 7713 }, { "epoch": 0.15, "learning_rate": 4.827043486298923e-06, "loss": 0.7533, "step": 7714 }, { "epoch": 0.15, "learning_rate": 4.826987648507404e-06, "loss": 0.7903, "step": 7715 }, { "epoch": 0.15, "learning_rate": 4.826931802026985e-06, "loss": 0.9501, "step": 7716 }, { "epoch": 0.15, "learning_rate": 4.826875946857873e-06, "loss": 0.8254, "step": 7717 }, { "epoch": 0.15, "learning_rate": 4.826820083000279e-06, "loss": 1.0774, "step": 7718 }, { "epoch": 0.15, "learning_rate": 4.826764210454409e-06, "loss": 0.9661, "step": 7719 }, { "epoch": 0.15, "learning_rate": 4.8267083292204724e-06, "loss": 0.9337, "step": 7720 }, { "epoch": 0.15, "learning_rate": 4.826652439298679e-06, "loss": 1.0803, "step": 7721 }, { "epoch": 0.15, "learning_rate": 4.826596540689237e-06, "loss": 0.9802, "step": 7722 }, { "epoch": 0.15, "learning_rate": 4.826540633392354e-06, "loss": 0.8662, "step": 7723 }, { "epoch": 0.15, "learning_rate": 4.82648471740824e-06, "loss": 1.0905, "step": 7724 }, { "epoch": 0.15, "learning_rate": 4.826428792737104e-06, "loss": 1.0419, "step": 7725 }, { "epoch": 0.15, "learning_rate": 4.826372859379152e-06, "loss": 0.9031, "step": 7726 }, { "epoch": 0.15, "learning_rate": 4.826316917334598e-06, "loss": 0.7618, "step": 7727 }, { "epoch": 0.15, "learning_rate": 4.8262609666036464e-06, "loss": 0.8604, "step": 7728 }, { "epoch": 0.15, "learning_rate": 4.826205007186507e-06, "loss": 0.7777, "step": 7729 }, { "epoch": 0.15, "learning_rate": 4.826149039083391e-06, "loss": 0.8931, "step": 7730 }, { "epoch": 0.15, "learning_rate": 4.826093062294505e-06, "loss": 1.049, "step": 7731 }, { "epoch": 0.15, "learning_rate": 4.8260370768200595e-06, "loss": 0.8464, "step": 7732 }, { "epoch": 0.15, "learning_rate": 4.825981082660262e-06, "loss": 1.0192, "step": 7733 }, { "epoch": 0.15, "learning_rate": 4.825925079815323e-06, "loss": 0.9463, "step": 7734 }, { "epoch": 0.15, "learning_rate": 4.82586906828545e-06, "loss": 0.8812, "step": 7735 }, { "epoch": 0.15, "learning_rate": 4.825813048070855e-06, "loss": 0.9122, "step": 7736 }, { "epoch": 0.15, "learning_rate": 4.825757019171744e-06, "loss": 0.9827, "step": 7737 }, { "epoch": 0.15, "learning_rate": 4.825700981588328e-06, "loss": 0.9927, "step": 7738 }, { "epoch": 0.15, "learning_rate": 4.825644935320816e-06, "loss": 1.1402, "step": 7739 }, { "epoch": 0.15, "learning_rate": 4.825588880369418e-06, "loss": 0.9606, "step": 7740 }, { "epoch": 0.15, "learning_rate": 4.8255328167343405e-06, "loss": 0.8513, "step": 7741 }, { "epoch": 0.15, "learning_rate": 4.825476744415796e-06, "loss": 1.0468, "step": 7742 }, { "epoch": 0.15, "learning_rate": 4.825420663413992e-06, "loss": 1.03, "step": 7743 }, { "epoch": 0.15, "learning_rate": 4.825364573729139e-06, "loss": 0.8566, "step": 7744 }, { "epoch": 0.15, "learning_rate": 4.8253084753614465e-06, "loss": 0.9141, "step": 7745 }, { "epoch": 0.15, "learning_rate": 4.825252368311122e-06, "loss": 0.9236, "step": 7746 }, { "epoch": 0.15, "learning_rate": 4.825196252578378e-06, "loss": 0.9449, "step": 7747 }, { "epoch": 0.15, "learning_rate": 4.825140128163421e-06, "loss": 0.8947, "step": 7748 }, { "epoch": 0.15, "learning_rate": 4.825083995066463e-06, "loss": 1.0333, "step": 7749 }, { "epoch": 0.15, "learning_rate": 4.825027853287712e-06, "loss": 1.1848, "step": 7750 }, { "epoch": 0.15, "learning_rate": 4.82497170282738e-06, "loss": 0.868, "step": 7751 }, { "epoch": 0.15, "learning_rate": 4.8249155436856735e-06, "loss": 0.9089, "step": 7752 }, { "epoch": 0.15, "learning_rate": 4.824859375862804e-06, "loss": 0.9365, "step": 7753 }, { "epoch": 0.15, "learning_rate": 4.82480319935898e-06, "loss": 0.8862, "step": 7754 }, { "epoch": 0.15, "learning_rate": 4.824747014174413e-06, "loss": 1.0278, "step": 7755 }, { "epoch": 0.15, "learning_rate": 4.824690820309312e-06, "loss": 1.0403, "step": 7756 }, { "epoch": 0.15, "learning_rate": 4.8246346177638865e-06, "loss": 0.8768, "step": 7757 }, { "epoch": 0.15, "learning_rate": 4.824578406538346e-06, "loss": 0.9207, "step": 7758 }, { "epoch": 0.15, "learning_rate": 4.824522186632902e-06, "loss": 0.9039, "step": 7759 }, { "epoch": 0.15, "learning_rate": 4.824465958047763e-06, "loss": 0.9956, "step": 7760 }, { "epoch": 0.15, "learning_rate": 4.82440972078314e-06, "loss": 0.962, "step": 7761 }, { "epoch": 0.15, "learning_rate": 4.8243534748392414e-06, "loss": 1.0914, "step": 7762 }, { "epoch": 0.15, "learning_rate": 4.824297220216278e-06, "loss": 1.0838, "step": 7763 }, { "epoch": 0.15, "learning_rate": 4.824240956914461e-06, "loss": 1.029, "step": 7764 }, { "epoch": 0.15, "learning_rate": 4.824184684934e-06, "loss": 0.9186, "step": 7765 }, { "epoch": 0.15, "learning_rate": 4.824128404275104e-06, "loss": 0.9421, "step": 7766 }, { "epoch": 0.15, "learning_rate": 4.8240721149379835e-06, "loss": 0.8417, "step": 7767 }, { "epoch": 0.15, "learning_rate": 4.824015816922849e-06, "loss": 1.0291, "step": 7768 }, { "epoch": 0.15, "learning_rate": 4.82395951022991e-06, "loss": 1.1815, "step": 7769 }, { "epoch": 0.15, "learning_rate": 4.8239031948593785e-06, "loss": 1.0825, "step": 7770 }, { "epoch": 0.15, "learning_rate": 4.823846870811464e-06, "loss": 1.0839, "step": 7771 }, { "epoch": 0.15, "learning_rate": 4.823790538086376e-06, "loss": 0.913, "step": 7772 }, { "epoch": 0.15, "learning_rate": 4.823734196684326e-06, "loss": 1.0535, "step": 7773 }, { "epoch": 0.15, "learning_rate": 4.823677846605522e-06, "loss": 1.0245, "step": 7774 }, { "epoch": 0.15, "learning_rate": 4.8236214878501775e-06, "loss": 1.1533, "step": 7775 }, { "epoch": 0.15, "learning_rate": 4.823565120418502e-06, "loss": 0.9938, "step": 7776 }, { "epoch": 0.15, "learning_rate": 4.823508744310704e-06, "loss": 0.8529, "step": 7777 }, { "epoch": 0.15, "learning_rate": 4.823452359526997e-06, "loss": 0.9769, "step": 7778 }, { "epoch": 0.15, "learning_rate": 4.82339596606759e-06, "loss": 1.1108, "step": 7779 }, { "epoch": 0.15, "learning_rate": 4.823339563932693e-06, "loss": 1.0524, "step": 7780 }, { "epoch": 0.15, "learning_rate": 4.823283153122518e-06, "loss": 1.1985, "step": 7781 }, { "epoch": 0.15, "learning_rate": 4.823226733637274e-06, "loss": 0.9287, "step": 7782 }, { "epoch": 0.15, "learning_rate": 4.823170305477174e-06, "loss": 0.9464, "step": 7783 }, { "epoch": 0.15, "learning_rate": 4.823113868642426e-06, "loss": 0.8159, "step": 7784 }, { "epoch": 0.15, "learning_rate": 4.823057423133242e-06, "loss": 0.9155, "step": 7785 }, { "epoch": 0.15, "learning_rate": 4.823000968949834e-06, "loss": 1.1066, "step": 7786 }, { "epoch": 0.15, "learning_rate": 4.822944506092412e-06, "loss": 1.1353, "step": 7787 }, { "epoch": 0.15, "learning_rate": 4.822888034561185e-06, "loss": 1.1273, "step": 7788 }, { "epoch": 0.15, "learning_rate": 4.822831554356365e-06, "loss": 1.0781, "step": 7789 }, { "epoch": 0.15, "learning_rate": 4.822775065478165e-06, "loss": 0.9595, "step": 7790 }, { "epoch": 0.15, "learning_rate": 4.822718567926793e-06, "loss": 0.8761, "step": 7791 }, { "epoch": 0.15, "learning_rate": 4.822662061702461e-06, "loss": 0.9766, "step": 7792 }, { "epoch": 0.15, "learning_rate": 4.82260554680538e-06, "loss": 1.2315, "step": 7793 }, { "epoch": 0.15, "learning_rate": 4.822549023235761e-06, "loss": 1.1483, "step": 7794 }, { "epoch": 0.15, "learning_rate": 4.822492490993816e-06, "loss": 0.8702, "step": 7795 }, { "epoch": 0.15, "learning_rate": 4.822435950079755e-06, "loss": 0.9318, "step": 7796 }, { "epoch": 0.15, "learning_rate": 4.8223794004937885e-06, "loss": 1.0182, "step": 7797 }, { "epoch": 0.15, "learning_rate": 4.82232284223613e-06, "loss": 0.9323, "step": 7798 }, { "epoch": 0.15, "learning_rate": 4.822266275306989e-06, "loss": 1.1322, "step": 7799 }, { "epoch": 0.15, "learning_rate": 4.8222096997065744e-06, "loss": 1.1108, "step": 7800 }, { "epoch": 0.15, "learning_rate": 4.822153115435103e-06, "loss": 0.8244, "step": 7801 }, { "epoch": 0.15, "learning_rate": 4.822096522492782e-06, "loss": 0.8806, "step": 7802 }, { "epoch": 0.15, "learning_rate": 4.822039920879823e-06, "loss": 0.8034, "step": 7803 }, { "epoch": 0.15, "learning_rate": 4.8219833105964395e-06, "loss": 0.8146, "step": 7804 }, { "epoch": 0.15, "learning_rate": 4.821926691642841e-06, "loss": 0.9339, "step": 7805 }, { "epoch": 0.15, "learning_rate": 4.821870064019238e-06, "loss": 1.1237, "step": 7806 }, { "epoch": 0.15, "learning_rate": 4.821813427725845e-06, "loss": 0.9512, "step": 7807 }, { "epoch": 0.15, "learning_rate": 4.821756782762872e-06, "loss": 0.7782, "step": 7808 }, { "epoch": 0.15, "learning_rate": 4.82170012913053e-06, "loss": 0.8087, "step": 7809 }, { "epoch": 0.15, "learning_rate": 4.821643466829031e-06, "loss": 0.9691, "step": 7810 }, { "epoch": 0.15, "learning_rate": 4.821586795858586e-06, "loss": 0.9591, "step": 7811 }, { "epoch": 0.15, "learning_rate": 4.821530116219407e-06, "loss": 1.1228, "step": 7812 }, { "epoch": 0.15, "learning_rate": 4.821473427911706e-06, "loss": 0.9706, "step": 7813 }, { "epoch": 0.15, "learning_rate": 4.821416730935695e-06, "loss": 0.8666, "step": 7814 }, { "epoch": 0.15, "learning_rate": 4.821360025291585e-06, "loss": 1.0375, "step": 7815 }, { "epoch": 0.15, "learning_rate": 4.821303310979587e-06, "loss": 0.9409, "step": 7816 }, { "epoch": 0.15, "learning_rate": 4.821246587999914e-06, "loss": 0.8956, "step": 7817 }, { "epoch": 0.15, "learning_rate": 4.821189856352777e-06, "loss": 1.1087, "step": 7818 }, { "epoch": 0.15, "learning_rate": 4.821133116038389e-06, "loss": 1.1184, "step": 7819 }, { "epoch": 0.15, "learning_rate": 4.82107636705696e-06, "loss": 0.8293, "step": 7820 }, { "epoch": 0.15, "learning_rate": 4.821019609408705e-06, "loss": 0.9017, "step": 7821 }, { "epoch": 0.15, "learning_rate": 4.820962843093832e-06, "loss": 0.9698, "step": 7822 }, { "epoch": 0.15, "learning_rate": 4.820906068112556e-06, "loss": 1.0273, "step": 7823 }, { "epoch": 0.15, "learning_rate": 4.820849284465087e-06, "loss": 0.889, "step": 7824 }, { "epoch": 0.15, "learning_rate": 4.820792492151639e-06, "loss": 1.1439, "step": 7825 }, { "epoch": 0.15, "learning_rate": 4.820735691172422e-06, "loss": 1.0672, "step": 7826 }, { "epoch": 0.15, "learning_rate": 4.820678881527649e-06, "loss": 0.9683, "step": 7827 }, { "epoch": 0.15, "learning_rate": 4.8206220632175335e-06, "loss": 1.2481, "step": 7828 }, { "epoch": 0.15, "learning_rate": 4.820565236242286e-06, "loss": 1.0631, "step": 7829 }, { "epoch": 0.15, "learning_rate": 4.820508400602118e-06, "loss": 0.8802, "step": 7830 }, { "epoch": 0.15, "learning_rate": 4.820451556297244e-06, "loss": 1.058, "step": 7831 }, { "epoch": 0.15, "learning_rate": 4.820394703327874e-06, "loss": 1.1835, "step": 7832 }, { "epoch": 0.15, "learning_rate": 4.820337841694222e-06, "loss": 0.873, "step": 7833 }, { "epoch": 0.15, "learning_rate": 4.8202809713964994e-06, "loss": 0.9918, "step": 7834 }, { "epoch": 0.15, "learning_rate": 4.820224092434919e-06, "loss": 0.8845, "step": 7835 }, { "epoch": 0.15, "learning_rate": 4.820167204809692e-06, "loss": 0.9942, "step": 7836 }, { "epoch": 0.15, "learning_rate": 4.820110308521033e-06, "loss": 1.2073, "step": 7837 }, { "epoch": 0.15, "learning_rate": 4.820053403569154e-06, "loss": 0.8991, "step": 7838 }, { "epoch": 0.15, "learning_rate": 4.819996489954265e-06, "loss": 1.0179, "step": 7839 }, { "epoch": 0.15, "learning_rate": 4.8199395676765806e-06, "loss": 1.1005, "step": 7840 }, { "epoch": 0.15, "learning_rate": 4.819882636736314e-06, "loss": 1.0601, "step": 7841 }, { "epoch": 0.15, "learning_rate": 4.819825697133676e-06, "loss": 0.8185, "step": 7842 }, { "epoch": 0.15, "learning_rate": 4.819768748868879e-06, "loss": 1.0558, "step": 7843 }, { "epoch": 0.15, "learning_rate": 4.819711791942138e-06, "loss": 0.9233, "step": 7844 }, { "epoch": 0.15, "learning_rate": 4.819654826353663e-06, "loss": 0.8175, "step": 7845 }, { "epoch": 0.15, "learning_rate": 4.81959785210367e-06, "loss": 0.8347, "step": 7846 }, { "epoch": 0.15, "learning_rate": 4.819540869192368e-06, "loss": 1.0011, "step": 7847 }, { "epoch": 0.15, "learning_rate": 4.819483877619972e-06, "loss": 0.9939, "step": 7848 }, { "epoch": 0.15, "learning_rate": 4.819426877386695e-06, "loss": 1.0633, "step": 7849 }, { "epoch": 0.15, "learning_rate": 4.819369868492748e-06, "loss": 1.1141, "step": 7850 }, { "epoch": 0.15, "learning_rate": 4.819312850938346e-06, "loss": 1.024, "step": 7851 }, { "epoch": 0.15, "learning_rate": 4.819255824723701e-06, "loss": 0.894, "step": 7852 }, { "epoch": 0.15, "learning_rate": 4.819198789849025e-06, "loss": 0.8816, "step": 7853 }, { "epoch": 0.15, "learning_rate": 4.819141746314533e-06, "loss": 0.7923, "step": 7854 }, { "epoch": 0.15, "learning_rate": 4.819084694120435e-06, "loss": 1.0419, "step": 7855 }, { "epoch": 0.15, "learning_rate": 4.819027633266947e-06, "loss": 1.1486, "step": 7856 }, { "epoch": 0.15, "learning_rate": 4.818970563754281e-06, "loss": 0.8723, "step": 7857 }, { "epoch": 0.15, "learning_rate": 4.8189134855826505e-06, "loss": 0.9244, "step": 7858 }, { "epoch": 0.15, "learning_rate": 4.818856398752267e-06, "loss": 0.9718, "step": 7859 }, { "epoch": 0.15, "learning_rate": 4.818799303263345e-06, "loss": 0.9173, "step": 7860 }, { "epoch": 0.15, "learning_rate": 4.818742199116098e-06, "loss": 0.929, "step": 7861 }, { "epoch": 0.15, "learning_rate": 4.818685086310739e-06, "loss": 0.9885, "step": 7862 }, { "epoch": 0.15, "learning_rate": 4.8186279648474795e-06, "loss": 0.9721, "step": 7863 }, { "epoch": 0.15, "learning_rate": 4.8185708347265355e-06, "loss": 0.8909, "step": 7864 }, { "epoch": 0.15, "learning_rate": 4.8185136959481195e-06, "loss": 0.9752, "step": 7865 }, { "epoch": 0.15, "learning_rate": 4.818456548512443e-06, "loss": 0.839, "step": 7866 }, { "epoch": 0.15, "learning_rate": 4.818399392419722e-06, "loss": 0.8225, "step": 7867 }, { "epoch": 0.15, "learning_rate": 4.818342227670168e-06, "loss": 1.0615, "step": 7868 }, { "epoch": 0.15, "learning_rate": 4.818285054263997e-06, "loss": 0.9941, "step": 7869 }, { "epoch": 0.15, "learning_rate": 4.818227872201419e-06, "loss": 0.9938, "step": 7870 }, { "epoch": 0.15, "learning_rate": 4.818170681482649e-06, "loss": 1.0958, "step": 7871 }, { "epoch": 0.15, "learning_rate": 4.818113482107901e-06, "loss": 0.8733, "step": 7872 }, { "epoch": 0.15, "learning_rate": 4.818056274077389e-06, "loss": 0.9354, "step": 7873 }, { "epoch": 0.15, "learning_rate": 4.8179990573913256e-06, "loss": 1.0258, "step": 7874 }, { "epoch": 0.15, "learning_rate": 4.817941832049925e-06, "loss": 0.9409, "step": 7875 }, { "epoch": 0.15, "learning_rate": 4.8178845980534e-06, "loss": 0.69, "step": 7876 }, { "epoch": 0.15, "learning_rate": 4.817827355401965e-06, "loss": 0.8502, "step": 7877 }, { "epoch": 0.15, "learning_rate": 4.817770104095835e-06, "loss": 0.9414, "step": 7878 }, { "epoch": 0.15, "learning_rate": 4.817712844135221e-06, "loss": 0.7808, "step": 7879 }, { "epoch": 0.15, "learning_rate": 4.817655575520339e-06, "loss": 0.9011, "step": 7880 }, { "epoch": 0.15, "learning_rate": 4.817598298251402e-06, "loss": 1.0062, "step": 7881 }, { "epoch": 0.15, "learning_rate": 4.8175410123286235e-06, "loss": 1.0363, "step": 7882 }, { "epoch": 0.15, "learning_rate": 4.81748371775222e-06, "loss": 1.0927, "step": 7883 }, { "epoch": 0.15, "learning_rate": 4.817426414522401e-06, "loss": 0.9238, "step": 7884 }, { "epoch": 0.15, "learning_rate": 4.8173691026393834e-06, "loss": 0.8276, "step": 7885 }, { "epoch": 0.15, "learning_rate": 4.817311782103381e-06, "loss": 0.8777, "step": 7886 }, { "epoch": 0.15, "learning_rate": 4.817254452914607e-06, "loss": 1.1553, "step": 7887 }, { "epoch": 0.15, "learning_rate": 4.817197115073277e-06, "loss": 1.1322, "step": 7888 }, { "epoch": 0.15, "learning_rate": 4.817139768579603e-06, "loss": 1.0278, "step": 7889 }, { "epoch": 0.15, "learning_rate": 4.8170824134338e-06, "loss": 0.9068, "step": 7890 }, { "epoch": 0.15, "learning_rate": 4.817025049636082e-06, "loss": 0.9027, "step": 7891 }, { "epoch": 0.15, "learning_rate": 4.816967677186665e-06, "loss": 0.823, "step": 7892 }, { "epoch": 0.15, "learning_rate": 4.816910296085761e-06, "loss": 0.9152, "step": 7893 }, { "epoch": 0.15, "learning_rate": 4.816852906333585e-06, "loss": 0.9291, "step": 7894 }, { "epoch": 0.15, "learning_rate": 4.816795507930351e-06, "loss": 0.8693, "step": 7895 }, { "epoch": 0.15, "learning_rate": 4.816738100876274e-06, "loss": 1.0213, "step": 7896 }, { "epoch": 0.15, "learning_rate": 4.8166806851715675e-06, "loss": 0.8697, "step": 7897 }, { "epoch": 0.15, "learning_rate": 4.816623260816447e-06, "loss": 0.8765, "step": 7898 }, { "epoch": 0.15, "learning_rate": 4.816565827811126e-06, "loss": 1.0807, "step": 7899 }, { "epoch": 0.15, "learning_rate": 4.8165083861558194e-06, "loss": 1.0087, "step": 7900 }, { "epoch": 0.15, "learning_rate": 4.81645093585074e-06, "loss": 1.0698, "step": 7901 }, { "epoch": 0.15, "learning_rate": 4.8163934768961064e-06, "loss": 0.8712, "step": 7902 }, { "epoch": 0.15, "learning_rate": 4.8163360092921286e-06, "loss": 0.9446, "step": 7903 }, { "epoch": 0.15, "learning_rate": 4.8162785330390236e-06, "loss": 0.9139, "step": 7904 }, { "epoch": 0.15, "learning_rate": 4.816221048137007e-06, "loss": 1.0994, "step": 7905 }, { "epoch": 0.15, "learning_rate": 4.81616355458629e-06, "loss": 1.0641, "step": 7906 }, { "epoch": 0.15, "learning_rate": 4.8161060523870905e-06, "loss": 0.9429, "step": 7907 }, { "epoch": 0.15, "learning_rate": 4.816048541539622e-06, "loss": 0.9139, "step": 7908 }, { "epoch": 0.15, "learning_rate": 4.815991022044099e-06, "loss": 0.9996, "step": 7909 }, { "epoch": 0.15, "learning_rate": 4.815933493900736e-06, "loss": 0.858, "step": 7910 }, { "epoch": 0.15, "learning_rate": 4.815875957109748e-06, "loss": 1.0002, "step": 7911 }, { "epoch": 0.15, "learning_rate": 4.815818411671351e-06, "loss": 1.1338, "step": 7912 }, { "epoch": 0.15, "learning_rate": 4.815760857585759e-06, "loss": 1.0088, "step": 7913 }, { "epoch": 0.15, "learning_rate": 4.815703294853188e-06, "loss": 1.0559, "step": 7914 }, { "epoch": 0.15, "learning_rate": 4.815645723473851e-06, "loss": 0.8776, "step": 7915 }, { "epoch": 0.15, "learning_rate": 4.8155881434479635e-06, "loss": 1.0328, "step": 7916 }, { "epoch": 0.15, "learning_rate": 4.815530554775741e-06, "loss": 0.8853, "step": 7917 }, { "epoch": 0.15, "learning_rate": 4.815472957457399e-06, "loss": 0.8737, "step": 7918 }, { "epoch": 0.15, "learning_rate": 4.815415351493151e-06, "loss": 1.1262, "step": 7919 }, { "epoch": 0.15, "learning_rate": 4.815357736883214e-06, "loss": 0.8725, "step": 7920 }, { "epoch": 0.15, "learning_rate": 4.815300113627801e-06, "loss": 0.8369, "step": 7921 }, { "epoch": 0.15, "learning_rate": 4.815242481727129e-06, "loss": 0.8027, "step": 7922 }, { "epoch": 0.15, "learning_rate": 4.815184841181413e-06, "loss": 0.8123, "step": 7923 }, { "epoch": 0.15, "learning_rate": 4.815127191990867e-06, "loss": 1.0868, "step": 7924 }, { "epoch": 0.15, "learning_rate": 4.815069534155708e-06, "loss": 1.1138, "step": 7925 }, { "epoch": 0.15, "learning_rate": 4.8150118676761496e-06, "loss": 0.9182, "step": 7926 }, { "epoch": 0.15, "learning_rate": 4.814954192552408e-06, "loss": 0.9103, "step": 7927 }, { "epoch": 0.15, "learning_rate": 4.814896508784699e-06, "loss": 1.0099, "step": 7928 }, { "epoch": 0.15, "learning_rate": 4.814838816373237e-06, "loss": 0.8081, "step": 7929 }, { "epoch": 0.15, "learning_rate": 4.814781115318238e-06, "loss": 1.0101, "step": 7930 }, { "epoch": 0.15, "learning_rate": 4.814723405619916e-06, "loss": 1.1453, "step": 7931 }, { "epoch": 0.15, "learning_rate": 4.81466568727849e-06, "loss": 0.9661, "step": 7932 }, { "epoch": 0.15, "learning_rate": 4.814607960294172e-06, "loss": 1.0445, "step": 7933 }, { "epoch": 0.15, "learning_rate": 4.8145502246671785e-06, "loss": 0.9064, "step": 7934 }, { "epoch": 0.15, "learning_rate": 4.814492480397726e-06, "loss": 0.8395, "step": 7935 }, { "epoch": 0.15, "learning_rate": 4.8144347274860295e-06, "loss": 0.8756, "step": 7936 }, { "epoch": 0.15, "learning_rate": 4.814376965932305e-06, "loss": 1.3069, "step": 7937 }, { "epoch": 0.15, "learning_rate": 4.814319195736767e-06, "loss": 1.0967, "step": 7938 }, { "epoch": 0.15, "learning_rate": 4.8142614168996324e-06, "loss": 0.8849, "step": 7939 }, { "epoch": 0.15, "learning_rate": 4.814203629421118e-06, "loss": 0.9105, "step": 7940 }, { "epoch": 0.15, "learning_rate": 4.814145833301437e-06, "loss": 1.0246, "step": 7941 }, { "epoch": 0.15, "learning_rate": 4.8140880285408055e-06, "loss": 0.8665, "step": 7942 }, { "epoch": 0.15, "learning_rate": 4.814030215139441e-06, "loss": 1.002, "step": 7943 }, { "epoch": 0.15, "learning_rate": 4.813972393097559e-06, "loss": 1.1462, "step": 7944 }, { "epoch": 0.15, "learning_rate": 4.8139145624153755e-06, "loss": 0.798, "step": 7945 }, { "epoch": 0.15, "learning_rate": 4.8138567230931054e-06, "loss": 0.9893, "step": 7946 }, { "epoch": 0.15, "learning_rate": 4.813798875130965e-06, "loss": 0.8556, "step": 7947 }, { "epoch": 0.15, "learning_rate": 4.813741018529171e-06, "loss": 0.8792, "step": 7948 }, { "epoch": 0.15, "learning_rate": 4.813683153287938e-06, "loss": 1.1829, "step": 7949 }, { "epoch": 0.15, "learning_rate": 4.8136252794074845e-06, "loss": 1.0505, "step": 7950 }, { "epoch": 0.15, "learning_rate": 4.813567396888023e-06, "loss": 0.8682, "step": 7951 }, { "epoch": 0.15, "learning_rate": 4.813509505729775e-06, "loss": 0.7693, "step": 7952 }, { "epoch": 0.15, "learning_rate": 4.81345160593295e-06, "loss": 0.8328, "step": 7953 }, { "epoch": 0.15, "learning_rate": 4.813393697497771e-06, "loss": 0.8822, "step": 7954 }, { "epoch": 0.15, "learning_rate": 4.813335780424448e-06, "loss": 1.2114, "step": 7955 }, { "epoch": 0.15, "learning_rate": 4.8132778547132005e-06, "loss": 1.1473, "step": 7956 }, { "epoch": 0.15, "learning_rate": 4.813219920364246e-06, "loss": 0.9024, "step": 7957 }, { "epoch": 0.15, "learning_rate": 4.813161977377798e-06, "loss": 0.8374, "step": 7958 }, { "epoch": 0.15, "learning_rate": 4.813104025754075e-06, "loss": 0.8909, "step": 7959 }, { "epoch": 0.15, "learning_rate": 4.813046065493292e-06, "loss": 0.9982, "step": 7960 }, { "epoch": 0.15, "learning_rate": 4.812988096595665e-06, "loss": 0.7742, "step": 7961 }, { "epoch": 0.15, "learning_rate": 4.812930119061413e-06, "loss": 1.1257, "step": 7962 }, { "epoch": 0.15, "learning_rate": 4.81287213289075e-06, "loss": 1.0128, "step": 7963 }, { "epoch": 0.15, "learning_rate": 4.812814138083894e-06, "loss": 0.8659, "step": 7964 }, { "epoch": 0.15, "learning_rate": 4.81275613464106e-06, "loss": 1.0139, "step": 7965 }, { "epoch": 0.15, "learning_rate": 4.812698122562466e-06, "loss": 0.9745, "step": 7966 }, { "epoch": 0.15, "learning_rate": 4.812640101848328e-06, "loss": 0.6977, "step": 7967 }, { "epoch": 0.15, "learning_rate": 4.812582072498862e-06, "loss": 1.2153, "step": 7968 }, { "epoch": 0.15, "learning_rate": 4.812524034514287e-06, "loss": 1.1798, "step": 7969 }, { "epoch": 0.15, "learning_rate": 4.812465987894817e-06, "loss": 1.0944, "step": 7970 }, { "epoch": 0.15, "learning_rate": 4.8124079326406706e-06, "loss": 0.7928, "step": 7971 }, { "epoch": 0.15, "learning_rate": 4.812349868752063e-06, "loss": 0.8134, "step": 7972 }, { "epoch": 0.15, "learning_rate": 4.812291796229213e-06, "loss": 1.0217, "step": 7973 }, { "epoch": 0.15, "learning_rate": 4.812233715072336e-06, "loss": 1.1865, "step": 7974 }, { "epoch": 0.15, "learning_rate": 4.812175625281649e-06, "loss": 0.894, "step": 7975 }, { "epoch": 0.15, "learning_rate": 4.812117526857368e-06, "loss": 1.0853, "step": 7976 }, { "epoch": 0.15, "learning_rate": 4.812059419799713e-06, "loss": 0.9035, "step": 7977 }, { "epoch": 0.15, "learning_rate": 4.812001304108898e-06, "loss": 0.9537, "step": 7978 }, { "epoch": 0.15, "learning_rate": 4.811943179785142e-06, "loss": 0.9345, "step": 7979 }, { "epoch": 0.15, "learning_rate": 4.811885046828659e-06, "loss": 1.0846, "step": 7980 }, { "epoch": 0.15, "learning_rate": 4.8118269052396696e-06, "loss": 1.1375, "step": 7981 }, { "epoch": 0.15, "learning_rate": 4.811768755018389e-06, "loss": 0.9955, "step": 7982 }, { "epoch": 0.15, "learning_rate": 4.811710596165035e-06, "loss": 0.8607, "step": 7983 }, { "epoch": 0.15, "learning_rate": 4.811652428679825e-06, "loss": 1.0412, "step": 7984 }, { "epoch": 0.15, "learning_rate": 4.811594252562974e-06, "loss": 0.9681, "step": 7985 }, { "epoch": 0.15, "learning_rate": 4.811536067814703e-06, "loss": 0.9858, "step": 7986 }, { "epoch": 0.15, "learning_rate": 4.811477874435226e-06, "loss": 1.0361, "step": 7987 }, { "epoch": 0.15, "learning_rate": 4.811419672424762e-06, "loss": 0.8756, "step": 7988 }, { "epoch": 0.15, "learning_rate": 4.8113614617835276e-06, "loss": 0.862, "step": 7989 }, { "epoch": 0.15, "learning_rate": 4.81130324251174e-06, "loss": 0.7515, "step": 7990 }, { "epoch": 0.15, "learning_rate": 4.811245014609617e-06, "loss": 0.9982, "step": 7991 }, { "epoch": 0.15, "learning_rate": 4.811186778077377e-06, "loss": 1.1221, "step": 7992 }, { "epoch": 0.15, "learning_rate": 4.811128532915235e-06, "loss": 1.1089, "step": 7993 }, { "epoch": 0.15, "learning_rate": 4.811070279123411e-06, "loss": 0.8039, "step": 7994 }, { "epoch": 0.15, "learning_rate": 4.8110120167021214e-06, "loss": 1.0923, "step": 7995 }, { "epoch": 0.15, "learning_rate": 4.810953745651583e-06, "loss": 1.0321, "step": 7996 }, { "epoch": 0.15, "learning_rate": 4.810895465972015e-06, "loss": 1.0374, "step": 7997 }, { "epoch": 0.15, "learning_rate": 4.810837177663634e-06, "loss": 0.8532, "step": 7998 }, { "epoch": 0.15, "learning_rate": 4.810778880726658e-06, "loss": 0.8838, "step": 7999 }, { "epoch": 0.15, "learning_rate": 4.810720575161303e-06, "loss": 1.077, "step": 8000 }, { "epoch": 0.15, "learning_rate": 4.81066226096779e-06, "loss": 1.081, "step": 8001 }, { "epoch": 0.15, "learning_rate": 4.810603938146334e-06, "loss": 0.8487, "step": 8002 }, { "epoch": 0.15, "learning_rate": 4.810545606697154e-06, "loss": 1.0265, "step": 8003 }, { "epoch": 0.15, "learning_rate": 4.810487266620468e-06, "loss": 0.8037, "step": 8004 }, { "epoch": 0.15, "learning_rate": 4.8104289179164925e-06, "loss": 0.9357, "step": 8005 }, { "epoch": 0.15, "learning_rate": 4.810370560585447e-06, "loss": 1.1129, "step": 8006 }, { "epoch": 0.15, "learning_rate": 4.810312194627548e-06, "loss": 0.757, "step": 8007 }, { "epoch": 0.15, "learning_rate": 4.810253820043015e-06, "loss": 0.7153, "step": 8008 }, { "epoch": 0.15, "learning_rate": 4.810195436832064e-06, "loss": 1.1076, "step": 8009 }, { "epoch": 0.15, "learning_rate": 4.810137044994915e-06, "loss": 0.8738, "step": 8010 }, { "epoch": 0.15, "learning_rate": 4.810078644531785e-06, "loss": 0.9111, "step": 8011 }, { "epoch": 0.15, "learning_rate": 4.810020235442892e-06, "loss": 1.0329, "step": 8012 }, { "epoch": 0.15, "learning_rate": 4.809961817728454e-06, "loss": 0.9108, "step": 8013 }, { "epoch": 0.15, "learning_rate": 4.8099033913886895e-06, "loss": 0.8166, "step": 8014 }, { "epoch": 0.15, "learning_rate": 4.809844956423817e-06, "loss": 0.6729, "step": 8015 }, { "epoch": 0.15, "learning_rate": 4.809786512834054e-06, "loss": 1.1087, "step": 8016 }, { "epoch": 0.15, "learning_rate": 4.809728060619619e-06, "loss": 1.0241, "step": 8017 }, { "epoch": 0.15, "learning_rate": 4.80966959978073e-06, "loss": 0.9445, "step": 8018 }, { "epoch": 0.15, "learning_rate": 4.809611130317605e-06, "loss": 1.081, "step": 8019 }, { "epoch": 0.15, "learning_rate": 4.8095526522304635e-06, "loss": 0.9019, "step": 8020 }, { "epoch": 0.15, "learning_rate": 4.809494165519524e-06, "loss": 0.8502, "step": 8021 }, { "epoch": 0.15, "learning_rate": 4.809435670185003e-06, "loss": 0.9891, "step": 8022 }, { "epoch": 0.15, "learning_rate": 4.8093771662271205e-06, "loss": 0.935, "step": 8023 }, { "epoch": 0.15, "learning_rate": 4.809318653646094e-06, "loss": 1.0374, "step": 8024 }, { "epoch": 0.15, "learning_rate": 4.809260132442143e-06, "loss": 1.1077, "step": 8025 }, { "epoch": 0.15, "learning_rate": 4.809201602615486e-06, "loss": 1.0184, "step": 8026 }, { "epoch": 0.15, "learning_rate": 4.809143064166339e-06, "loss": 0.9082, "step": 8027 }, { "epoch": 0.15, "learning_rate": 4.809084517094924e-06, "loss": 0.9145, "step": 8028 }, { "epoch": 0.15, "learning_rate": 4.8090259614014585e-06, "loss": 0.9514, "step": 8029 }, { "epoch": 0.15, "learning_rate": 4.8089673970861604e-06, "loss": 1.0455, "step": 8030 }, { "epoch": 0.15, "learning_rate": 4.8089088241492485e-06, "loss": 1.0164, "step": 8031 }, { "epoch": 0.15, "learning_rate": 4.808850242590942e-06, "loss": 1.0338, "step": 8032 }, { "epoch": 0.15, "learning_rate": 4.80879165241146e-06, "loss": 0.8104, "step": 8033 }, { "epoch": 0.15, "learning_rate": 4.8087330536110205e-06, "loss": 0.8779, "step": 8034 }, { "epoch": 0.15, "learning_rate": 4.808674446189843e-06, "loss": 0.7396, "step": 8035 }, { "epoch": 0.15, "learning_rate": 4.808615830148145e-06, "loss": 0.9517, "step": 8036 }, { "epoch": 0.15, "learning_rate": 4.808557205486147e-06, "loss": 1.0518, "step": 8037 }, { "epoch": 0.15, "learning_rate": 4.8084985722040664e-06, "loss": 1.1221, "step": 8038 }, { "epoch": 0.15, "learning_rate": 4.808439930302123e-06, "loss": 0.9576, "step": 8039 }, { "epoch": 0.15, "learning_rate": 4.8083812797805366e-06, "loss": 0.776, "step": 8040 }, { "epoch": 0.15, "learning_rate": 4.808322620639525e-06, "loss": 0.8087, "step": 8041 }, { "epoch": 0.15, "learning_rate": 4.8082639528793065e-06, "loss": 0.7728, "step": 8042 }, { "epoch": 0.15, "learning_rate": 4.808205276500102e-06, "loss": 1.0555, "step": 8043 }, { "epoch": 0.15, "learning_rate": 4.8081465915021295e-06, "loss": 0.9998, "step": 8044 }, { "epoch": 0.15, "learning_rate": 4.80808789788561e-06, "loss": 0.7998, "step": 8045 }, { "epoch": 0.15, "learning_rate": 4.808029195650758e-06, "loss": 0.7538, "step": 8046 }, { "epoch": 0.15, "learning_rate": 4.807970484797798e-06, "loss": 1.0078, "step": 8047 }, { "epoch": 0.15, "learning_rate": 4.807911765326947e-06, "loss": 0.9225, "step": 8048 }, { "epoch": 0.15, "learning_rate": 4.807853037238423e-06, "loss": 1.1555, "step": 8049 }, { "epoch": 0.15, "learning_rate": 4.807794300532447e-06, "loss": 0.8549, "step": 8050 }, { "epoch": 0.15, "learning_rate": 4.807735555209238e-06, "loss": 1.0625, "step": 8051 }, { "epoch": 0.15, "learning_rate": 4.807676801269015e-06, "loss": 0.6803, "step": 8052 }, { "epoch": 0.15, "learning_rate": 4.807618038711998e-06, "loss": 0.9587, "step": 8053 }, { "epoch": 0.15, "learning_rate": 4.8075592675384056e-06, "loss": 0.9976, "step": 8054 }, { "epoch": 0.15, "learning_rate": 4.807500487748458e-06, "loss": 0.9062, "step": 8055 }, { "epoch": 0.15, "learning_rate": 4.807441699342374e-06, "loss": 0.8801, "step": 8056 }, { "epoch": 0.15, "learning_rate": 4.807382902320373e-06, "loss": 0.9487, "step": 8057 }, { "epoch": 0.15, "learning_rate": 4.807324096682676e-06, "loss": 0.8803, "step": 8058 }, { "epoch": 0.15, "learning_rate": 4.8072652824295005e-06, "loss": 0.8884, "step": 8059 }, { "epoch": 0.15, "learning_rate": 4.807206459561068e-06, "loss": 0.9294, "step": 8060 }, { "epoch": 0.15, "learning_rate": 4.807147628077597e-06, "loss": 0.806, "step": 8061 }, { "epoch": 0.15, "learning_rate": 4.807088787979308e-06, "loss": 1.085, "step": 8062 }, { "epoch": 0.15, "learning_rate": 4.80702993926642e-06, "loss": 0.7994, "step": 8063 }, { "epoch": 0.15, "learning_rate": 4.806971081939152e-06, "loss": 1.0522, "step": 8064 }, { "epoch": 0.15, "learning_rate": 4.806912215997726e-06, "loss": 0.7563, "step": 8065 }, { "epoch": 0.15, "learning_rate": 4.80685334144236e-06, "loss": 0.8353, "step": 8066 }, { "epoch": 0.15, "learning_rate": 4.806794458273274e-06, "loss": 0.9722, "step": 8067 }, { "epoch": 0.15, "learning_rate": 4.806735566490689e-06, "loss": 1.1049, "step": 8068 }, { "epoch": 0.15, "learning_rate": 4.8066766660948236e-06, "loss": 0.9888, "step": 8069 }, { "epoch": 0.15, "learning_rate": 4.806617757085898e-06, "loss": 0.8272, "step": 8070 }, { "epoch": 0.15, "learning_rate": 4.806558839464133e-06, "loss": 1.0224, "step": 8071 }, { "epoch": 0.15, "learning_rate": 4.806499913229747e-06, "loss": 1.0684, "step": 8072 }, { "epoch": 0.15, "learning_rate": 4.806440978382963e-06, "loss": 0.8912, "step": 8073 }, { "epoch": 0.15, "learning_rate": 4.806382034923997e-06, "loss": 0.896, "step": 8074 }, { "epoch": 0.15, "learning_rate": 4.806323082853072e-06, "loss": 1.0947, "step": 8075 }, { "epoch": 0.15, "learning_rate": 4.806264122170408e-06, "loss": 0.9358, "step": 8076 }, { "epoch": 0.15, "learning_rate": 4.806205152876223e-06, "loss": 0.8672, "step": 8077 }, { "epoch": 0.15, "learning_rate": 4.80614617497074e-06, "loss": 0.8969, "step": 8078 }, { "epoch": 0.15, "learning_rate": 4.8060871884541775e-06, "loss": 0.8459, "step": 8079 }, { "epoch": 0.15, "learning_rate": 4.806028193326756e-06, "loss": 0.8763, "step": 8080 }, { "epoch": 0.15, "learning_rate": 4.8059691895886965e-06, "loss": 0.9875, "step": 8081 }, { "epoch": 0.15, "learning_rate": 4.805910177240218e-06, "loss": 1.1064, "step": 8082 }, { "epoch": 0.15, "learning_rate": 4.805851156281541e-06, "loss": 0.8681, "step": 8083 }, { "epoch": 0.15, "learning_rate": 4.805792126712889e-06, "loss": 0.9417, "step": 8084 }, { "epoch": 0.15, "learning_rate": 4.805733088534477e-06, "loss": 0.998, "step": 8085 }, { "epoch": 0.15, "learning_rate": 4.80567404174653e-06, "loss": 0.9999, "step": 8086 }, { "epoch": 0.15, "learning_rate": 4.8056149863492666e-06, "loss": 1.1843, "step": 8087 }, { "epoch": 0.15, "learning_rate": 4.805555922342907e-06, "loss": 1.0114, "step": 8088 }, { "epoch": 0.15, "learning_rate": 4.805496849727672e-06, "loss": 0.7915, "step": 8089 }, { "epoch": 0.15, "learning_rate": 4.805437768503783e-06, "loss": 0.8257, "step": 8090 }, { "epoch": 0.15, "learning_rate": 4.8053786786714605e-06, "loss": 0.9192, "step": 8091 }, { "epoch": 0.15, "learning_rate": 4.805319580230925e-06, "loss": 0.9407, "step": 8092 }, { "epoch": 0.15, "learning_rate": 4.805260473182396e-06, "loss": 0.8837, "step": 8093 }, { "epoch": 0.15, "learning_rate": 4.805201357526095e-06, "loss": 1.0535, "step": 8094 }, { "epoch": 0.15, "learning_rate": 4.805142233262243e-06, "loss": 0.6916, "step": 8095 }, { "epoch": 0.15, "learning_rate": 4.805083100391061e-06, "loss": 0.896, "step": 8096 }, { "epoch": 0.15, "learning_rate": 4.805023958912769e-06, "loss": 0.7762, "step": 8097 }, { "epoch": 0.15, "learning_rate": 4.804964808827588e-06, "loss": 0.8299, "step": 8098 }, { "epoch": 0.15, "learning_rate": 4.804905650135739e-06, "loss": 0.9396, "step": 8099 }, { "epoch": 0.15, "learning_rate": 4.804846482837444e-06, "loss": 1.0612, "step": 8100 }, { "epoch": 0.15, "learning_rate": 4.804787306932922e-06, "loss": 0.8421, "step": 8101 }, { "epoch": 0.15, "learning_rate": 4.804728122422395e-06, "loss": 0.9026, "step": 8102 }, { "epoch": 0.15, "learning_rate": 4.804668929306083e-06, "loss": 0.7946, "step": 8103 }, { "epoch": 0.15, "learning_rate": 4.80460972758421e-06, "loss": 1.0079, "step": 8104 }, { "epoch": 0.15, "learning_rate": 4.804550517256993e-06, "loss": 0.9454, "step": 8105 }, { "epoch": 0.15, "learning_rate": 4.804491298324656e-06, "loss": 1.1531, "step": 8106 }, { "epoch": 0.15, "learning_rate": 4.804432070787419e-06, "loss": 0.8549, "step": 8107 }, { "epoch": 0.15, "learning_rate": 4.804372834645503e-06, "loss": 0.9973, "step": 8108 }, { "epoch": 0.15, "learning_rate": 4.80431358989913e-06, "loss": 0.9255, "step": 8109 }, { "epoch": 0.15, "learning_rate": 4.80425433654852e-06, "loss": 0.8157, "step": 8110 }, { "epoch": 0.15, "learning_rate": 4.804195074593896e-06, "loss": 0.7839, "step": 8111 }, { "epoch": 0.15, "learning_rate": 4.8041358040354764e-06, "loss": 1.0199, "step": 8112 }, { "epoch": 0.15, "learning_rate": 4.804076524873487e-06, "loss": 1.0352, "step": 8113 }, { "epoch": 0.15, "learning_rate": 4.804017237108144e-06, "loss": 0.9563, "step": 8114 }, { "epoch": 0.15, "learning_rate": 4.803957940739673e-06, "loss": 0.6836, "step": 8115 }, { "epoch": 0.15, "learning_rate": 4.803898635768293e-06, "loss": 0.9307, "step": 8116 }, { "epoch": 0.15, "learning_rate": 4.803839322194226e-06, "loss": 0.8585, "step": 8117 }, { "epoch": 0.15, "learning_rate": 4.803780000017694e-06, "loss": 1.0387, "step": 8118 }, { "epoch": 0.15, "learning_rate": 4.803720669238917e-06, "loss": 1.0306, "step": 8119 }, { "epoch": 0.15, "learning_rate": 4.803661329858119e-06, "loss": 0.9576, "step": 8120 }, { "epoch": 0.15, "learning_rate": 4.80360198187552e-06, "loss": 0.9979, "step": 8121 }, { "epoch": 0.15, "learning_rate": 4.803542625291342e-06, "loss": 0.9623, "step": 8122 }, { "epoch": 0.15, "learning_rate": 4.803483260105806e-06, "loss": 0.9292, "step": 8123 }, { "epoch": 0.15, "learning_rate": 4.803423886319134e-06, "loss": 0.9979, "step": 8124 }, { "epoch": 0.15, "learning_rate": 4.803364503931548e-06, "loss": 0.95, "step": 8125 }, { "epoch": 0.15, "learning_rate": 4.80330511294327e-06, "loss": 0.9647, "step": 8126 }, { "epoch": 0.15, "learning_rate": 4.80324571335452e-06, "loss": 0.9101, "step": 8127 }, { "epoch": 0.15, "learning_rate": 4.803186305165523e-06, "loss": 0.8365, "step": 8128 }, { "epoch": 0.15, "learning_rate": 4.803126888376497e-06, "loss": 0.6776, "step": 8129 }, { "epoch": 0.15, "learning_rate": 4.803067462987667e-06, "loss": 0.8599, "step": 8130 }, { "epoch": 0.15, "learning_rate": 4.803008028999253e-06, "loss": 1.1533, "step": 8131 }, { "epoch": 0.15, "learning_rate": 4.8029485864114785e-06, "loss": 1.0656, "step": 8132 }, { "epoch": 0.15, "learning_rate": 4.802889135224564e-06, "loss": 0.9672, "step": 8133 }, { "epoch": 0.15, "learning_rate": 4.802829675438733e-06, "loss": 0.9002, "step": 8134 }, { "epoch": 0.15, "learning_rate": 4.802770207054206e-06, "loss": 0.7479, "step": 8135 }, { "epoch": 0.15, "learning_rate": 4.802710730071205e-06, "loss": 0.8675, "step": 8136 }, { "epoch": 0.15, "learning_rate": 4.802651244489953e-06, "loss": 1.3878, "step": 8137 }, { "epoch": 0.15, "learning_rate": 4.8025917503106725e-06, "loss": 0.9824, "step": 8138 }, { "epoch": 0.15, "learning_rate": 4.802532247533584e-06, "loss": 1.0031, "step": 8139 }, { "epoch": 0.15, "learning_rate": 4.802472736158912e-06, "loss": 1.104, "step": 8140 }, { "epoch": 0.15, "learning_rate": 4.802413216186876e-06, "loss": 0.9641, "step": 8141 }, { "epoch": 0.15, "learning_rate": 4.8023536876177015e-06, "loss": 0.7851, "step": 8142 }, { "epoch": 0.15, "learning_rate": 4.802294150451607e-06, "loss": 1.1205, "step": 8143 }, { "epoch": 0.15, "learning_rate": 4.802234604688818e-06, "loss": 1.2119, "step": 8144 }, { "epoch": 0.15, "learning_rate": 4.802175050329555e-06, "loss": 1.0494, "step": 8145 }, { "epoch": 0.15, "learning_rate": 4.802115487374041e-06, "loss": 1.0033, "step": 8146 }, { "epoch": 0.15, "learning_rate": 4.802055915822499e-06, "loss": 0.9433, "step": 8147 }, { "epoch": 0.15, "learning_rate": 4.8019963356751495e-06, "loss": 1.0659, "step": 8148 }, { "epoch": 0.15, "learning_rate": 4.801936746932217e-06, "loss": 0.9253, "step": 8149 }, { "epoch": 0.15, "learning_rate": 4.801877149593923e-06, "loss": 1.1546, "step": 8150 }, { "epoch": 0.15, "learning_rate": 4.801817543660491e-06, "loss": 1.0394, "step": 8151 }, { "epoch": 0.15, "learning_rate": 4.801757929132143e-06, "loss": 0.9136, "step": 8152 }, { "epoch": 0.15, "learning_rate": 4.8016983060091e-06, "loss": 1.0548, "step": 8153 }, { "epoch": 0.15, "learning_rate": 4.801638674291588e-06, "loss": 0.9866, "step": 8154 }, { "epoch": 0.15, "learning_rate": 4.801579033979826e-06, "loss": 1.095, "step": 8155 }, { "epoch": 0.15, "learning_rate": 4.801519385074039e-06, "loss": 1.2366, "step": 8156 }, { "epoch": 0.15, "learning_rate": 4.80145972757445e-06, "loss": 1.1323, "step": 8157 }, { "epoch": 0.15, "learning_rate": 4.8014000614812795e-06, "loss": 1.0584, "step": 8158 }, { "epoch": 0.15, "learning_rate": 4.801340386794753e-06, "loss": 0.8907, "step": 8159 }, { "epoch": 0.15, "learning_rate": 4.801280703515092e-06, "loss": 0.8203, "step": 8160 }, { "epoch": 0.15, "learning_rate": 4.8012210116425185e-06, "loss": 0.649, "step": 8161 }, { "epoch": 0.15, "learning_rate": 4.801161311177257e-06, "loss": 0.9666, "step": 8162 }, { "epoch": 0.15, "learning_rate": 4.801101602119529e-06, "loss": 0.9339, "step": 8163 }, { "epoch": 0.15, "learning_rate": 4.80104188446956e-06, "loss": 0.9821, "step": 8164 }, { "epoch": 0.15, "learning_rate": 4.800982158227569e-06, "loss": 0.827, "step": 8165 }, { "epoch": 0.15, "learning_rate": 4.800922423393782e-06, "loss": 0.8755, "step": 8166 }, { "epoch": 0.15, "learning_rate": 4.800862679968421e-06, "loss": 0.874, "step": 8167 }, { "epoch": 0.15, "learning_rate": 4.80080292795171e-06, "loss": 0.9373, "step": 8168 }, { "epoch": 0.15, "learning_rate": 4.800743167343871e-06, "loss": 0.9521, "step": 8169 }, { "epoch": 0.15, "learning_rate": 4.800683398145127e-06, "loss": 0.8093, "step": 8170 }, { "epoch": 0.15, "learning_rate": 4.800623620355702e-06, "loss": 1.0256, "step": 8171 }, { "epoch": 0.15, "learning_rate": 4.80056383397582e-06, "loss": 1.0393, "step": 8172 }, { "epoch": 0.15, "learning_rate": 4.800504039005702e-06, "loss": 0.9498, "step": 8173 }, { "epoch": 0.15, "learning_rate": 4.800444235445573e-06, "loss": 0.9178, "step": 8174 }, { "epoch": 0.15, "learning_rate": 4.800384423295656e-06, "loss": 0.9769, "step": 8175 }, { "epoch": 0.15, "learning_rate": 4.800324602556173e-06, "loss": 0.9311, "step": 8176 }, { "epoch": 0.15, "learning_rate": 4.800264773227349e-06, "loss": 0.8924, "step": 8177 }, { "epoch": 0.15, "learning_rate": 4.800204935309407e-06, "loss": 0.9913, "step": 8178 }, { "epoch": 0.15, "learning_rate": 4.8001450888025706e-06, "loss": 1.0964, "step": 8179 }, { "epoch": 0.15, "learning_rate": 4.8000852337070626e-06, "loss": 1.0711, "step": 8180 }, { "epoch": 0.15, "learning_rate": 4.800025370023107e-06, "loss": 0.9946, "step": 8181 }, { "epoch": 0.15, "learning_rate": 4.799965497750927e-06, "loss": 1.0509, "step": 8182 }, { "epoch": 0.15, "learning_rate": 4.799905616890746e-06, "loss": 1.0355, "step": 8183 }, { "epoch": 0.15, "learning_rate": 4.799845727442789e-06, "loss": 0.7987, "step": 8184 }, { "epoch": 0.15, "learning_rate": 4.7997858294072775e-06, "loss": 0.8729, "step": 8185 }, { "epoch": 0.15, "learning_rate": 4.799725922784437e-06, "loss": 1.2029, "step": 8186 }, { "epoch": 0.15, "learning_rate": 4.79966600757449e-06, "loss": 1.1072, "step": 8187 }, { "epoch": 0.15, "learning_rate": 4.79960608377766e-06, "loss": 1.139, "step": 8188 }, { "epoch": 0.15, "learning_rate": 4.7995461513941725e-06, "loss": 0.972, "step": 8189 }, { "epoch": 0.15, "learning_rate": 4.79948621042425e-06, "loss": 1.0992, "step": 8190 }, { "epoch": 0.15, "learning_rate": 4.7994262608681166e-06, "loss": 0.9811, "step": 8191 }, { "epoch": 0.15, "learning_rate": 4.7993663027259954e-06, "loss": 1.0438, "step": 8192 }, { "epoch": 0.15, "learning_rate": 4.799306335998112e-06, "loss": 1.1678, "step": 8193 }, { "epoch": 0.15, "learning_rate": 4.799246360684688e-06, "loss": 0.8627, "step": 8194 }, { "epoch": 0.15, "learning_rate": 4.7991863767859494e-06, "loss": 0.8663, "step": 8195 }, { "epoch": 0.15, "learning_rate": 4.799126384302118e-06, "loss": 0.8191, "step": 8196 }, { "epoch": 0.15, "learning_rate": 4.799066383233421e-06, "loss": 0.731, "step": 8197 }, { "epoch": 0.15, "learning_rate": 4.79900637358008e-06, "loss": 0.8987, "step": 8198 }, { "epoch": 0.15, "learning_rate": 4.7989463553423195e-06, "loss": 1.1822, "step": 8199 }, { "epoch": 0.15, "learning_rate": 4.798886328520363e-06, "loss": 1.0605, "step": 8200 }, { "epoch": 0.15, "learning_rate": 4.798826293114437e-06, "loss": 0.8823, "step": 8201 }, { "epoch": 0.15, "learning_rate": 4.798766249124763e-06, "loss": 0.9905, "step": 8202 }, { "epoch": 0.15, "learning_rate": 4.798706196551567e-06, "loss": 0.7864, "step": 8203 }, { "epoch": 0.15, "learning_rate": 4.798646135395072e-06, "loss": 0.8223, "step": 8204 }, { "epoch": 0.15, "learning_rate": 4.798586065655503e-06, "loss": 0.9055, "step": 8205 }, { "epoch": 0.15, "learning_rate": 4.798525987333085e-06, "loss": 1.072, "step": 8206 }, { "epoch": 0.15, "learning_rate": 4.79846590042804e-06, "loss": 0.9047, "step": 8207 }, { "epoch": 0.15, "learning_rate": 4.7984058049405945e-06, "loss": 0.9278, "step": 8208 }, { "epoch": 0.15, "learning_rate": 4.798345700870972e-06, "loss": 0.9575, "step": 8209 }, { "epoch": 0.15, "learning_rate": 4.798285588219397e-06, "loss": 0.9351, "step": 8210 }, { "epoch": 0.15, "learning_rate": 4.7982254669860945e-06, "loss": 0.8174, "step": 8211 }, { "epoch": 0.15, "learning_rate": 4.798165337171289e-06, "loss": 0.8999, "step": 8212 }, { "epoch": 0.15, "learning_rate": 4.798105198775203e-06, "loss": 1.0476, "step": 8213 }, { "epoch": 0.15, "learning_rate": 4.798045051798064e-06, "loss": 0.9437, "step": 8214 }, { "epoch": 0.15, "learning_rate": 4.797984896240094e-06, "loss": 0.7589, "step": 8215 }, { "epoch": 0.16, "learning_rate": 4.79792473210152e-06, "loss": 0.9164, "step": 8216 }, { "epoch": 0.16, "learning_rate": 4.797864559382566e-06, "loss": 0.8471, "step": 8217 }, { "epoch": 0.16, "learning_rate": 4.797804378083455e-06, "loss": 0.8175, "step": 8218 }, { "epoch": 0.16, "learning_rate": 4.797744188204413e-06, "loss": 1.1817, "step": 8219 }, { "epoch": 0.16, "learning_rate": 4.797683989745665e-06, "loss": 1.0363, "step": 8220 }, { "epoch": 0.16, "learning_rate": 4.797623782707436e-06, "loss": 0.8861, "step": 8221 }, { "epoch": 0.16, "learning_rate": 4.797563567089949e-06, "loss": 0.9025, "step": 8222 }, { "epoch": 0.16, "learning_rate": 4.797503342893431e-06, "loss": 1.0029, "step": 8223 }, { "epoch": 0.16, "learning_rate": 4.797443110118105e-06, "loss": 1.0991, "step": 8224 }, { "epoch": 0.16, "learning_rate": 4.7973828687641975e-06, "loss": 1.2934, "step": 8225 }, { "epoch": 0.16, "learning_rate": 4.797322618831933e-06, "loss": 0.8799, "step": 8226 }, { "epoch": 0.16, "learning_rate": 4.797262360321536e-06, "loss": 0.8753, "step": 8227 }, { "epoch": 0.16, "learning_rate": 4.797202093233232e-06, "loss": 0.9343, "step": 8228 }, { "epoch": 0.16, "learning_rate": 4.797141817567246e-06, "loss": 0.8223, "step": 8229 }, { "epoch": 0.16, "learning_rate": 4.797081533323802e-06, "loss": 1.0578, "step": 8230 }, { "epoch": 0.16, "learning_rate": 4.7970212405031265e-06, "loss": 1.0479, "step": 8231 }, { "epoch": 0.16, "learning_rate": 4.796960939105445e-06, "loss": 0.8839, "step": 8232 }, { "epoch": 0.16, "learning_rate": 4.79690062913098e-06, "loss": 1.0374, "step": 8233 }, { "epoch": 0.16, "learning_rate": 4.7968403105799595e-06, "loss": 0.9303, "step": 8234 }, { "epoch": 0.16, "learning_rate": 4.796779983452608e-06, "loss": 0.9563, "step": 8235 }, { "epoch": 0.16, "learning_rate": 4.796719647749151e-06, "loss": 0.9195, "step": 8236 }, { "epoch": 0.16, "learning_rate": 4.7966593034698115e-06, "loss": 1.0864, "step": 8237 }, { "epoch": 0.16, "learning_rate": 4.796598950614818e-06, "loss": 0.9773, "step": 8238 }, { "epoch": 0.16, "learning_rate": 4.796538589184394e-06, "loss": 0.864, "step": 8239 }, { "epoch": 0.16, "learning_rate": 4.796478219178765e-06, "loss": 0.9908, "step": 8240 }, { "epoch": 0.16, "learning_rate": 4.796417840598157e-06, "loss": 0.983, "step": 8241 }, { "epoch": 0.16, "learning_rate": 4.796357453442795e-06, "loss": 0.7454, "step": 8242 }, { "epoch": 0.16, "learning_rate": 4.796297057712904e-06, "loss": 1.1282, "step": 8243 }, { "epoch": 0.16, "learning_rate": 4.796236653408712e-06, "loss": 1.0424, "step": 8244 }, { "epoch": 0.16, "learning_rate": 4.796176240530441e-06, "loss": 0.9161, "step": 8245 }, { "epoch": 0.16, "learning_rate": 4.79611581907832e-06, "loss": 0.9054, "step": 8246 }, { "epoch": 0.16, "learning_rate": 4.7960553890525715e-06, "loss": 1.0847, "step": 8247 }, { "epoch": 0.16, "learning_rate": 4.7959949504534235e-06, "loss": 0.8879, "step": 8248 }, { "epoch": 0.16, "learning_rate": 4.7959345032811e-06, "loss": 1.1474, "step": 8249 }, { "epoch": 0.16, "learning_rate": 4.795874047535828e-06, "loss": 0.8839, "step": 8250 }, { "epoch": 0.16, "learning_rate": 4.795813583217832e-06, "loss": 1.0726, "step": 8251 }, { "epoch": 0.16, "learning_rate": 4.7957531103273395e-06, "loss": 0.836, "step": 8252 }, { "epoch": 0.16, "learning_rate": 4.795692628864575e-06, "loss": 1.0245, "step": 8253 }, { "epoch": 0.16, "learning_rate": 4.795632138829764e-06, "loss": 0.807, "step": 8254 }, { "epoch": 0.16, "learning_rate": 4.795571640223133e-06, "loss": 0.846, "step": 8255 }, { "epoch": 0.16, "learning_rate": 4.7955111330449085e-06, "loss": 0.9629, "step": 8256 }, { "epoch": 0.16, "learning_rate": 4.7954506172953155e-06, "loss": 0.9849, "step": 8257 }, { "epoch": 0.16, "learning_rate": 4.79539009297458e-06, "loss": 0.8909, "step": 8258 }, { "epoch": 0.16, "learning_rate": 4.795329560082929e-06, "loss": 1.1993, "step": 8259 }, { "epoch": 0.16, "learning_rate": 4.795269018620587e-06, "loss": 0.8547, "step": 8260 }, { "epoch": 0.16, "learning_rate": 4.795208468587781e-06, "loss": 0.8682, "step": 8261 }, { "epoch": 0.16, "learning_rate": 4.795147909984738e-06, "loss": 1.0369, "step": 8262 }, { "epoch": 0.16, "learning_rate": 4.795087342811682e-06, "loss": 1.1516, "step": 8263 }, { "epoch": 0.16, "learning_rate": 4.79502676706884e-06, "loss": 0.8917, "step": 8264 }, { "epoch": 0.16, "learning_rate": 4.794966182756439e-06, "loss": 0.8948, "step": 8265 }, { "epoch": 0.16, "learning_rate": 4.794905589874704e-06, "loss": 0.9088, "step": 8266 }, { "epoch": 0.16, "learning_rate": 4.794844988423863e-06, "loss": 0.915, "step": 8267 }, { "epoch": 0.16, "learning_rate": 4.794784378404141e-06, "loss": 1.1021, "step": 8268 }, { "epoch": 0.16, "learning_rate": 4.794723759815763e-06, "loss": 1.0753, "step": 8269 }, { "epoch": 0.16, "learning_rate": 4.794663132658959e-06, "loss": 1.0576, "step": 8270 }, { "epoch": 0.16, "learning_rate": 4.794602496933952e-06, "loss": 0.8657, "step": 8271 }, { "epoch": 0.16, "learning_rate": 4.7945418526409695e-06, "loss": 0.985, "step": 8272 }, { "epoch": 0.16, "learning_rate": 4.794481199780238e-06, "loss": 1.0004, "step": 8273 }, { "epoch": 0.16, "learning_rate": 4.7944205383519845e-06, "loss": 0.7657, "step": 8274 }, { "epoch": 0.16, "learning_rate": 4.794359868356436e-06, "loss": 0.9588, "step": 8275 }, { "epoch": 0.16, "learning_rate": 4.794299189793816e-06, "loss": 0.9645, "step": 8276 }, { "epoch": 0.16, "learning_rate": 4.794238502664355e-06, "loss": 0.7759, "step": 8277 }, { "epoch": 0.16, "learning_rate": 4.794177806968276e-06, "loss": 0.9735, "step": 8278 }, { "epoch": 0.16, "learning_rate": 4.794117102705809e-06, "loss": 1.0375, "step": 8279 }, { "epoch": 0.16, "learning_rate": 4.7940563898771785e-06, "loss": 0.7911, "step": 8280 }, { "epoch": 0.16, "learning_rate": 4.7939956684826116e-06, "loss": 1.2777, "step": 8281 }, { "epoch": 0.16, "learning_rate": 4.793934938522336e-06, "loss": 1.1469, "step": 8282 }, { "epoch": 0.16, "learning_rate": 4.793874199996577e-06, "loss": 0.9207, "step": 8283 }, { "epoch": 0.16, "learning_rate": 4.793813452905561e-06, "loss": 0.9898, "step": 8284 }, { "epoch": 0.16, "learning_rate": 4.793752697249518e-06, "loss": 0.9662, "step": 8285 }, { "epoch": 0.16, "learning_rate": 4.793691933028671e-06, "loss": 1.1669, "step": 8286 }, { "epoch": 0.16, "learning_rate": 4.79363116024325e-06, "loss": 1.0822, "step": 8287 }, { "epoch": 0.16, "learning_rate": 4.793570378893479e-06, "loss": 1.1045, "step": 8288 }, { "epoch": 0.16, "learning_rate": 4.793509588979588e-06, "loss": 0.9357, "step": 8289 }, { "epoch": 0.16, "learning_rate": 4.7934487905018025e-06, "loss": 1.0933, "step": 8290 }, { "epoch": 0.16, "learning_rate": 4.7933879834603495e-06, "loss": 0.9885, "step": 8291 }, { "epoch": 0.16, "learning_rate": 4.793327167855455e-06, "loss": 0.8777, "step": 8292 }, { "epoch": 0.16, "learning_rate": 4.793266343687348e-06, "loss": 1.1868, "step": 8293 }, { "epoch": 0.16, "learning_rate": 4.7932055109562544e-06, "loss": 1.1068, "step": 8294 }, { "epoch": 0.16, "learning_rate": 4.793144669662402e-06, "loss": 0.9683, "step": 8295 }, { "epoch": 0.16, "learning_rate": 4.793083819806018e-06, "loss": 0.9685, "step": 8296 }, { "epoch": 0.16, "learning_rate": 4.793022961387329e-06, "loss": 0.8334, "step": 8297 }, { "epoch": 0.16, "learning_rate": 4.792962094406563e-06, "loss": 1.048, "step": 8298 }, { "epoch": 0.16, "learning_rate": 4.792901218863946e-06, "loss": 1.2577, "step": 8299 }, { "epoch": 0.16, "learning_rate": 4.7928403347597065e-06, "loss": 1.1876, "step": 8300 }, { "epoch": 0.16, "learning_rate": 4.792779442094071e-06, "loss": 1.0741, "step": 8301 }, { "epoch": 0.16, "learning_rate": 4.792718540867268e-06, "loss": 0.9551, "step": 8302 }, { "epoch": 0.16, "learning_rate": 4.7926576310795246e-06, "loss": 1.0241, "step": 8303 }, { "epoch": 0.16, "learning_rate": 4.792596712731067e-06, "loss": 0.8574, "step": 8304 }, { "epoch": 0.16, "learning_rate": 4.792535785822124e-06, "loss": 0.903, "step": 8305 }, { "epoch": 0.16, "learning_rate": 4.7924748503529225e-06, "loss": 0.9408, "step": 8306 }, { "epoch": 0.16, "learning_rate": 4.7924139063236906e-06, "loss": 1.0033, "step": 8307 }, { "epoch": 0.16, "learning_rate": 4.792352953734655e-06, "loss": 0.8916, "step": 8308 }, { "epoch": 0.16, "learning_rate": 4.792291992586045e-06, "loss": 0.8352, "step": 8309 }, { "epoch": 0.16, "learning_rate": 4.792231022878086e-06, "loss": 0.926, "step": 8310 }, { "epoch": 0.16, "learning_rate": 4.792170044611005e-06, "loss": 0.9539, "step": 8311 }, { "epoch": 0.16, "learning_rate": 4.792109057785034e-06, "loss": 1.0863, "step": 8312 }, { "epoch": 0.16, "learning_rate": 4.792048062400397e-06, "loss": 0.838, "step": 8313 }, { "epoch": 0.16, "learning_rate": 4.791987058457323e-06, "loss": 0.9811, "step": 8314 }, { "epoch": 0.16, "learning_rate": 4.7919260459560395e-06, "loss": 0.8802, "step": 8315 }, { "epoch": 0.16, "learning_rate": 4.791865024896773e-06, "loss": 1.1928, "step": 8316 }, { "epoch": 0.16, "learning_rate": 4.7918039952797544e-06, "loss": 0.866, "step": 8317 }, { "epoch": 0.16, "learning_rate": 4.79174295710521e-06, "loss": 1.0259, "step": 8318 }, { "epoch": 0.16, "learning_rate": 4.791681910373368e-06, "loss": 1.0671, "step": 8319 }, { "epoch": 0.16, "learning_rate": 4.791620855084454e-06, "loss": 1.0348, "step": 8320 }, { "epoch": 0.16, "learning_rate": 4.7915597912387e-06, "loss": 0.8518, "step": 8321 }, { "epoch": 0.16, "learning_rate": 4.791498718836332e-06, "loss": 1.0269, "step": 8322 }, { "epoch": 0.16, "learning_rate": 4.7914376378775766e-06, "loss": 0.6823, "step": 8323 }, { "epoch": 0.16, "learning_rate": 4.7913765483626635e-06, "loss": 1.1572, "step": 8324 }, { "epoch": 0.16, "learning_rate": 4.7913154502918224e-06, "loss": 1.311, "step": 8325 }, { "epoch": 0.16, "learning_rate": 4.791254343665278e-06, "loss": 1.0693, "step": 8326 }, { "epoch": 0.16, "learning_rate": 4.791193228483261e-06, "loss": 0.8649, "step": 8327 }, { "epoch": 0.16, "learning_rate": 4.791132104745998e-06, "loss": 0.9201, "step": 8328 }, { "epoch": 0.16, "learning_rate": 4.791070972453718e-06, "loss": 0.9933, "step": 8329 }, { "epoch": 0.16, "learning_rate": 4.79100983160665e-06, "loss": 0.9341, "step": 8330 }, { "epoch": 0.16, "learning_rate": 4.790948682205021e-06, "loss": 1.1707, "step": 8331 }, { "epoch": 0.16, "learning_rate": 4.79088752424906e-06, "loss": 0.8152, "step": 8332 }, { "epoch": 0.16, "learning_rate": 4.790826357738995e-06, "loss": 0.7648, "step": 8333 }, { "epoch": 0.16, "learning_rate": 4.790765182675055e-06, "loss": 1.0046, "step": 8334 }, { "epoch": 0.16, "learning_rate": 4.790703999057468e-06, "loss": 0.8087, "step": 8335 }, { "epoch": 0.16, "learning_rate": 4.7906428068864615e-06, "loss": 1.0301, "step": 8336 }, { "epoch": 0.16, "learning_rate": 4.790581606162266e-06, "loss": 1.1603, "step": 8337 }, { "epoch": 0.16, "learning_rate": 4.790520396885109e-06, "loss": 1.0006, "step": 8338 }, { "epoch": 0.16, "learning_rate": 4.790459179055219e-06, "loss": 0.8899, "step": 8339 }, { "epoch": 0.16, "learning_rate": 4.790397952672825e-06, "loss": 0.8991, "step": 8340 }, { "epoch": 0.16, "learning_rate": 4.790336717738154e-06, "loss": 0.8965, "step": 8341 }, { "epoch": 0.16, "learning_rate": 4.790275474251437e-06, "loss": 0.9339, "step": 8342 }, { "epoch": 0.16, "learning_rate": 4.790214222212901e-06, "loss": 0.9477, "step": 8343 }, { "epoch": 0.16, "learning_rate": 4.790152961622776e-06, "loss": 1.0786, "step": 8344 }, { "epoch": 0.16, "learning_rate": 4.79009169248129e-06, "loss": 0.9164, "step": 8345 }, { "epoch": 0.16, "learning_rate": 4.790030414788671e-06, "loss": 0.6695, "step": 8346 }, { "epoch": 0.16, "learning_rate": 4.78996912854515e-06, "loss": 0.8724, "step": 8347 }, { "epoch": 0.16, "learning_rate": 4.789907833750953e-06, "loss": 0.808, "step": 8348 }, { "epoch": 0.16, "learning_rate": 4.789846530406311e-06, "loss": 1.0032, "step": 8349 }, { "epoch": 0.16, "learning_rate": 4.789785218511453e-06, "loss": 1.0003, "step": 8350 }, { "epoch": 0.16, "learning_rate": 4.789723898066606e-06, "loss": 0.8725, "step": 8351 }, { "epoch": 0.16, "learning_rate": 4.789662569072001e-06, "loss": 0.8174, "step": 8352 }, { "epoch": 0.16, "learning_rate": 4.789601231527866e-06, "loss": 0.9999, "step": 8353 }, { "epoch": 0.16, "learning_rate": 4.78953988543443e-06, "loss": 1.0073, "step": 8354 }, { "epoch": 0.16, "learning_rate": 4.789478530791922e-06, "loss": 1.1176, "step": 8355 }, { "epoch": 0.16, "learning_rate": 4.789417167600572e-06, "loss": 1.0521, "step": 8356 }, { "epoch": 0.16, "learning_rate": 4.789355795860608e-06, "loss": 0.9273, "step": 8357 }, { "epoch": 0.16, "learning_rate": 4.7892944155722595e-06, "loss": 0.9359, "step": 8358 }, { "epoch": 0.16, "learning_rate": 4.7892330267357565e-06, "loss": 1.0183, "step": 8359 }, { "epoch": 0.16, "learning_rate": 4.7891716293513265e-06, "loss": 0.759, "step": 8360 }, { "epoch": 0.16, "learning_rate": 4.789110223419201e-06, "loss": 1.0161, "step": 8361 }, { "epoch": 0.16, "learning_rate": 4.789048808939608e-06, "loss": 0.9419, "step": 8362 }, { "epoch": 0.16, "learning_rate": 4.788987385912777e-06, "loss": 1.0017, "step": 8363 }, { "epoch": 0.16, "learning_rate": 4.788925954338936e-06, "loss": 1.0221, "step": 8364 }, { "epoch": 0.16, "learning_rate": 4.788864514218317e-06, "loss": 1.0209, "step": 8365 }, { "epoch": 0.16, "learning_rate": 4.788803065551148e-06, "loss": 0.7447, "step": 8366 }, { "epoch": 0.16, "learning_rate": 4.7887416083376576e-06, "loss": 0.9425, "step": 8367 }, { "epoch": 0.16, "learning_rate": 4.788680142578077e-06, "loss": 0.9327, "step": 8368 }, { "epoch": 0.16, "learning_rate": 4.788618668272634e-06, "loss": 0.9348, "step": 8369 }, { "epoch": 0.16, "learning_rate": 4.78855718542156e-06, "loss": 1.1089, "step": 8370 }, { "epoch": 0.16, "learning_rate": 4.788495694025084e-06, "loss": 0.9644, "step": 8371 }, { "epoch": 0.16, "learning_rate": 4.7884341940834335e-06, "loss": 0.8289, "step": 8372 }, { "epoch": 0.16, "learning_rate": 4.788372685596842e-06, "loss": 1.0348, "step": 8373 }, { "epoch": 0.16, "learning_rate": 4.788311168565536e-06, "loss": 0.9868, "step": 8374 }, { "epoch": 0.16, "learning_rate": 4.788249642989747e-06, "loss": 1.3252, "step": 8375 }, { "epoch": 0.16, "learning_rate": 4.788188108869703e-06, "loss": 1.0833, "step": 8376 }, { "epoch": 0.16, "learning_rate": 4.788126566205634e-06, "loss": 0.8299, "step": 8377 }, { "epoch": 0.16, "learning_rate": 4.788065014997772e-06, "loss": 0.7662, "step": 8378 }, { "epoch": 0.16, "learning_rate": 4.788003455246345e-06, "loss": 0.838, "step": 8379 }, { "epoch": 0.16, "learning_rate": 4.787941886951584e-06, "loss": 1.0245, "step": 8380 }, { "epoch": 0.16, "learning_rate": 4.787880310113717e-06, "loss": 1.1165, "step": 8381 }, { "epoch": 0.16, "learning_rate": 4.787818724732976e-06, "loss": 0.8813, "step": 8382 }, { "epoch": 0.16, "learning_rate": 4.7877571308095884e-06, "loss": 0.8214, "step": 8383 }, { "epoch": 0.16, "learning_rate": 4.787695528343788e-06, "loss": 0.9086, "step": 8384 }, { "epoch": 0.16, "learning_rate": 4.787633917335801e-06, "loss": 0.9836, "step": 8385 }, { "epoch": 0.16, "learning_rate": 4.78757229778586e-06, "loss": 0.9634, "step": 8386 }, { "epoch": 0.16, "learning_rate": 4.7875106696941934e-06, "loss": 1.1282, "step": 8387 }, { "epoch": 0.16, "learning_rate": 4.7874490330610325e-06, "loss": 1.1372, "step": 8388 }, { "epoch": 0.16, "learning_rate": 4.787387387886607e-06, "loss": 0.8314, "step": 8389 }, { "epoch": 0.16, "learning_rate": 4.7873257341711475e-06, "loss": 0.9678, "step": 8390 }, { "epoch": 0.16, "learning_rate": 4.787264071914883e-06, "loss": 0.8393, "step": 8391 }, { "epoch": 0.16, "learning_rate": 4.787202401118045e-06, "loss": 0.9467, "step": 8392 }, { "epoch": 0.16, "learning_rate": 4.787140721780864e-06, "loss": 1.0228, "step": 8393 }, { "epoch": 0.16, "learning_rate": 4.787079033903569e-06, "loss": 0.9894, "step": 8394 }, { "epoch": 0.16, "learning_rate": 4.7870173374863915e-06, "loss": 0.8329, "step": 8395 }, { "epoch": 0.16, "learning_rate": 4.786955632529561e-06, "loss": 0.8517, "step": 8396 }, { "epoch": 0.16, "learning_rate": 4.786893919033308e-06, "loss": 0.8927, "step": 8397 }, { "epoch": 0.16, "learning_rate": 4.786832196997864e-06, "loss": 0.8371, "step": 8398 }, { "epoch": 0.16, "learning_rate": 4.786770466423458e-06, "loss": 0.9645, "step": 8399 }, { "epoch": 0.16, "learning_rate": 4.786708727310321e-06, "loss": 1.2211, "step": 8400 }, { "epoch": 0.16, "learning_rate": 4.7866469796586845e-06, "loss": 0.9237, "step": 8401 }, { "epoch": 0.16, "learning_rate": 4.786585223468778e-06, "loss": 1.0266, "step": 8402 }, { "epoch": 0.16, "learning_rate": 4.786523458740833e-06, "loss": 1.0168, "step": 8403 }, { "epoch": 0.16, "learning_rate": 4.786461685475078e-06, "loss": 0.8815, "step": 8404 }, { "epoch": 0.16, "learning_rate": 4.786399903671746e-06, "loss": 1.1574, "step": 8405 }, { "epoch": 0.16, "learning_rate": 4.786338113331067e-06, "loss": 0.9867, "step": 8406 }, { "epoch": 0.16, "learning_rate": 4.786276314453272e-06, "loss": 1.1139, "step": 8407 }, { "epoch": 0.16, "learning_rate": 4.78621450703859e-06, "loss": 0.9395, "step": 8408 }, { "epoch": 0.16, "learning_rate": 4.786152691087255e-06, "loss": 1.1563, "step": 8409 }, { "epoch": 0.16, "learning_rate": 4.786090866599495e-06, "loss": 0.9451, "step": 8410 }, { "epoch": 0.16, "learning_rate": 4.786029033575541e-06, "loss": 1.0516, "step": 8411 }, { "epoch": 0.16, "learning_rate": 4.785967192015625e-06, "loss": 1.0492, "step": 8412 }, { "epoch": 0.16, "learning_rate": 4.7859053419199786e-06, "loss": 0.983, "step": 8413 }, { "epoch": 0.16, "learning_rate": 4.785843483288831e-06, "loss": 0.7492, "step": 8414 }, { "epoch": 0.16, "learning_rate": 4.785781616122413e-06, "loss": 1.0496, "step": 8415 }, { "epoch": 0.16, "learning_rate": 4.785719740420959e-06, "loss": 0.8599, "step": 8416 }, { "epoch": 0.16, "learning_rate": 4.785657856184696e-06, "loss": 1.0062, "step": 8417 }, { "epoch": 0.16, "learning_rate": 4.785595963413856e-06, "loss": 0.9302, "step": 8418 }, { "epoch": 0.16, "learning_rate": 4.785534062108672e-06, "loss": 1.1812, "step": 8419 }, { "epoch": 0.16, "learning_rate": 4.785472152269373e-06, "loss": 1.0314, "step": 8420 }, { "epoch": 0.16, "learning_rate": 4.7854102338961915e-06, "loss": 0.8621, "step": 8421 }, { "epoch": 0.16, "learning_rate": 4.785348306989358e-06, "loss": 0.9154, "step": 8422 }, { "epoch": 0.16, "learning_rate": 4.785286371549105e-06, "loss": 0.9675, "step": 8423 }, { "epoch": 0.16, "learning_rate": 4.7852244275756615e-06, "loss": 1.0215, "step": 8424 }, { "epoch": 0.16, "learning_rate": 4.78516247506926e-06, "loss": 1.1455, "step": 8425 }, { "epoch": 0.16, "learning_rate": 4.785100514030133e-06, "loss": 1.0027, "step": 8426 }, { "epoch": 0.16, "learning_rate": 4.78503854445851e-06, "loss": 0.7981, "step": 8427 }, { "epoch": 0.16, "learning_rate": 4.784976566354623e-06, "loss": 0.9163, "step": 8428 }, { "epoch": 0.16, "learning_rate": 4.784914579718704e-06, "loss": 0.8171, "step": 8429 }, { "epoch": 0.16, "learning_rate": 4.784852584550984e-06, "loss": 0.8954, "step": 8430 }, { "epoch": 0.16, "learning_rate": 4.784790580851695e-06, "loss": 1.0931, "step": 8431 }, { "epoch": 0.16, "learning_rate": 4.784728568621067e-06, "loss": 1.1337, "step": 8432 }, { "epoch": 0.16, "learning_rate": 4.784666547859333e-06, "loss": 1.0606, "step": 8433 }, { "epoch": 0.16, "learning_rate": 4.784604518566725e-06, "loss": 0.8137, "step": 8434 }, { "epoch": 0.16, "learning_rate": 4.784542480743472e-06, "loss": 0.7436, "step": 8435 }, { "epoch": 0.16, "learning_rate": 4.7844804343898084e-06, "loss": 0.8748, "step": 8436 }, { "epoch": 0.16, "learning_rate": 4.784418379505965e-06, "loss": 1.1135, "step": 8437 }, { "epoch": 0.16, "learning_rate": 4.784356316092173e-06, "loss": 0.8733, "step": 8438 }, { "epoch": 0.16, "learning_rate": 4.784294244148665e-06, "loss": 1.0147, "step": 8439 }, { "epoch": 0.16, "learning_rate": 4.784232163675672e-06, "loss": 0.7892, "step": 8440 }, { "epoch": 0.16, "learning_rate": 4.784170074673426e-06, "loss": 0.9887, "step": 8441 }, { "epoch": 0.16, "learning_rate": 4.784107977142159e-06, "loss": 0.6624, "step": 8442 }, { "epoch": 0.16, "learning_rate": 4.784045871082103e-06, "loss": 0.9696, "step": 8443 }, { "epoch": 0.16, "learning_rate": 4.78398375649349e-06, "loss": 1.1536, "step": 8444 }, { "epoch": 0.16, "learning_rate": 4.783921633376551e-06, "loss": 0.862, "step": 8445 }, { "epoch": 0.16, "learning_rate": 4.78385950173152e-06, "loss": 0.8217, "step": 8446 }, { "epoch": 0.16, "learning_rate": 4.783797361558627e-06, "loss": 0.9549, "step": 8447 }, { "epoch": 0.16, "learning_rate": 4.783735212858104e-06, "loss": 0.9074, "step": 8448 }, { "epoch": 0.16, "learning_rate": 4.783673055630185e-06, "loss": 1.0427, "step": 8449 }, { "epoch": 0.16, "learning_rate": 4.7836108898751e-06, "loss": 1.1981, "step": 8450 }, { "epoch": 0.16, "learning_rate": 4.783548715593081e-06, "loss": 1.0381, "step": 8451 }, { "epoch": 0.16, "learning_rate": 4.7834865327843625e-06, "loss": 0.7704, "step": 8452 }, { "epoch": 0.16, "learning_rate": 4.7834243414491755e-06, "loss": 0.9365, "step": 8453 }, { "epoch": 0.16, "learning_rate": 4.783362141587751e-06, "loss": 0.9605, "step": 8454 }, { "epoch": 0.16, "learning_rate": 4.7832999332003225e-06, "loss": 1.0146, "step": 8455 }, { "epoch": 0.16, "learning_rate": 4.783237716287122e-06, "loss": 0.9859, "step": 8456 }, { "epoch": 0.16, "learning_rate": 4.783175490848383e-06, "loss": 0.9525, "step": 8457 }, { "epoch": 0.16, "learning_rate": 4.783113256884335e-06, "loss": 0.8981, "step": 8458 }, { "epoch": 0.16, "learning_rate": 4.783051014395213e-06, "loss": 0.8873, "step": 8459 }, { "epoch": 0.16, "learning_rate": 4.7829887633812485e-06, "loss": 0.8364, "step": 8460 }, { "epoch": 0.16, "learning_rate": 4.782926503842675e-06, "loss": 1.1088, "step": 8461 }, { "epoch": 0.16, "learning_rate": 4.782864235779722e-06, "loss": 1.1102, "step": 8462 }, { "epoch": 0.16, "learning_rate": 4.782801959192625e-06, "loss": 1.0974, "step": 8463 }, { "epoch": 0.16, "learning_rate": 4.7827396740816155e-06, "loss": 1.0721, "step": 8464 }, { "epoch": 0.16, "learning_rate": 4.7826773804469256e-06, "loss": 0.9551, "step": 8465 }, { "epoch": 0.16, "learning_rate": 4.782615078288789e-06, "loss": 1.0598, "step": 8466 }, { "epoch": 0.16, "learning_rate": 4.782552767607437e-06, "loss": 0.9434, "step": 8467 }, { "epoch": 0.16, "learning_rate": 4.7824904484031034e-06, "loss": 1.0891, "step": 8468 }, { "epoch": 0.16, "learning_rate": 4.78242812067602e-06, "loss": 0.8865, "step": 8469 }, { "epoch": 0.16, "learning_rate": 4.782365784426421e-06, "loss": 0.9878, "step": 8470 }, { "epoch": 0.16, "learning_rate": 4.7823034396545365e-06, "loss": 0.9479, "step": 8471 }, { "epoch": 0.16, "learning_rate": 4.782241086360601e-06, "loss": 1.0454, "step": 8472 }, { "epoch": 0.16, "learning_rate": 4.782178724544849e-06, "loss": 0.8262, "step": 8473 }, { "epoch": 0.16, "learning_rate": 4.7821163542075105e-06, "loss": 0.955, "step": 8474 }, { "epoch": 0.16, "learning_rate": 4.78205397534882e-06, "loss": 1.0412, "step": 8475 }, { "epoch": 0.16, "learning_rate": 4.781991587969009e-06, "loss": 0.8307, "step": 8476 }, { "epoch": 0.16, "learning_rate": 4.781929192068312e-06, "loss": 0.7038, "step": 8477 }, { "epoch": 0.16, "learning_rate": 4.781866787646962e-06, "loss": 1.0701, "step": 8478 }, { "epoch": 0.16, "learning_rate": 4.78180437470519e-06, "loss": 0.8328, "step": 8479 }, { "epoch": 0.16, "learning_rate": 4.781741953243232e-06, "loss": 1.0144, "step": 8480 }, { "epoch": 0.16, "learning_rate": 4.781679523261318e-06, "loss": 1.1854, "step": 8481 }, { "epoch": 0.16, "learning_rate": 4.781617084759683e-06, "loss": 1.0007, "step": 8482 }, { "epoch": 0.16, "learning_rate": 4.78155463773856e-06, "loss": 1.0499, "step": 8483 }, { "epoch": 0.16, "learning_rate": 4.7814921821981825e-06, "loss": 1.0837, "step": 8484 }, { "epoch": 0.16, "learning_rate": 4.781429718138782e-06, "loss": 0.9857, "step": 8485 }, { "epoch": 0.16, "learning_rate": 4.7813672455605945e-06, "loss": 1.1158, "step": 8486 }, { "epoch": 0.16, "learning_rate": 4.78130476446385e-06, "loss": 0.9744, "step": 8487 }, { "epoch": 0.16, "learning_rate": 4.7812422748487845e-06, "loss": 1.0741, "step": 8488 }, { "epoch": 0.16, "learning_rate": 4.78117977671563e-06, "loss": 0.8113, "step": 8489 }, { "epoch": 0.16, "learning_rate": 4.78111727006462e-06, "loss": 0.9738, "step": 8490 }, { "epoch": 0.16, "learning_rate": 4.781054754895988e-06, "loss": 0.9185, "step": 8491 }, { "epoch": 0.16, "learning_rate": 4.7809922312099675e-06, "loss": 0.9227, "step": 8492 }, { "epoch": 0.16, "learning_rate": 4.780929699006792e-06, "loss": 0.9311, "step": 8493 }, { "epoch": 0.16, "learning_rate": 4.780867158286695e-06, "loss": 1.0795, "step": 8494 }, { "epoch": 0.16, "learning_rate": 4.78080460904991e-06, "loss": 0.6816, "step": 8495 }, { "epoch": 0.16, "learning_rate": 4.780742051296671e-06, "loss": 0.7583, "step": 8496 }, { "epoch": 0.16, "learning_rate": 4.78067948502721e-06, "loss": 1.0214, "step": 8497 }, { "epoch": 0.16, "learning_rate": 4.780616910241762e-06, "loss": 1.0024, "step": 8498 }, { "epoch": 0.16, "learning_rate": 4.780554326940561e-06, "loss": 0.9845, "step": 8499 }, { "epoch": 0.16, "learning_rate": 4.78049173512384e-06, "loss": 1.3116, "step": 8500 }, { "epoch": 0.16, "learning_rate": 4.780429134791832e-06, "loss": 0.9539, "step": 8501 }, { "epoch": 0.16, "learning_rate": 4.7803665259447725e-06, "loss": 1.0027, "step": 8502 }, { "epoch": 0.16, "learning_rate": 4.780303908582894e-06, "loss": 0.945, "step": 8503 }, { "epoch": 0.16, "learning_rate": 4.780241282706431e-06, "loss": 0.7096, "step": 8504 }, { "epoch": 0.16, "learning_rate": 4.7801786483156155e-06, "loss": 0.9061, "step": 8505 }, { "epoch": 0.16, "learning_rate": 4.780116005410684e-06, "loss": 1.0844, "step": 8506 }, { "epoch": 0.16, "learning_rate": 4.7800533539918695e-06, "loss": 0.9346, "step": 8507 }, { "epoch": 0.16, "learning_rate": 4.779990694059405e-06, "loss": 0.8808, "step": 8508 }, { "epoch": 0.16, "learning_rate": 4.779928025613525e-06, "loss": 0.7847, "step": 8509 }, { "epoch": 0.16, "learning_rate": 4.779865348654464e-06, "loss": 0.8497, "step": 8510 }, { "epoch": 0.16, "learning_rate": 4.7798026631824555e-06, "loss": 1.0192, "step": 8511 }, { "epoch": 0.16, "learning_rate": 4.7797399691977345e-06, "loss": 1.0917, "step": 8512 }, { "epoch": 0.16, "learning_rate": 4.779677266700534e-06, "loss": 0.7994, "step": 8513 }, { "epoch": 0.16, "learning_rate": 4.779614555691088e-06, "loss": 0.8686, "step": 8514 }, { "epoch": 0.16, "learning_rate": 4.779551836169631e-06, "loss": 1.0647, "step": 8515 }, { "epoch": 0.16, "learning_rate": 4.779489108136398e-06, "loss": 0.7738, "step": 8516 }, { "epoch": 0.16, "learning_rate": 4.7794263715916224e-06, "loss": 0.7489, "step": 8517 }, { "epoch": 0.16, "learning_rate": 4.7793636265355395e-06, "loss": 1.1295, "step": 8518 }, { "epoch": 0.16, "learning_rate": 4.779300872968381e-06, "loss": 1.0269, "step": 8519 }, { "epoch": 0.16, "learning_rate": 4.779238110890384e-06, "loss": 0.9225, "step": 8520 }, { "epoch": 0.16, "learning_rate": 4.7791753403017816e-06, "loss": 0.6423, "step": 8521 }, { "epoch": 0.16, "learning_rate": 4.7791125612028075e-06, "loss": 1.0006, "step": 8522 }, { "epoch": 0.16, "learning_rate": 4.7790497735936984e-06, "loss": 0.9642, "step": 8523 }, { "epoch": 0.16, "learning_rate": 4.7789869774746866e-06, "loss": 0.8264, "step": 8524 }, { "epoch": 0.16, "learning_rate": 4.7789241728460065e-06, "loss": 1.273, "step": 8525 }, { "epoch": 0.16, "learning_rate": 4.7788613597078945e-06, "loss": 1.0143, "step": 8526 }, { "epoch": 0.16, "learning_rate": 4.778798538060584e-06, "loss": 0.909, "step": 8527 }, { "epoch": 0.16, "learning_rate": 4.77873570790431e-06, "loss": 0.8962, "step": 8528 }, { "epoch": 0.16, "learning_rate": 4.778672869239306e-06, "loss": 0.9436, "step": 8529 }, { "epoch": 0.16, "learning_rate": 4.778610022065807e-06, "loss": 0.9551, "step": 8530 }, { "epoch": 0.16, "learning_rate": 4.778547166384048e-06, "loss": 1.1118, "step": 8531 }, { "epoch": 0.16, "learning_rate": 4.778484302194265e-06, "loss": 0.8853, "step": 8532 }, { "epoch": 0.16, "learning_rate": 4.778421429496691e-06, "loss": 0.9693, "step": 8533 }, { "epoch": 0.16, "learning_rate": 4.778358548291561e-06, "loss": 1.0119, "step": 8534 }, { "epoch": 0.16, "learning_rate": 4.77829565857911e-06, "loss": 0.9154, "step": 8535 }, { "epoch": 0.16, "learning_rate": 4.778232760359574e-06, "loss": 0.8412, "step": 8536 }, { "epoch": 0.16, "learning_rate": 4.778169853633185e-06, "loss": 1.0632, "step": 8537 }, { "epoch": 0.16, "learning_rate": 4.77810693840018e-06, "loss": 1.1103, "step": 8538 }, { "epoch": 0.16, "learning_rate": 4.7780440146607946e-06, "loss": 0.9708, "step": 8539 }, { "epoch": 0.16, "learning_rate": 4.777981082415261e-06, "loss": 1.0873, "step": 8540 }, { "epoch": 0.16, "learning_rate": 4.777918141663817e-06, "loss": 0.9951, "step": 8541 }, { "epoch": 0.16, "learning_rate": 4.777855192406697e-06, "loss": 0.9148, "step": 8542 }, { "epoch": 0.16, "learning_rate": 4.7777922346441345e-06, "loss": 0.9554, "step": 8543 }, { "epoch": 0.16, "learning_rate": 4.777729268376365e-06, "loss": 1.0124, "step": 8544 }, { "epoch": 0.16, "learning_rate": 4.777666293603626e-06, "loss": 0.7955, "step": 8545 }, { "epoch": 0.16, "learning_rate": 4.77760331032615e-06, "loss": 0.8199, "step": 8546 }, { "epoch": 0.16, "learning_rate": 4.777540318544174e-06, "loss": 0.9858, "step": 8547 }, { "epoch": 0.16, "learning_rate": 4.7774773182579305e-06, "loss": 0.897, "step": 8548 }, { "epoch": 0.16, "learning_rate": 4.777414309467658e-06, "loss": 0.9612, "step": 8549 }, { "epoch": 0.16, "learning_rate": 4.77735129217359e-06, "loss": 0.9678, "step": 8550 }, { "epoch": 0.16, "learning_rate": 4.777288266375961e-06, "loss": 0.8616, "step": 8551 }, { "epoch": 0.16, "learning_rate": 4.777225232075009e-06, "loss": 0.9694, "step": 8552 }, { "epoch": 0.16, "learning_rate": 4.777162189270967e-06, "loss": 0.8027, "step": 8553 }, { "epoch": 0.16, "learning_rate": 4.777099137964071e-06, "loss": 0.9351, "step": 8554 }, { "epoch": 0.16, "learning_rate": 4.777036078154558e-06, "loss": 0.8568, "step": 8555 }, { "epoch": 0.16, "learning_rate": 4.7769730098426606e-06, "loss": 0.9492, "step": 8556 }, { "epoch": 0.16, "learning_rate": 4.7769099330286165e-06, "loss": 0.9182, "step": 8557 }, { "epoch": 0.16, "learning_rate": 4.7768468477126604e-06, "loss": 0.8517, "step": 8558 }, { "epoch": 0.16, "learning_rate": 4.776783753895027e-06, "loss": 0.8867, "step": 8559 }, { "epoch": 0.16, "learning_rate": 4.7767206515759544e-06, "loss": 0.8265, "step": 8560 }, { "epoch": 0.16, "learning_rate": 4.776657540755676e-06, "loss": 1.0726, "step": 8561 }, { "epoch": 0.16, "learning_rate": 4.776594421434428e-06, "loss": 0.916, "step": 8562 }, { "epoch": 0.16, "learning_rate": 4.776531293612446e-06, "loss": 1.1315, "step": 8563 }, { "epoch": 0.16, "learning_rate": 4.776468157289967e-06, "loss": 1.0367, "step": 8564 }, { "epoch": 0.16, "learning_rate": 4.776405012467225e-06, "loss": 1.114, "step": 8565 }, { "epoch": 0.16, "learning_rate": 4.776341859144456e-06, "loss": 0.9358, "step": 8566 }, { "epoch": 0.16, "learning_rate": 4.7762786973218975e-06, "loss": 0.9583, "step": 8567 }, { "epoch": 0.16, "learning_rate": 4.776215526999783e-06, "loss": 1.3057, "step": 8568 }, { "epoch": 0.16, "learning_rate": 4.77615234817835e-06, "loss": 0.9197, "step": 8569 }, { "epoch": 0.16, "learning_rate": 4.776089160857834e-06, "loss": 1.0425, "step": 8570 }, { "epoch": 0.16, "learning_rate": 4.776025965038471e-06, "loss": 0.9509, "step": 8571 }, { "epoch": 0.16, "learning_rate": 4.7759627607204965e-06, "loss": 0.918, "step": 8572 }, { "epoch": 0.16, "learning_rate": 4.775899547904147e-06, "loss": 0.8561, "step": 8573 }, { "epoch": 0.16, "learning_rate": 4.7758363265896585e-06, "loss": 1.1545, "step": 8574 }, { "epoch": 0.16, "learning_rate": 4.775773096777266e-06, "loss": 1.124, "step": 8575 }, { "epoch": 0.16, "learning_rate": 4.775709858467208e-06, "loss": 1.054, "step": 8576 }, { "epoch": 0.16, "learning_rate": 4.775646611659719e-06, "loss": 0.9336, "step": 8577 }, { "epoch": 0.16, "learning_rate": 4.7755833563550345e-06, "loss": 0.8741, "step": 8578 }, { "epoch": 0.16, "learning_rate": 4.775520092553392e-06, "loss": 0.9278, "step": 8579 }, { "epoch": 0.16, "learning_rate": 4.775456820255026e-06, "loss": 0.8129, "step": 8580 }, { "epoch": 0.16, "learning_rate": 4.775393539460176e-06, "loss": 0.9884, "step": 8581 }, { "epoch": 0.16, "learning_rate": 4.775330250169075e-06, "loss": 1.1651, "step": 8582 }, { "epoch": 0.16, "learning_rate": 4.77526695238196e-06, "loss": 0.9061, "step": 8583 }, { "epoch": 0.16, "learning_rate": 4.775203646099069e-06, "loss": 0.9296, "step": 8584 }, { "epoch": 0.16, "learning_rate": 4.775140331320638e-06, "loss": 0.8332, "step": 8585 }, { "epoch": 0.16, "learning_rate": 4.775077008046903e-06, "loss": 1.0716, "step": 8586 }, { "epoch": 0.16, "learning_rate": 4.775013676278099e-06, "loss": 0.9134, "step": 8587 }, { "epoch": 0.16, "learning_rate": 4.774950336014463e-06, "loss": 1.1024, "step": 8588 }, { "epoch": 0.16, "learning_rate": 4.7748869872562335e-06, "loss": 0.7127, "step": 8589 }, { "epoch": 0.16, "learning_rate": 4.774823630003645e-06, "loss": 1.1018, "step": 8590 }, { "epoch": 0.16, "learning_rate": 4.774760264256935e-06, "loss": 0.887, "step": 8591 }, { "epoch": 0.16, "learning_rate": 4.774696890016341e-06, "loss": 0.997, "step": 8592 }, { "epoch": 0.16, "learning_rate": 4.774633507282097e-06, "loss": 1.2182, "step": 8593 }, { "epoch": 0.16, "learning_rate": 4.774570116054442e-06, "loss": 1.1082, "step": 8594 }, { "epoch": 0.16, "learning_rate": 4.7745067163336115e-06, "loss": 0.9166, "step": 8595 }, { "epoch": 0.16, "learning_rate": 4.774443308119843e-06, "loss": 1.0267, "step": 8596 }, { "epoch": 0.16, "learning_rate": 4.774379891413373e-06, "loss": 0.7221, "step": 8597 }, { "epoch": 0.16, "learning_rate": 4.774316466214438e-06, "loss": 0.8197, "step": 8598 }, { "epoch": 0.16, "learning_rate": 4.774253032523275e-06, "loss": 1.0043, "step": 8599 }, { "epoch": 0.16, "learning_rate": 4.774189590340121e-06, "loss": 1.1406, "step": 8600 }, { "epoch": 0.16, "learning_rate": 4.774126139665213e-06, "loss": 0.9346, "step": 8601 }, { "epoch": 0.16, "learning_rate": 4.774062680498787e-06, "loss": 0.8648, "step": 8602 }, { "epoch": 0.16, "learning_rate": 4.773999212841081e-06, "loss": 0.9936, "step": 8603 }, { "epoch": 0.16, "learning_rate": 4.773935736692332e-06, "loss": 0.9564, "step": 8604 }, { "epoch": 0.16, "learning_rate": 4.773872252052777e-06, "loss": 0.9021, "step": 8605 }, { "epoch": 0.16, "learning_rate": 4.773808758922652e-06, "loss": 1.1279, "step": 8606 }, { "epoch": 0.16, "learning_rate": 4.773745257302195e-06, "loss": 0.9827, "step": 8607 }, { "epoch": 0.16, "learning_rate": 4.773681747191643e-06, "loss": 1.0266, "step": 8608 }, { "epoch": 0.16, "learning_rate": 4.773618228591233e-06, "loss": 0.9022, "step": 8609 }, { "epoch": 0.16, "learning_rate": 4.773554701501203e-06, "loss": 0.8463, "step": 8610 }, { "epoch": 0.16, "learning_rate": 4.773491165921789e-06, "loss": 0.7897, "step": 8611 }, { "epoch": 0.16, "learning_rate": 4.773427621853228e-06, "loss": 0.8923, "step": 8612 }, { "epoch": 0.16, "learning_rate": 4.773364069295758e-06, "loss": 1.056, "step": 8613 }, { "epoch": 0.16, "learning_rate": 4.773300508249617e-06, "loss": 1.027, "step": 8614 }, { "epoch": 0.16, "learning_rate": 4.773236938715041e-06, "loss": 0.9686, "step": 8615 }, { "epoch": 0.16, "learning_rate": 4.773173360692268e-06, "loss": 0.7907, "step": 8616 }, { "epoch": 0.16, "learning_rate": 4.773109774181536e-06, "loss": 1.0486, "step": 8617 }, { "epoch": 0.16, "learning_rate": 4.773046179183082e-06, "loss": 0.9348, "step": 8618 }, { "epoch": 0.16, "learning_rate": 4.772982575697143e-06, "loss": 1.0295, "step": 8619 }, { "epoch": 0.16, "learning_rate": 4.772918963723956e-06, "loss": 1.0861, "step": 8620 }, { "epoch": 0.16, "learning_rate": 4.77285534326376e-06, "loss": 0.9922, "step": 8621 }, { "epoch": 0.16, "learning_rate": 4.772791714316791e-06, "loss": 0.9529, "step": 8622 }, { "epoch": 0.16, "learning_rate": 4.772728076883288e-06, "loss": 0.8584, "step": 8623 }, { "epoch": 0.16, "learning_rate": 4.772664430963488e-06, "loss": 0.9366, "step": 8624 }, { "epoch": 0.16, "learning_rate": 4.772600776557629e-06, "loss": 1.1392, "step": 8625 }, { "epoch": 0.16, "learning_rate": 4.772537113665948e-06, "loss": 0.989, "step": 8626 }, { "epoch": 0.16, "learning_rate": 4.772473442288683e-06, "loss": 1.104, "step": 8627 }, { "epoch": 0.16, "learning_rate": 4.772409762426073e-06, "loss": 1.0433, "step": 8628 }, { "epoch": 0.16, "learning_rate": 4.772346074078353e-06, "loss": 0.9919, "step": 8629 }, { "epoch": 0.16, "learning_rate": 4.772282377245763e-06, "loss": 1.0023, "step": 8630 }, { "epoch": 0.16, "learning_rate": 4.772218671928541e-06, "loss": 1.0537, "step": 8631 }, { "epoch": 0.16, "learning_rate": 4.772154958126923e-06, "loss": 0.8528, "step": 8632 }, { "epoch": 0.16, "learning_rate": 4.772091235841149e-06, "loss": 0.8406, "step": 8633 }, { "epoch": 0.16, "learning_rate": 4.772027505071455e-06, "loss": 0.885, "step": 8634 }, { "epoch": 0.16, "learning_rate": 4.7719637658180805e-06, "loss": 0.7912, "step": 8635 }, { "epoch": 0.16, "learning_rate": 4.771900018081263e-06, "loss": 0.9649, "step": 8636 }, { "epoch": 0.16, "learning_rate": 4.771836261861241e-06, "loss": 1.0761, "step": 8637 }, { "epoch": 0.16, "learning_rate": 4.7717724971582514e-06, "loss": 0.9267, "step": 8638 }, { "epoch": 0.16, "learning_rate": 4.7717087239725336e-06, "loss": 1.0071, "step": 8639 }, { "epoch": 0.16, "learning_rate": 4.7716449423043245e-06, "loss": 1.0969, "step": 8640 }, { "epoch": 0.16, "learning_rate": 4.771581152153862e-06, "loss": 0.9272, "step": 8641 }, { "epoch": 0.16, "learning_rate": 4.771517353521387e-06, "loss": 0.9316, "step": 8642 }, { "epoch": 0.16, "learning_rate": 4.771453546407135e-06, "loss": 0.9555, "step": 8643 }, { "epoch": 0.16, "learning_rate": 4.7713897308113445e-06, "loss": 1.1897, "step": 8644 }, { "epoch": 0.16, "learning_rate": 4.771325906734254e-06, "loss": 0.7895, "step": 8645 }, { "epoch": 0.16, "learning_rate": 4.771262074176104e-06, "loss": 0.9439, "step": 8646 }, { "epoch": 0.16, "learning_rate": 4.7711982331371295e-06, "loss": 0.9584, "step": 8647 }, { "epoch": 0.16, "learning_rate": 4.7711343836175716e-06, "loss": 0.7428, "step": 8648 }, { "epoch": 0.16, "learning_rate": 4.771070525617667e-06, "loss": 1.4127, "step": 8649 }, { "epoch": 0.16, "learning_rate": 4.771006659137655e-06, "loss": 0.8502, "step": 8650 }, { "epoch": 0.16, "learning_rate": 4.770942784177773e-06, "loss": 1.0892, "step": 8651 }, { "epoch": 0.16, "learning_rate": 4.770878900738261e-06, "loss": 0.8765, "step": 8652 }, { "epoch": 0.16, "learning_rate": 4.7708150088193565e-06, "loss": 0.9271, "step": 8653 }, { "epoch": 0.16, "learning_rate": 4.770751108421298e-06, "loss": 0.9406, "step": 8654 }, { "epoch": 0.16, "learning_rate": 4.770687199544325e-06, "loss": 0.9697, "step": 8655 }, { "epoch": 0.16, "learning_rate": 4.770623282188676e-06, "loss": 1.2554, "step": 8656 }, { "epoch": 0.16, "learning_rate": 4.770559356354588e-06, "loss": 0.8522, "step": 8657 }, { "epoch": 0.16, "learning_rate": 4.7704954220423025e-06, "loss": 1.0176, "step": 8658 }, { "epoch": 0.16, "learning_rate": 4.7704314792520555e-06, "loss": 0.8495, "step": 8659 }, { "epoch": 0.16, "learning_rate": 4.770367527984088e-06, "loss": 0.9259, "step": 8660 }, { "epoch": 0.16, "learning_rate": 4.770303568238636e-06, "loss": 0.8981, "step": 8661 }, { "epoch": 0.16, "learning_rate": 4.770239600015942e-06, "loss": 1.134, "step": 8662 }, { "epoch": 0.16, "learning_rate": 4.770175623316242e-06, "loss": 1.0711, "step": 8663 }, { "epoch": 0.16, "learning_rate": 4.770111638139776e-06, "loss": 0.9543, "step": 8664 }, { "epoch": 0.16, "learning_rate": 4.770047644486784e-06, "loss": 0.9588, "step": 8665 }, { "epoch": 0.16, "learning_rate": 4.769983642357502e-06, "loss": 0.8309, "step": 8666 }, { "epoch": 0.16, "learning_rate": 4.769919631752172e-06, "loss": 1.0045, "step": 8667 }, { "epoch": 0.16, "learning_rate": 4.76985561267103e-06, "loss": 0.9371, "step": 8668 }, { "epoch": 0.16, "learning_rate": 4.769791585114317e-06, "loss": 0.8879, "step": 8669 }, { "epoch": 0.16, "learning_rate": 4.769727549082273e-06, "loss": 1.0661, "step": 8670 }, { "epoch": 0.16, "learning_rate": 4.7696635045751345e-06, "loss": 0.9036, "step": 8671 }, { "epoch": 0.16, "learning_rate": 4.769599451593144e-06, "loss": 0.832, "step": 8672 }, { "epoch": 0.16, "learning_rate": 4.769535390136537e-06, "loss": 0.7911, "step": 8673 }, { "epoch": 0.16, "learning_rate": 4.769471320205555e-06, "loss": 1.084, "step": 8674 }, { "epoch": 0.16, "learning_rate": 4.769407241800438e-06, "loss": 1.1709, "step": 8675 }, { "epoch": 0.16, "learning_rate": 4.769343154921422e-06, "loss": 1.1182, "step": 8676 }, { "epoch": 0.16, "learning_rate": 4.7692790595687485e-06, "loss": 0.7982, "step": 8677 }, { "epoch": 0.16, "learning_rate": 4.7692149557426575e-06, "loss": 0.9504, "step": 8678 }, { "epoch": 0.16, "learning_rate": 4.769150843443387e-06, "loss": 0.8698, "step": 8679 }, { "epoch": 0.16, "learning_rate": 4.769086722671177e-06, "loss": 1.087, "step": 8680 }, { "epoch": 0.16, "learning_rate": 4.7690225934262665e-06, "loss": 1.14, "step": 8681 }, { "epoch": 0.16, "learning_rate": 4.768958455708896e-06, "loss": 0.8028, "step": 8682 }, { "epoch": 0.16, "learning_rate": 4.768894309519302e-06, "loss": 0.8332, "step": 8683 }, { "epoch": 0.16, "learning_rate": 4.768830154857728e-06, "loss": 0.8293, "step": 8684 }, { "epoch": 0.16, "learning_rate": 4.768765991724411e-06, "loss": 0.9047, "step": 8685 }, { "epoch": 0.16, "learning_rate": 4.768701820119593e-06, "loss": 0.8093, "step": 8686 }, { "epoch": 0.16, "learning_rate": 4.76863764004351e-06, "loss": 1.1268, "step": 8687 }, { "epoch": 0.16, "learning_rate": 4.768573451496404e-06, "loss": 1.2136, "step": 8688 }, { "epoch": 0.16, "learning_rate": 4.768509254478515e-06, "loss": 1.1788, "step": 8689 }, { "epoch": 0.16, "learning_rate": 4.7684450489900814e-06, "loss": 0.9153, "step": 8690 }, { "epoch": 0.16, "learning_rate": 4.7683808350313444e-06, "loss": 0.9579, "step": 8691 }, { "epoch": 0.16, "learning_rate": 4.768316612602541e-06, "loss": 0.7696, "step": 8692 }, { "epoch": 0.16, "learning_rate": 4.768252381703915e-06, "loss": 0.9891, "step": 8693 }, { "epoch": 0.16, "learning_rate": 4.768188142335704e-06, "loss": 1.0648, "step": 8694 }, { "epoch": 0.16, "learning_rate": 4.768123894498147e-06, "loss": 0.9583, "step": 8695 }, { "epoch": 0.16, "learning_rate": 4.768059638191484e-06, "loss": 1.2024, "step": 8696 }, { "epoch": 0.16, "learning_rate": 4.7679953734159575e-06, "loss": 0.8011, "step": 8697 }, { "epoch": 0.16, "learning_rate": 4.7679311001718065e-06, "loss": 0.8119, "step": 8698 }, { "epoch": 0.16, "learning_rate": 4.767866818459269e-06, "loss": 1.0418, "step": 8699 }, { "epoch": 0.16, "learning_rate": 4.767802528278587e-06, "loss": 1.0497, "step": 8700 }, { "epoch": 0.16, "learning_rate": 4.767738229629999e-06, "loss": 0.9278, "step": 8701 }, { "epoch": 0.16, "learning_rate": 4.767673922513746e-06, "loss": 0.9982, "step": 8702 }, { "epoch": 0.16, "learning_rate": 4.7676096069300695e-06, "loss": 1.1145, "step": 8703 }, { "epoch": 0.16, "learning_rate": 4.767545282879207e-06, "loss": 1.1888, "step": 8704 }, { "epoch": 0.16, "learning_rate": 4.7674809503614e-06, "loss": 0.8965, "step": 8705 }, { "epoch": 0.16, "learning_rate": 4.767416609376889e-06, "loss": 0.9931, "step": 8706 }, { "epoch": 0.16, "learning_rate": 4.767352259925914e-06, "loss": 1.0443, "step": 8707 }, { "epoch": 0.16, "learning_rate": 4.767287902008715e-06, "loss": 0.9219, "step": 8708 }, { "epoch": 0.16, "learning_rate": 4.767223535625532e-06, "loss": 0.8698, "step": 8709 }, { "epoch": 0.16, "learning_rate": 4.767159160776606e-06, "loss": 1.0172, "step": 8710 }, { "epoch": 0.16, "learning_rate": 4.767094777462178e-06, "loss": 1.0831, "step": 8711 }, { "epoch": 0.16, "learning_rate": 4.767030385682487e-06, "loss": 1.1235, "step": 8712 }, { "epoch": 0.16, "learning_rate": 4.766965985437775e-06, "loss": 1.0004, "step": 8713 }, { "epoch": 0.16, "learning_rate": 4.76690157672828e-06, "loss": 0.8381, "step": 8714 }, { "epoch": 0.16, "learning_rate": 4.7668371595542455e-06, "loss": 1.0309, "step": 8715 }, { "epoch": 0.16, "learning_rate": 4.7667727339159085e-06, "loss": 1.0762, "step": 8716 }, { "epoch": 0.16, "learning_rate": 4.7667082998135135e-06, "loss": 0.8558, "step": 8717 }, { "epoch": 0.16, "learning_rate": 4.7666438572472984e-06, "loss": 0.9921, "step": 8718 }, { "epoch": 0.16, "learning_rate": 4.766579406217506e-06, "loss": 1.0413, "step": 8719 }, { "epoch": 0.16, "learning_rate": 4.766514946724373e-06, "loss": 0.9261, "step": 8720 }, { "epoch": 0.16, "learning_rate": 4.766450478768144e-06, "loss": 1.074, "step": 8721 }, { "epoch": 0.16, "learning_rate": 4.7663860023490585e-06, "loss": 0.9953, "step": 8722 }, { "epoch": 0.16, "learning_rate": 4.766321517467357e-06, "loss": 0.8923, "step": 8723 }, { "epoch": 0.16, "learning_rate": 4.766257024123281e-06, "loss": 0.9958, "step": 8724 }, { "epoch": 0.16, "learning_rate": 4.76619252231707e-06, "loss": 1.0536, "step": 8725 }, { "epoch": 0.16, "learning_rate": 4.7661280120489665e-06, "loss": 1.0483, "step": 8726 }, { "epoch": 0.16, "learning_rate": 4.76606349331921e-06, "loss": 0.9833, "step": 8727 }, { "epoch": 0.16, "learning_rate": 4.765998966128041e-06, "loss": 1.1099, "step": 8728 }, { "epoch": 0.16, "learning_rate": 4.765934430475702e-06, "loss": 0.9583, "step": 8729 }, { "epoch": 0.16, "learning_rate": 4.765869886362434e-06, "loss": 1.0093, "step": 8730 }, { "epoch": 0.16, "learning_rate": 4.765805333788477e-06, "loss": 1.1877, "step": 8731 }, { "epoch": 0.16, "learning_rate": 4.765740772754072e-06, "loss": 1.2159, "step": 8732 }, { "epoch": 0.16, "learning_rate": 4.765676203259461e-06, "loss": 0.8587, "step": 8733 }, { "epoch": 0.16, "learning_rate": 4.765611625304884e-06, "loss": 0.8137, "step": 8734 }, { "epoch": 0.16, "learning_rate": 4.765547038890582e-06, "loss": 0.9523, "step": 8735 }, { "epoch": 0.16, "learning_rate": 4.765482444016798e-06, "loss": 0.9264, "step": 8736 }, { "epoch": 0.16, "learning_rate": 4.765417840683771e-06, "loss": 0.9319, "step": 8737 }, { "epoch": 0.16, "learning_rate": 4.765353228891745e-06, "loss": 1.0505, "step": 8738 }, { "epoch": 0.16, "learning_rate": 4.7652886086409576e-06, "loss": 0.9519, "step": 8739 }, { "epoch": 0.16, "learning_rate": 4.765223979931654e-06, "loss": 0.8732, "step": 8740 }, { "epoch": 0.16, "learning_rate": 4.765159342764071e-06, "loss": 0.9194, "step": 8741 }, { "epoch": 0.16, "learning_rate": 4.7650946971384535e-06, "loss": 0.9563, "step": 8742 }, { "epoch": 0.16, "learning_rate": 4.765030043055042e-06, "loss": 0.9467, "step": 8743 }, { "epoch": 0.16, "learning_rate": 4.764965380514078e-06, "loss": 1.0745, "step": 8744 }, { "epoch": 0.16, "learning_rate": 4.764900709515803e-06, "loss": 0.7557, "step": 8745 }, { "epoch": 0.17, "learning_rate": 4.764836030060458e-06, "loss": 0.8885, "step": 8746 }, { "epoch": 0.17, "learning_rate": 4.764771342148284e-06, "loss": 0.9946, "step": 8747 }, { "epoch": 0.17, "learning_rate": 4.764706645779524e-06, "loss": 0.8093, "step": 8748 }, { "epoch": 0.17, "learning_rate": 4.764641940954418e-06, "loss": 0.8521, "step": 8749 }, { "epoch": 0.17, "learning_rate": 4.76457722767321e-06, "loss": 1.0103, "step": 8750 }, { "epoch": 0.17, "learning_rate": 4.764512505936139e-06, "loss": 1.0759, "step": 8751 }, { "epoch": 0.17, "learning_rate": 4.7644477757434474e-06, "loss": 0.8472, "step": 8752 }, { "epoch": 0.17, "learning_rate": 4.764383037095377e-06, "loss": 1.1129, "step": 8753 }, { "epoch": 0.17, "learning_rate": 4.76431828999217e-06, "loss": 0.8635, "step": 8754 }, { "epoch": 0.17, "learning_rate": 4.764253534434069e-06, "loss": 0.9822, "step": 8755 }, { "epoch": 0.17, "learning_rate": 4.764188770421314e-06, "loss": 1.052, "step": 8756 }, { "epoch": 0.17, "learning_rate": 4.7641239979541474e-06, "loss": 1.1534, "step": 8757 }, { "epoch": 0.17, "learning_rate": 4.764059217032811e-06, "loss": 0.8391, "step": 8758 }, { "epoch": 0.17, "learning_rate": 4.763994427657548e-06, "loss": 0.6861, "step": 8759 }, { "epoch": 0.17, "learning_rate": 4.763929629828597e-06, "loss": 0.9731, "step": 8760 }, { "epoch": 0.17, "learning_rate": 4.763864823546205e-06, "loss": 0.8282, "step": 8761 }, { "epoch": 0.17, "learning_rate": 4.76380000881061e-06, "loss": 1.1591, "step": 8762 }, { "epoch": 0.17, "learning_rate": 4.763735185622054e-06, "loss": 1.0333, "step": 8763 }, { "epoch": 0.17, "learning_rate": 4.763670353980781e-06, "loss": 0.9108, "step": 8764 }, { "epoch": 0.17, "learning_rate": 4.763605513887033e-06, "loss": 0.8909, "step": 8765 }, { "epoch": 0.17, "learning_rate": 4.763540665341051e-06, "loss": 1.0869, "step": 8766 }, { "epoch": 0.17, "learning_rate": 4.763475808343078e-06, "loss": 0.8891, "step": 8767 }, { "epoch": 0.17, "learning_rate": 4.763410942893355e-06, "loss": 1.1028, "step": 8768 }, { "epoch": 0.17, "learning_rate": 4.763346068992125e-06, "loss": 0.8952, "step": 8769 }, { "epoch": 0.17, "learning_rate": 4.76328118663963e-06, "loss": 0.8301, "step": 8770 }, { "epoch": 0.17, "learning_rate": 4.763216295836113e-06, "loss": 0.8744, "step": 8771 }, { "epoch": 0.17, "learning_rate": 4.763151396581816e-06, "loss": 0.8922, "step": 8772 }, { "epoch": 0.17, "learning_rate": 4.76308648887698e-06, "loss": 0.9526, "step": 8773 }, { "epoch": 0.17, "learning_rate": 4.763021572721849e-06, "loss": 1.0896, "step": 8774 }, { "epoch": 0.17, "learning_rate": 4.762956648116665e-06, "loss": 1.0847, "step": 8775 }, { "epoch": 0.17, "learning_rate": 4.76289171506167e-06, "loss": 0.8772, "step": 8776 }, { "epoch": 0.17, "learning_rate": 4.762826773557107e-06, "loss": 1.1864, "step": 8777 }, { "epoch": 0.17, "learning_rate": 4.762761823603218e-06, "loss": 1.0213, "step": 8778 }, { "epoch": 0.17, "learning_rate": 4.7626968652002455e-06, "loss": 0.8904, "step": 8779 }, { "epoch": 0.17, "learning_rate": 4.762631898348433e-06, "loss": 0.868, "step": 8780 }, { "epoch": 0.17, "learning_rate": 4.762566923048022e-06, "loss": 1.4678, "step": 8781 }, { "epoch": 0.17, "learning_rate": 4.762501939299255e-06, "loss": 0.8554, "step": 8782 }, { "epoch": 0.17, "learning_rate": 4.762436947102376e-06, "loss": 0.8838, "step": 8783 }, { "epoch": 0.17, "learning_rate": 4.762371946457626e-06, "loss": 0.9662, "step": 8784 }, { "epoch": 0.17, "learning_rate": 4.7623069373652484e-06, "loss": 0.8464, "step": 8785 }, { "epoch": 0.17, "learning_rate": 4.762241919825487e-06, "loss": 1.0391, "step": 8786 }, { "epoch": 0.17, "learning_rate": 4.762176893838583e-06, "loss": 1.0569, "step": 8787 }, { "epoch": 0.17, "learning_rate": 4.76211185940478e-06, "loss": 0.9201, "step": 8788 }, { "epoch": 0.17, "learning_rate": 4.762046816524321e-06, "loss": 0.9799, "step": 8789 }, { "epoch": 0.17, "learning_rate": 4.761981765197448e-06, "loss": 0.7537, "step": 8790 }, { "epoch": 0.17, "learning_rate": 4.761916705424405e-06, "loss": 0.8945, "step": 8791 }, { "epoch": 0.17, "learning_rate": 4.761851637205433e-06, "loss": 0.9821, "step": 8792 }, { "epoch": 0.17, "learning_rate": 4.7617865605407774e-06, "loss": 1.1218, "step": 8793 }, { "epoch": 0.17, "learning_rate": 4.76172147543068e-06, "loss": 0.9894, "step": 8794 }, { "epoch": 0.17, "learning_rate": 4.7616563818753846e-06, "loss": 0.9118, "step": 8795 }, { "epoch": 0.17, "learning_rate": 4.761591279875133e-06, "loss": 0.7983, "step": 8796 }, { "epoch": 0.17, "learning_rate": 4.7615261694301695e-06, "loss": 0.7167, "step": 8797 }, { "epoch": 0.17, "learning_rate": 4.761461050540736e-06, "loss": 1.0908, "step": 8798 }, { "epoch": 0.17, "learning_rate": 4.761395923207076e-06, "loss": 1.1185, "step": 8799 }, { "epoch": 0.17, "learning_rate": 4.7613307874294335e-06, "loss": 1.0748, "step": 8800 }, { "epoch": 0.17, "learning_rate": 4.761265643208051e-06, "loss": 0.7935, "step": 8801 }, { "epoch": 0.17, "learning_rate": 4.761200490543172e-06, "loss": 0.8842, "step": 8802 }, { "epoch": 0.17, "learning_rate": 4.761135329435039e-06, "loss": 0.8167, "step": 8803 }, { "epoch": 0.17, "learning_rate": 4.761070159883897e-06, "loss": 0.7499, "step": 8804 }, { "epoch": 0.17, "learning_rate": 4.7610049818899885e-06, "loss": 1.0308, "step": 8805 }, { "epoch": 0.17, "learning_rate": 4.760939795453556e-06, "loss": 1.1262, "step": 8806 }, { "epoch": 0.17, "learning_rate": 4.760874600574844e-06, "loss": 1.1677, "step": 8807 }, { "epoch": 0.17, "learning_rate": 4.760809397254095e-06, "loss": 0.8945, "step": 8808 }, { "epoch": 0.17, "learning_rate": 4.760744185491554e-06, "loss": 0.7776, "step": 8809 }, { "epoch": 0.17, "learning_rate": 4.7606789652874625e-06, "loss": 0.8691, "step": 8810 }, { "epoch": 0.17, "learning_rate": 4.760613736642066e-06, "loss": 0.9446, "step": 8811 }, { "epoch": 0.17, "learning_rate": 4.7605484995556064e-06, "loss": 1.0132, "step": 8812 }, { "epoch": 0.17, "learning_rate": 4.760483254028327e-06, "loss": 0.9107, "step": 8813 }, { "epoch": 0.17, "learning_rate": 4.760418000060474e-06, "loss": 0.7519, "step": 8814 }, { "epoch": 0.17, "learning_rate": 4.760352737652289e-06, "loss": 0.9874, "step": 8815 }, { "epoch": 0.17, "learning_rate": 4.760287466804016e-06, "loss": 0.9158, "step": 8816 }, { "epoch": 0.17, "learning_rate": 4.7602221875159005e-06, "loss": 0.7541, "step": 8817 }, { "epoch": 0.17, "learning_rate": 4.760156899788183e-06, "loss": 1.0005, "step": 8818 }, { "epoch": 0.17, "learning_rate": 4.7600916036211095e-06, "loss": 1.0081, "step": 8819 }, { "epoch": 0.17, "learning_rate": 4.760026299014923e-06, "loss": 1.0175, "step": 8820 }, { "epoch": 0.17, "learning_rate": 4.7599609859698675e-06, "loss": 0.9792, "step": 8821 }, { "epoch": 0.17, "learning_rate": 4.759895664486187e-06, "loss": 0.972, "step": 8822 }, { "epoch": 0.17, "learning_rate": 4.759830334564126e-06, "loss": 0.9479, "step": 8823 }, { "epoch": 0.17, "learning_rate": 4.759764996203927e-06, "loss": 1.2402, "step": 8824 }, { "epoch": 0.17, "learning_rate": 4.759699649405836e-06, "loss": 1.2033, "step": 8825 }, { "epoch": 0.17, "learning_rate": 4.759634294170094e-06, "loss": 1.0731, "step": 8826 }, { "epoch": 0.17, "learning_rate": 4.759568930496948e-06, "loss": 1.0616, "step": 8827 }, { "epoch": 0.17, "learning_rate": 4.75950355838664e-06, "loss": 0.9329, "step": 8828 }, { "epoch": 0.17, "learning_rate": 4.759438177839416e-06, "loss": 1.1304, "step": 8829 }, { "epoch": 0.17, "learning_rate": 4.759372788855518e-06, "loss": 0.9993, "step": 8830 }, { "epoch": 0.17, "learning_rate": 4.7593073914351925e-06, "loss": 1.0294, "step": 8831 }, { "epoch": 0.17, "learning_rate": 4.759241985578682e-06, "loss": 1.0206, "step": 8832 }, { "epoch": 0.17, "learning_rate": 4.759176571286232e-06, "loss": 0.7467, "step": 8833 }, { "epoch": 0.17, "learning_rate": 4.759111148558085e-06, "loss": 1.0404, "step": 8834 }, { "epoch": 0.17, "learning_rate": 4.759045717394486e-06, "loss": 0.7426, "step": 8835 }, { "epoch": 0.17, "learning_rate": 4.75898027779568e-06, "loss": 0.7576, "step": 8836 }, { "epoch": 0.17, "learning_rate": 4.758914829761911e-06, "loss": 1.1948, "step": 8837 }, { "epoch": 0.17, "learning_rate": 4.758849373293423e-06, "loss": 1.1664, "step": 8838 }, { "epoch": 0.17, "learning_rate": 4.758783908390461e-06, "loss": 0.874, "step": 8839 }, { "epoch": 0.17, "learning_rate": 4.758718435053269e-06, "loss": 1.1005, "step": 8840 }, { "epoch": 0.17, "learning_rate": 4.758652953282091e-06, "loss": 1.1061, "step": 8841 }, { "epoch": 0.17, "learning_rate": 4.758587463077174e-06, "loss": 0.9664, "step": 8842 }, { "epoch": 0.17, "learning_rate": 4.758521964438758e-06, "loss": 1.2087, "step": 8843 }, { "epoch": 0.17, "learning_rate": 4.758456457367092e-06, "loss": 1.0544, "step": 8844 }, { "epoch": 0.17, "learning_rate": 4.7583909418624186e-06, "loss": 0.9365, "step": 8845 }, { "epoch": 0.17, "learning_rate": 4.758325417924983e-06, "loss": 1.0118, "step": 8846 }, { "epoch": 0.17, "learning_rate": 4.758259885555029e-06, "loss": 1.0417, "step": 8847 }, { "epoch": 0.17, "learning_rate": 4.758194344752801e-06, "loss": 0.7894, "step": 8848 }, { "epoch": 0.17, "learning_rate": 4.758128795518546e-06, "loss": 1.047, "step": 8849 }, { "epoch": 0.17, "learning_rate": 4.758063237852506e-06, "loss": 1.0519, "step": 8850 }, { "epoch": 0.17, "learning_rate": 4.757997671754928e-06, "loss": 1.0215, "step": 8851 }, { "epoch": 0.17, "learning_rate": 4.757932097226056e-06, "loss": 0.8452, "step": 8852 }, { "epoch": 0.17, "learning_rate": 4.7578665142661345e-06, "loss": 1.219, "step": 8853 }, { "epoch": 0.17, "learning_rate": 4.757800922875409e-06, "loss": 0.7312, "step": 8854 }, { "epoch": 0.17, "learning_rate": 4.757735323054123e-06, "loss": 0.8832, "step": 8855 }, { "epoch": 0.17, "learning_rate": 4.757669714802524e-06, "loss": 1.0656, "step": 8856 }, { "epoch": 0.17, "learning_rate": 4.757604098120855e-06, "loss": 1.1788, "step": 8857 }, { "epoch": 0.17, "learning_rate": 4.757538473009361e-06, "loss": 0.7744, "step": 8858 }, { "epoch": 0.17, "learning_rate": 4.757472839468288e-06, "loss": 1.1531, "step": 8859 }, { "epoch": 0.17, "learning_rate": 4.757407197497881e-06, "loss": 0.9047, "step": 8860 }, { "epoch": 0.17, "learning_rate": 4.757341547098384e-06, "loss": 0.9185, "step": 8861 }, { "epoch": 0.17, "learning_rate": 4.757275888270043e-06, "loss": 1.0011, "step": 8862 }, { "epoch": 0.17, "learning_rate": 4.757210221013103e-06, "loss": 0.9857, "step": 8863 }, { "epoch": 0.17, "learning_rate": 4.75714454532781e-06, "loss": 0.8435, "step": 8864 }, { "epoch": 0.17, "learning_rate": 4.757078861214408e-06, "loss": 1.1162, "step": 8865 }, { "epoch": 0.17, "learning_rate": 4.757013168673143e-06, "loss": 0.967, "step": 8866 }, { "epoch": 0.17, "learning_rate": 4.756947467704258e-06, "loss": 0.8763, "step": 8867 }, { "epoch": 0.17, "learning_rate": 4.756881758308003e-06, "loss": 1.0439, "step": 8868 }, { "epoch": 0.17, "learning_rate": 4.756816040484619e-06, "loss": 1.0483, "step": 8869 }, { "epoch": 0.17, "learning_rate": 4.7567503142343544e-06, "loss": 0.8849, "step": 8870 }, { "epoch": 0.17, "learning_rate": 4.7566845795574525e-06, "loss": 0.9659, "step": 8871 }, { "epoch": 0.17, "learning_rate": 4.75661883645416e-06, "loss": 0.9457, "step": 8872 }, { "epoch": 0.17, "learning_rate": 4.756553084924722e-06, "loss": 0.9348, "step": 8873 }, { "epoch": 0.17, "learning_rate": 4.756487324969383e-06, "loss": 0.9399, "step": 8874 }, { "epoch": 0.17, "learning_rate": 4.756421556588391e-06, "loss": 0.9835, "step": 8875 }, { "epoch": 0.17, "learning_rate": 4.756355779781989e-06, "loss": 1.1688, "step": 8876 }, { "epoch": 0.17, "learning_rate": 4.7562899945504245e-06, "loss": 1.0215, "step": 8877 }, { "epoch": 0.17, "learning_rate": 4.756224200893942e-06, "loss": 1.009, "step": 8878 }, { "epoch": 0.17, "learning_rate": 4.756158398812787e-06, "loss": 0.9656, "step": 8879 }, { "epoch": 0.17, "learning_rate": 4.756092588307206e-06, "loss": 1.0218, "step": 8880 }, { "epoch": 0.17, "learning_rate": 4.7560267693774445e-06, "loss": 1.3207, "step": 8881 }, { "epoch": 0.17, "learning_rate": 4.755960942023748e-06, "loss": 0.8881, "step": 8882 }, { "epoch": 0.17, "learning_rate": 4.755895106246363e-06, "loss": 0.9922, "step": 8883 }, { "epoch": 0.17, "learning_rate": 4.755829262045535e-06, "loss": 0.913, "step": 8884 }, { "epoch": 0.17, "learning_rate": 4.755763409421509e-06, "loss": 0.9375, "step": 8885 }, { "epoch": 0.17, "learning_rate": 4.755697548374532e-06, "loss": 0.8944, "step": 8886 }, { "epoch": 0.17, "learning_rate": 4.7556316789048495e-06, "loss": 1.128, "step": 8887 }, { "epoch": 0.17, "learning_rate": 4.755565801012707e-06, "loss": 1.1501, "step": 8888 }, { "epoch": 0.17, "learning_rate": 4.7554999146983515e-06, "loss": 0.959, "step": 8889 }, { "epoch": 0.17, "learning_rate": 4.755434019962029e-06, "loss": 0.9911, "step": 8890 }, { "epoch": 0.17, "learning_rate": 4.7553681168039835e-06, "loss": 0.9271, "step": 8891 }, { "epoch": 0.17, "learning_rate": 4.755302205224463e-06, "loss": 0.8066, "step": 8892 }, { "epoch": 0.17, "learning_rate": 4.755236285223714e-06, "loss": 1.2183, "step": 8893 }, { "epoch": 0.17, "learning_rate": 4.755170356801982e-06, "loss": 1.2594, "step": 8894 }, { "epoch": 0.17, "learning_rate": 4.7551044199595135e-06, "loss": 1.0733, "step": 8895 }, { "epoch": 0.17, "learning_rate": 4.755038474696553e-06, "loss": 0.9506, "step": 8896 }, { "epoch": 0.17, "learning_rate": 4.754972521013348e-06, "loss": 0.9365, "step": 8897 }, { "epoch": 0.17, "learning_rate": 4.754906558910145e-06, "loss": 0.8311, "step": 8898 }, { "epoch": 0.17, "learning_rate": 4.75484058838719e-06, "loss": 0.7623, "step": 8899 }, { "epoch": 0.17, "learning_rate": 4.75477460944473e-06, "loss": 0.8436, "step": 8900 }, { "epoch": 0.17, "learning_rate": 4.75470862208301e-06, "loss": 1.1026, "step": 8901 }, { "epoch": 0.17, "learning_rate": 4.754642626302277e-06, "loss": 0.787, "step": 8902 }, { "epoch": 0.17, "learning_rate": 4.754576622102778e-06, "loss": 1.0393, "step": 8903 }, { "epoch": 0.17, "learning_rate": 4.7545106094847585e-06, "loss": 0.8456, "step": 8904 }, { "epoch": 0.17, "learning_rate": 4.754444588448466e-06, "loss": 0.9684, "step": 8905 }, { "epoch": 0.17, "learning_rate": 4.754378558994147e-06, "loss": 1.1213, "step": 8906 }, { "epoch": 0.17, "learning_rate": 4.754312521122047e-06, "loss": 1.1126, "step": 8907 }, { "epoch": 0.17, "learning_rate": 4.754246474832412e-06, "loss": 0.8116, "step": 8908 }, { "epoch": 0.17, "learning_rate": 4.754180420125491e-06, "loss": 0.9551, "step": 8909 }, { "epoch": 0.17, "learning_rate": 4.75411435700153e-06, "loss": 1.0307, "step": 8910 }, { "epoch": 0.17, "learning_rate": 4.754048285460775e-06, "loss": 0.8999, "step": 8911 }, { "epoch": 0.17, "learning_rate": 4.7539822055034724e-06, "loss": 0.9608, "step": 8912 }, { "epoch": 0.17, "learning_rate": 4.753916117129869e-06, "loss": 0.8923, "step": 8913 }, { "epoch": 0.17, "learning_rate": 4.753850020340212e-06, "loss": 0.9745, "step": 8914 }, { "epoch": 0.17, "learning_rate": 4.753783915134749e-06, "loss": 0.7812, "step": 8915 }, { "epoch": 0.17, "learning_rate": 4.753717801513725e-06, "loss": 0.8967, "step": 8916 }, { "epoch": 0.17, "learning_rate": 4.753651679477388e-06, "loss": 0.813, "step": 8917 }, { "epoch": 0.17, "learning_rate": 4.753585549025985e-06, "loss": 1.0459, "step": 8918 }, { "epoch": 0.17, "learning_rate": 4.753519410159762e-06, "loss": 1.1169, "step": 8919 }, { "epoch": 0.17, "learning_rate": 4.753453262878967e-06, "loss": 0.8693, "step": 8920 }, { "epoch": 0.17, "learning_rate": 4.753387107183847e-06, "loss": 0.8441, "step": 8921 }, { "epoch": 0.17, "learning_rate": 4.753320943074648e-06, "loss": 1.0392, "step": 8922 }, { "epoch": 0.17, "learning_rate": 4.753254770551618e-06, "loss": 0.8582, "step": 8923 }, { "epoch": 0.17, "learning_rate": 4.753188589615004e-06, "loss": 1.0966, "step": 8924 }, { "epoch": 0.17, "learning_rate": 4.753122400265053e-06, "loss": 1.2232, "step": 8925 }, { "epoch": 0.17, "learning_rate": 4.7530562025020115e-06, "loss": 1.1716, "step": 8926 }, { "epoch": 0.17, "learning_rate": 4.752989996326128e-06, "loss": 0.7738, "step": 8927 }, { "epoch": 0.17, "learning_rate": 4.752923781737648e-06, "loss": 0.9519, "step": 8928 }, { "epoch": 0.17, "learning_rate": 4.75285755873682e-06, "loss": 0.7136, "step": 8929 }, { "epoch": 0.17, "learning_rate": 4.752791327323891e-06, "loss": 0.9854, "step": 8930 }, { "epoch": 0.17, "learning_rate": 4.7527250874991085e-06, "loss": 1.1209, "step": 8931 }, { "epoch": 0.17, "learning_rate": 4.75265883926272e-06, "loss": 1.0915, "step": 8932 }, { "epoch": 0.17, "learning_rate": 4.752592582614971e-06, "loss": 0.7634, "step": 8933 }, { "epoch": 0.17, "learning_rate": 4.752526317556111e-06, "loss": 1.1162, "step": 8934 }, { "epoch": 0.17, "learning_rate": 4.752460044086387e-06, "loss": 0.9285, "step": 8935 }, { "epoch": 0.17, "learning_rate": 4.752393762206047e-06, "loss": 1.1623, "step": 8936 }, { "epoch": 0.17, "learning_rate": 4.7523274719153364e-06, "loss": 1.1234, "step": 8937 }, { "epoch": 0.17, "learning_rate": 4.752261173214505e-06, "loss": 0.9574, "step": 8938 }, { "epoch": 0.17, "learning_rate": 4.752194866103799e-06, "loss": 0.8228, "step": 8939 }, { "epoch": 0.17, "learning_rate": 4.752128550583467e-06, "loss": 1.1042, "step": 8940 }, { "epoch": 0.17, "learning_rate": 4.752062226653755e-06, "loss": 0.936, "step": 8941 }, { "epoch": 0.17, "learning_rate": 4.751995894314913e-06, "loss": 0.8906, "step": 8942 }, { "epoch": 0.17, "learning_rate": 4.751929553567186e-06, "loss": 1.0395, "step": 8943 }, { "epoch": 0.17, "learning_rate": 4.751863204410824e-06, "loss": 1.1364, "step": 8944 }, { "epoch": 0.17, "learning_rate": 4.751796846846074e-06, "loss": 1.1178, "step": 8945 }, { "epoch": 0.17, "learning_rate": 4.751730480873183e-06, "loss": 0.9785, "step": 8946 }, { "epoch": 0.17, "learning_rate": 4.7516641064923995e-06, "loss": 0.9306, "step": 8947 }, { "epoch": 0.17, "learning_rate": 4.7515977237039715e-06, "loss": 0.8189, "step": 8948 }, { "epoch": 0.17, "learning_rate": 4.751531332508146e-06, "loss": 1.1115, "step": 8949 }, { "epoch": 0.17, "learning_rate": 4.751464932905172e-06, "loss": 1.2893, "step": 8950 }, { "epoch": 0.17, "learning_rate": 4.751398524895298e-06, "loss": 0.8339, "step": 8951 }, { "epoch": 0.17, "learning_rate": 4.751332108478769e-06, "loss": 0.8123, "step": 8952 }, { "epoch": 0.17, "learning_rate": 4.751265683655836e-06, "loss": 0.7963, "step": 8953 }, { "epoch": 0.17, "learning_rate": 4.751199250426746e-06, "loss": 0.774, "step": 8954 }, { "epoch": 0.17, "learning_rate": 4.751132808791747e-06, "loss": 0.726, "step": 8955 }, { "epoch": 0.17, "learning_rate": 4.751066358751087e-06, "loss": 1.1988, "step": 8956 }, { "epoch": 0.17, "learning_rate": 4.750999900305015e-06, "loss": 0.9332, "step": 8957 }, { "epoch": 0.17, "learning_rate": 4.750933433453777e-06, "loss": 0.9541, "step": 8958 }, { "epoch": 0.17, "learning_rate": 4.750866958197623e-06, "loss": 0.7599, "step": 8959 }, { "epoch": 0.17, "learning_rate": 4.7508004745368005e-06, "loss": 1.0025, "step": 8960 }, { "epoch": 0.17, "learning_rate": 4.750733982471559e-06, "loss": 1.098, "step": 8961 }, { "epoch": 0.17, "learning_rate": 4.750667482002145e-06, "loss": 1.1019, "step": 8962 }, { "epoch": 0.17, "learning_rate": 4.750600973128808e-06, "loss": 0.9056, "step": 8963 }, { "epoch": 0.17, "learning_rate": 4.7505344558517965e-06, "loss": 0.9629, "step": 8964 }, { "epoch": 0.17, "learning_rate": 4.750467930171357e-06, "loss": 0.9495, "step": 8965 }, { "epoch": 0.17, "learning_rate": 4.750401396087741e-06, "loss": 0.9313, "step": 8966 }, { "epoch": 0.17, "learning_rate": 4.750334853601194e-06, "loss": 0.8791, "step": 8967 }, { "epoch": 0.17, "learning_rate": 4.7502683027119656e-06, "loss": 1.0734, "step": 8968 }, { "epoch": 0.17, "learning_rate": 4.750201743420305e-06, "loss": 1.0147, "step": 8969 }, { "epoch": 0.17, "learning_rate": 4.750135175726459e-06, "loss": 1.0612, "step": 8970 }, { "epoch": 0.17, "learning_rate": 4.7500685996306785e-06, "loss": 0.9182, "step": 8971 }, { "epoch": 0.17, "learning_rate": 4.750002015133211e-06, "loss": 0.8805, "step": 8972 }, { "epoch": 0.17, "learning_rate": 4.749935422234304e-06, "loss": 0.8906, "step": 8973 }, { "epoch": 0.17, "learning_rate": 4.749868820934207e-06, "loss": 1.0518, "step": 8974 }, { "epoch": 0.17, "learning_rate": 4.749802211233169e-06, "loss": 1.0079, "step": 8975 }, { "epoch": 0.17, "learning_rate": 4.7497355931314395e-06, "loss": 1.238, "step": 8976 }, { "epoch": 0.17, "learning_rate": 4.749668966629265e-06, "loss": 0.8463, "step": 8977 }, { "epoch": 0.17, "learning_rate": 4.749602331726896e-06, "loss": 1.0537, "step": 8978 }, { "epoch": 0.17, "learning_rate": 4.749535688424581e-06, "loss": 0.8455, "step": 8979 }, { "epoch": 0.17, "learning_rate": 4.749469036722568e-06, "loss": 1.1531, "step": 8980 }, { "epoch": 0.17, "learning_rate": 4.749402376621108e-06, "loss": 1.1593, "step": 8981 }, { "epoch": 0.17, "learning_rate": 4.749335708120447e-06, "loss": 1.0013, "step": 8982 }, { "epoch": 0.17, "learning_rate": 4.749269031220836e-06, "loss": 1.1324, "step": 8983 }, { "epoch": 0.17, "learning_rate": 4.7492023459225245e-06, "loss": 0.9646, "step": 8984 }, { "epoch": 0.17, "learning_rate": 4.749135652225759e-06, "loss": 0.9124, "step": 8985 }, { "epoch": 0.17, "learning_rate": 4.7490689501307906e-06, "loss": 0.9045, "step": 8986 }, { "epoch": 0.17, "learning_rate": 4.749002239637867e-06, "loss": 1.0172, "step": 8987 }, { "epoch": 0.17, "learning_rate": 4.7489355207472386e-06, "loss": 0.9717, "step": 8988 }, { "epoch": 0.17, "learning_rate": 4.748868793459154e-06, "loss": 0.6642, "step": 8989 }, { "epoch": 0.17, "learning_rate": 4.748802057773862e-06, "loss": 0.9083, "step": 8990 }, { "epoch": 0.17, "learning_rate": 4.748735313691612e-06, "loss": 0.8316, "step": 8991 }, { "epoch": 0.17, "learning_rate": 4.748668561212654e-06, "loss": 1.0382, "step": 8992 }, { "epoch": 0.17, "learning_rate": 4.7486018003372355e-06, "loss": 1.0267, "step": 8993 }, { "epoch": 0.17, "learning_rate": 4.748535031065608e-06, "loss": 0.9194, "step": 8994 }, { "epoch": 0.17, "learning_rate": 4.748468253398018e-06, "loss": 0.9413, "step": 8995 }, { "epoch": 0.17, "learning_rate": 4.748401467334718e-06, "loss": 1.0024, "step": 8996 }, { "epoch": 0.17, "learning_rate": 4.748334672875955e-06, "loss": 0.9603, "step": 8997 }, { "epoch": 0.17, "learning_rate": 4.74826787002198e-06, "loss": 0.8673, "step": 8998 }, { "epoch": 0.17, "learning_rate": 4.748201058773041e-06, "loss": 0.8751, "step": 8999 }, { "epoch": 0.17, "learning_rate": 4.748134239129388e-06, "loss": 1.0319, "step": 9000 }, { "epoch": 0.17, "learning_rate": 4.748067411091271e-06, "loss": 0.9117, "step": 9001 }, { "epoch": 0.17, "learning_rate": 4.74800057465894e-06, "loss": 0.8843, "step": 9002 }, { "epoch": 0.17, "learning_rate": 4.7479337298326424e-06, "loss": 0.8873, "step": 9003 }, { "epoch": 0.17, "learning_rate": 4.74786687661263e-06, "loss": 0.7824, "step": 9004 }, { "epoch": 0.17, "learning_rate": 4.747800014999151e-06, "loss": 0.7899, "step": 9005 }, { "epoch": 0.17, "learning_rate": 4.747733144992457e-06, "loss": 1.0129, "step": 9006 }, { "epoch": 0.17, "learning_rate": 4.747666266592796e-06, "loss": 0.9512, "step": 9007 }, { "epoch": 0.17, "learning_rate": 4.747599379800417e-06, "loss": 0.8827, "step": 9008 }, { "epoch": 0.17, "learning_rate": 4.747532484615571e-06, "loss": 0.9869, "step": 9009 }, { "epoch": 0.17, "learning_rate": 4.747465581038508e-06, "loss": 0.9833, "step": 9010 }, { "epoch": 0.17, "learning_rate": 4.747398669069478e-06, "loss": 0.8152, "step": 9011 }, { "epoch": 0.17, "learning_rate": 4.747331748708729e-06, "loss": 1.0917, "step": 9012 }, { "epoch": 0.17, "learning_rate": 4.747264819956513e-06, "loss": 0.9754, "step": 9013 }, { "epoch": 0.17, "learning_rate": 4.7471978828130786e-06, "loss": 0.6891, "step": 9014 }, { "epoch": 0.17, "learning_rate": 4.747130937278677e-06, "loss": 0.8068, "step": 9015 }, { "epoch": 0.17, "learning_rate": 4.747063983353557e-06, "loss": 0.8279, "step": 9016 }, { "epoch": 0.17, "learning_rate": 4.746997021037969e-06, "loss": 1.0354, "step": 9017 }, { "epoch": 0.17, "learning_rate": 4.746930050332163e-06, "loss": 0.8257, "step": 9018 }, { "epoch": 0.17, "learning_rate": 4.746863071236388e-06, "loss": 1.1284, "step": 9019 }, { "epoch": 0.17, "learning_rate": 4.746796083750897e-06, "loss": 1.0652, "step": 9020 }, { "epoch": 0.17, "learning_rate": 4.746729087875937e-06, "loss": 0.891, "step": 9021 }, { "epoch": 0.17, "learning_rate": 4.74666208361176e-06, "loss": 0.9969, "step": 9022 }, { "epoch": 0.17, "learning_rate": 4.746595070958616e-06, "loss": 0.9543, "step": 9023 }, { "epoch": 0.17, "learning_rate": 4.7465280499167546e-06, "loss": 1.0574, "step": 9024 }, { "epoch": 0.17, "learning_rate": 4.7464610204864255e-06, "loss": 0.8466, "step": 9025 }, { "epoch": 0.17, "learning_rate": 4.746393982667881e-06, "loss": 0.7538, "step": 9026 }, { "epoch": 0.17, "learning_rate": 4.74632693646137e-06, "loss": 0.9776, "step": 9027 }, { "epoch": 0.17, "learning_rate": 4.746259881867143e-06, "loss": 0.847, "step": 9028 }, { "epoch": 0.17, "learning_rate": 4.74619281888545e-06, "loss": 0.8163, "step": 9029 }, { "epoch": 0.17, "learning_rate": 4.746125747516542e-06, "loss": 1.1782, "step": 9030 }, { "epoch": 0.17, "learning_rate": 4.74605866776067e-06, "loss": 1.1025, "step": 9031 }, { "epoch": 0.17, "learning_rate": 4.745991579618083e-06, "loss": 1.0022, "step": 9032 }, { "epoch": 0.17, "learning_rate": 4.745924483089033e-06, "loss": 0.9575, "step": 9033 }, { "epoch": 0.17, "learning_rate": 4.74585737817377e-06, "loss": 0.8549, "step": 9034 }, { "epoch": 0.17, "learning_rate": 4.745790264872544e-06, "loss": 0.8603, "step": 9035 }, { "epoch": 0.17, "learning_rate": 4.745723143185605e-06, "loss": 1.1578, "step": 9036 }, { "epoch": 0.17, "learning_rate": 4.745656013113206e-06, "loss": 1.0559, "step": 9037 }, { "epoch": 0.17, "learning_rate": 4.745588874655596e-06, "loss": 1.0822, "step": 9038 }, { "epoch": 0.17, "learning_rate": 4.745521727813026e-06, "loss": 0.7644, "step": 9039 }, { "epoch": 0.17, "learning_rate": 4.745454572585747e-06, "loss": 0.9768, "step": 9040 }, { "epoch": 0.17, "learning_rate": 4.745387408974008e-06, "loss": 0.8945, "step": 9041 }, { "epoch": 0.17, "learning_rate": 4.7453202369780624e-06, "loss": 0.9754, "step": 9042 }, { "epoch": 0.17, "learning_rate": 4.74525305659816e-06, "loss": 0.9547, "step": 9043 }, { "epoch": 0.17, "learning_rate": 4.7451858678345515e-06, "loss": 1.0642, "step": 9044 }, { "epoch": 0.17, "learning_rate": 4.745118670687487e-06, "loss": 0.7866, "step": 9045 }, { "epoch": 0.17, "learning_rate": 4.74505146515722e-06, "loss": 0.8828, "step": 9046 }, { "epoch": 0.17, "learning_rate": 4.744984251243998e-06, "loss": 0.8387, "step": 9047 }, { "epoch": 0.17, "learning_rate": 4.744917028948074e-06, "loss": 0.8787, "step": 9048 }, { "epoch": 0.17, "learning_rate": 4.7448497982697e-06, "loss": 0.8622, "step": 9049 }, { "epoch": 0.17, "learning_rate": 4.744782559209124e-06, "loss": 1.1179, "step": 9050 }, { "epoch": 0.17, "learning_rate": 4.744715311766599e-06, "loss": 0.9491, "step": 9051 }, { "epoch": 0.17, "learning_rate": 4.744648055942376e-06, "loss": 0.9485, "step": 9052 }, { "epoch": 0.17, "learning_rate": 4.744580791736706e-06, "loss": 0.864, "step": 9053 }, { "epoch": 0.17, "learning_rate": 4.744513519149841e-06, "loss": 0.8816, "step": 9054 }, { "epoch": 0.17, "learning_rate": 4.74444623818203e-06, "loss": 0.8063, "step": 9055 }, { "epoch": 0.17, "learning_rate": 4.7443789488335254e-06, "loss": 1.0552, "step": 9056 }, { "epoch": 0.17, "learning_rate": 4.744311651104579e-06, "loss": 1.0598, "step": 9057 }, { "epoch": 0.17, "learning_rate": 4.7442443449954435e-06, "loss": 0.9894, "step": 9058 }, { "epoch": 0.17, "learning_rate": 4.744177030506366e-06, "loss": 0.8922, "step": 9059 }, { "epoch": 0.17, "learning_rate": 4.744109707637602e-06, "loss": 0.9217, "step": 9060 }, { "epoch": 0.17, "learning_rate": 4.7440423763894e-06, "loss": 1.0107, "step": 9061 }, { "epoch": 0.17, "learning_rate": 4.743975036762013e-06, "loss": 1.3172, "step": 9062 }, { "epoch": 0.17, "learning_rate": 4.743907688755693e-06, "loss": 0.954, "step": 9063 }, { "epoch": 0.17, "learning_rate": 4.743840332370688e-06, "loss": 0.9918, "step": 9064 }, { "epoch": 0.17, "learning_rate": 4.743772967607254e-06, "loss": 1.0755, "step": 9065 }, { "epoch": 0.17, "learning_rate": 4.74370559446564e-06, "loss": 0.8867, "step": 9066 }, { "epoch": 0.17, "learning_rate": 4.7436382129460984e-06, "loss": 1.1789, "step": 9067 }, { "epoch": 0.17, "learning_rate": 4.74357082304888e-06, "loss": 1.0388, "step": 9068 }, { "epoch": 0.17, "learning_rate": 4.743503424774237e-06, "loss": 1.1181, "step": 9069 }, { "epoch": 0.17, "learning_rate": 4.743436018122422e-06, "loss": 0.9573, "step": 9070 }, { "epoch": 0.17, "learning_rate": 4.743368603093684e-06, "loss": 0.8352, "step": 9071 }, { "epoch": 0.17, "learning_rate": 4.743301179688278e-06, "loss": 0.9217, "step": 9072 }, { "epoch": 0.17, "learning_rate": 4.743233747906453e-06, "loss": 0.8043, "step": 9073 }, { "epoch": 0.17, "learning_rate": 4.7431663077484625e-06, "loss": 1.174, "step": 9074 }, { "epoch": 0.17, "learning_rate": 4.743098859214557e-06, "loss": 1.1319, "step": 9075 }, { "epoch": 0.17, "learning_rate": 4.743031402304991e-06, "loss": 1.0309, "step": 9076 }, { "epoch": 0.17, "learning_rate": 4.742963937020013e-06, "loss": 0.9553, "step": 9077 }, { "epoch": 0.17, "learning_rate": 4.742896463359876e-06, "loss": 0.9293, "step": 9078 }, { "epoch": 0.17, "learning_rate": 4.742828981324834e-06, "loss": 0.8466, "step": 9079 }, { "epoch": 0.17, "learning_rate": 4.7427614909151365e-06, "loss": 1.2784, "step": 9080 }, { "epoch": 0.17, "learning_rate": 4.742693992131036e-06, "loss": 1.0646, "step": 9081 }, { "epoch": 0.17, "learning_rate": 4.742626484972785e-06, "loss": 0.9653, "step": 9082 }, { "epoch": 0.17, "learning_rate": 4.742558969440636e-06, "loss": 0.9954, "step": 9083 }, { "epoch": 0.17, "learning_rate": 4.7424914455348404e-06, "loss": 0.8976, "step": 9084 }, { "epoch": 0.17, "learning_rate": 4.74242391325565e-06, "loss": 0.9855, "step": 9085 }, { "epoch": 0.17, "learning_rate": 4.742356372603318e-06, "loss": 0.9349, "step": 9086 }, { "epoch": 0.17, "learning_rate": 4.742288823578096e-06, "loss": 0.983, "step": 9087 }, { "epoch": 0.17, "learning_rate": 4.742221266180237e-06, "loss": 1.0279, "step": 9088 }, { "epoch": 0.17, "learning_rate": 4.742153700409991e-06, "loss": 0.838, "step": 9089 }, { "epoch": 0.17, "learning_rate": 4.742086126267613e-06, "loss": 0.8224, "step": 9090 }, { "epoch": 0.17, "learning_rate": 4.742018543753353e-06, "loss": 0.9871, "step": 9091 }, { "epoch": 0.17, "learning_rate": 4.7419509528674655e-06, "loss": 0.8443, "step": 9092 }, { "epoch": 0.17, "learning_rate": 4.741883353610201e-06, "loss": 0.9769, "step": 9093 }, { "epoch": 0.17, "learning_rate": 4.741815745981814e-06, "loss": 1.1064, "step": 9094 }, { "epoch": 0.17, "learning_rate": 4.741748129982555e-06, "loss": 0.902, "step": 9095 }, { "epoch": 0.17, "learning_rate": 4.741680505612677e-06, "loss": 0.908, "step": 9096 }, { "epoch": 0.17, "learning_rate": 4.7416128728724335e-06, "loss": 0.9799, "step": 9097 }, { "epoch": 0.17, "learning_rate": 4.741545231762076e-06, "loss": 0.8974, "step": 9098 }, { "epoch": 0.17, "learning_rate": 4.7414775822818575e-06, "loss": 1.0643, "step": 9099 }, { "epoch": 0.17, "learning_rate": 4.74140992443203e-06, "loss": 1.0739, "step": 9100 }, { "epoch": 0.17, "learning_rate": 4.741342258212846e-06, "loss": 0.8673, "step": 9101 }, { "epoch": 0.17, "learning_rate": 4.74127458362456e-06, "loss": 0.851, "step": 9102 }, { "epoch": 0.17, "learning_rate": 4.741206900667422e-06, "loss": 0.9786, "step": 9103 }, { "epoch": 0.17, "learning_rate": 4.741139209341688e-06, "loss": 0.8564, "step": 9104 }, { "epoch": 0.17, "learning_rate": 4.741071509647608e-06, "loss": 1.0712, "step": 9105 }, { "epoch": 0.17, "learning_rate": 4.741003801585435e-06, "loss": 1.1752, "step": 9106 }, { "epoch": 0.17, "learning_rate": 4.740936085155423e-06, "loss": 1.0094, "step": 9107 }, { "epoch": 0.17, "learning_rate": 4.740868360357824e-06, "loss": 1.085, "step": 9108 }, { "epoch": 0.17, "learning_rate": 4.740800627192892e-06, "loss": 0.8498, "step": 9109 }, { "epoch": 0.17, "learning_rate": 4.740732885660879e-06, "loss": 0.8503, "step": 9110 }, { "epoch": 0.17, "learning_rate": 4.740665135762038e-06, "loss": 0.8564, "step": 9111 }, { "epoch": 0.17, "learning_rate": 4.7405973774966214e-06, "loss": 1.1599, "step": 9112 }, { "epoch": 0.17, "learning_rate": 4.740529610864884e-06, "loss": 0.932, "step": 9113 }, { "epoch": 0.17, "learning_rate": 4.7404618358670775e-06, "loss": 1.0123, "step": 9114 }, { "epoch": 0.17, "learning_rate": 4.740394052503456e-06, "loss": 0.7558, "step": 9115 }, { "epoch": 0.17, "learning_rate": 4.7403262607742696e-06, "loss": 0.8618, "step": 9116 }, { "epoch": 0.17, "learning_rate": 4.740258460679775e-06, "loss": 1.0408, "step": 9117 }, { "epoch": 0.17, "learning_rate": 4.740190652220224e-06, "loss": 1.1167, "step": 9118 }, { "epoch": 0.17, "learning_rate": 4.74012283539587e-06, "loss": 0.8943, "step": 9119 }, { "epoch": 0.17, "learning_rate": 4.740055010206965e-06, "loss": 1.0469, "step": 9120 }, { "epoch": 0.17, "learning_rate": 4.739987176653764e-06, "loss": 1.0815, "step": 9121 }, { "epoch": 0.17, "learning_rate": 4.739919334736519e-06, "loss": 1.0045, "step": 9122 }, { "epoch": 0.17, "learning_rate": 4.739851484455484e-06, "loss": 0.7971, "step": 9123 }, { "epoch": 0.17, "learning_rate": 4.739783625810913e-06, "loss": 1.0654, "step": 9124 }, { "epoch": 0.17, "learning_rate": 4.739715758803059e-06, "loss": 1.1793, "step": 9125 }, { "epoch": 0.17, "learning_rate": 4.739647883432174e-06, "loss": 1.0712, "step": 9126 }, { "epoch": 0.17, "learning_rate": 4.739579999698512e-06, "loss": 1.0273, "step": 9127 }, { "epoch": 0.17, "learning_rate": 4.739512107602328e-06, "loss": 0.9352, "step": 9128 }, { "epoch": 0.17, "learning_rate": 4.739444207143874e-06, "loss": 0.8284, "step": 9129 }, { "epoch": 0.17, "learning_rate": 4.739376298323404e-06, "loss": 0.868, "step": 9130 }, { "epoch": 0.17, "learning_rate": 4.739308381141171e-06, "loss": 1.1039, "step": 9131 }, { "epoch": 0.17, "learning_rate": 4.73924045559743e-06, "loss": 1.1151, "step": 9132 }, { "epoch": 0.17, "learning_rate": 4.739172521692434e-06, "loss": 0.8959, "step": 9133 }, { "epoch": 0.17, "learning_rate": 4.739104579426436e-06, "loss": 0.9213, "step": 9134 }, { "epoch": 0.17, "learning_rate": 4.73903662879969e-06, "loss": 0.9086, "step": 9135 }, { "epoch": 0.17, "learning_rate": 4.738968669812451e-06, "loss": 0.8996, "step": 9136 }, { "epoch": 0.17, "learning_rate": 4.73890070246497e-06, "loss": 1.0283, "step": 9137 }, { "epoch": 0.17, "learning_rate": 4.738832726757503e-06, "loss": 1.063, "step": 9138 }, { "epoch": 0.17, "learning_rate": 4.7387647426903035e-06, "loss": 0.9152, "step": 9139 }, { "epoch": 0.17, "learning_rate": 4.738696750263625e-06, "loss": 0.9113, "step": 9140 }, { "epoch": 0.17, "learning_rate": 4.738628749477721e-06, "loss": 0.8168, "step": 9141 }, { "epoch": 0.17, "learning_rate": 4.738560740332847e-06, "loss": 0.9545, "step": 9142 }, { "epoch": 0.17, "learning_rate": 4.738492722829255e-06, "loss": 1.2298, "step": 9143 }, { "epoch": 0.17, "learning_rate": 4.7384246969672e-06, "loss": 1.1443, "step": 9144 }, { "epoch": 0.17, "learning_rate": 4.738356662746936e-06, "loss": 0.8425, "step": 9145 }, { "epoch": 0.17, "learning_rate": 4.738288620168716e-06, "loss": 0.8705, "step": 9146 }, { "epoch": 0.17, "learning_rate": 4.738220569232795e-06, "loss": 0.8934, "step": 9147 }, { "epoch": 0.17, "learning_rate": 4.738152509939428e-06, "loss": 0.8747, "step": 9148 }, { "epoch": 0.17, "learning_rate": 4.738084442288868e-06, "loss": 0.8292, "step": 9149 }, { "epoch": 0.17, "learning_rate": 4.738016366281369e-06, "loss": 1.1224, "step": 9150 }, { "epoch": 0.17, "learning_rate": 4.737948281917186e-06, "loss": 0.8925, "step": 9151 }, { "epoch": 0.17, "learning_rate": 4.737880189196572e-06, "loss": 0.9365, "step": 9152 }, { "epoch": 0.17, "learning_rate": 4.737812088119782e-06, "loss": 0.8195, "step": 9153 }, { "epoch": 0.17, "learning_rate": 4.73774397868707e-06, "loss": 0.7842, "step": 9154 }, { "epoch": 0.17, "learning_rate": 4.7376758608986914e-06, "loss": 0.7268, "step": 9155 }, { "epoch": 0.17, "learning_rate": 4.7376077347549e-06, "loss": 1.1848, "step": 9156 }, { "epoch": 0.17, "learning_rate": 4.737539600255949e-06, "loss": 1.0519, "step": 9157 }, { "epoch": 0.17, "learning_rate": 4.737471457402094e-06, "loss": 0.7472, "step": 9158 }, { "epoch": 0.17, "learning_rate": 4.73740330619359e-06, "loss": 0.9644, "step": 9159 }, { "epoch": 0.17, "learning_rate": 4.7373351466306895e-06, "loss": 0.9028, "step": 9160 }, { "epoch": 0.17, "learning_rate": 4.737266978713649e-06, "loss": 1.1014, "step": 9161 }, { "epoch": 0.17, "learning_rate": 4.737198802442722e-06, "loss": 1.0393, "step": 9162 }, { "epoch": 0.17, "learning_rate": 4.737130617818163e-06, "loss": 1.0071, "step": 9163 }, { "epoch": 0.17, "learning_rate": 4.737062424840226e-06, "loss": 0.9016, "step": 9164 }, { "epoch": 0.17, "learning_rate": 4.736994223509168e-06, "loss": 0.9904, "step": 9165 }, { "epoch": 0.17, "learning_rate": 4.736926013825242e-06, "loss": 0.8708, "step": 9166 }, { "epoch": 0.17, "learning_rate": 4.736857795788703e-06, "loss": 0.8907, "step": 9167 }, { "epoch": 0.17, "learning_rate": 4.7367895693998045e-06, "loss": 1.0985, "step": 9168 }, { "epoch": 0.17, "learning_rate": 4.736721334658802e-06, "loss": 1.0358, "step": 9169 }, { "epoch": 0.17, "learning_rate": 4.736653091565953e-06, "loss": 0.9492, "step": 9170 }, { "epoch": 0.17, "learning_rate": 4.7365848401215075e-06, "loss": 0.9756, "step": 9171 }, { "epoch": 0.17, "learning_rate": 4.736516580325724e-06, "loss": 0.8073, "step": 9172 }, { "epoch": 0.17, "learning_rate": 4.736448312178856e-06, "loss": 0.8251, "step": 9173 }, { "epoch": 0.17, "learning_rate": 4.736380035681158e-06, "loss": 0.9957, "step": 9174 }, { "epoch": 0.17, "learning_rate": 4.736311750832886e-06, "loss": 1.1036, "step": 9175 }, { "epoch": 0.17, "learning_rate": 4.736243457634294e-06, "loss": 0.7327, "step": 9176 }, { "epoch": 0.17, "learning_rate": 4.736175156085638e-06, "loss": 0.8633, "step": 9177 }, { "epoch": 0.17, "learning_rate": 4.736106846187173e-06, "loss": 0.9319, "step": 9178 }, { "epoch": 0.17, "learning_rate": 4.736038527939153e-06, "loss": 1.0149, "step": 9179 }, { "epoch": 0.17, "learning_rate": 4.735970201341834e-06, "loss": 1.0046, "step": 9180 }, { "epoch": 0.17, "learning_rate": 4.73590186639547e-06, "loss": 0.9625, "step": 9181 }, { "epoch": 0.17, "learning_rate": 4.7358335231003185e-06, "loss": 0.9892, "step": 9182 }, { "epoch": 0.17, "learning_rate": 4.735765171456632e-06, "loss": 1.1343, "step": 9183 }, { "epoch": 0.17, "learning_rate": 4.735696811464667e-06, "loss": 0.9697, "step": 9184 }, { "epoch": 0.17, "learning_rate": 4.735628443124678e-06, "loss": 1.0411, "step": 9185 }, { "epoch": 0.17, "learning_rate": 4.735560066436922e-06, "loss": 0.884, "step": 9186 }, { "epoch": 0.17, "learning_rate": 4.735491681401653e-06, "loss": 1.1131, "step": 9187 }, { "epoch": 0.17, "learning_rate": 4.735423288019127e-06, "loss": 1.0498, "step": 9188 }, { "epoch": 0.17, "learning_rate": 4.7353548862895985e-06, "loss": 0.8719, "step": 9189 }, { "epoch": 0.17, "learning_rate": 4.735286476213323e-06, "loss": 0.8878, "step": 9190 }, { "epoch": 0.17, "learning_rate": 4.735218057790557e-06, "loss": 0.9636, "step": 9191 }, { "epoch": 0.17, "learning_rate": 4.735149631021555e-06, "loss": 0.8983, "step": 9192 }, { "epoch": 0.17, "learning_rate": 4.735081195906574e-06, "loss": 1.1686, "step": 9193 }, { "epoch": 0.17, "learning_rate": 4.735012752445866e-06, "loss": 1.0039, "step": 9194 }, { "epoch": 0.17, "learning_rate": 4.7349443006396915e-06, "loss": 0.823, "step": 9195 }, { "epoch": 0.17, "learning_rate": 4.734875840488301e-06, "loss": 1.0655, "step": 9196 }, { "epoch": 0.17, "learning_rate": 4.734807371991954e-06, "loss": 0.7896, "step": 9197 }, { "epoch": 0.17, "learning_rate": 4.734738895150905e-06, "loss": 0.9835, "step": 9198 }, { "epoch": 0.17, "learning_rate": 4.734670409965409e-06, "loss": 1.023, "step": 9199 }, { "epoch": 0.17, "learning_rate": 4.734601916435722e-06, "loss": 1.2607, "step": 9200 }, { "epoch": 0.17, "learning_rate": 4.7345334145621e-06, "loss": 1.1744, "step": 9201 }, { "epoch": 0.17, "learning_rate": 4.734464904344799e-06, "loss": 0.9374, "step": 9202 }, { "epoch": 0.17, "learning_rate": 4.7343963857840745e-06, "loss": 0.9565, "step": 9203 }, { "epoch": 0.17, "learning_rate": 4.734327858880183e-06, "loss": 0.7234, "step": 9204 }, { "epoch": 0.17, "learning_rate": 4.734259323633379e-06, "loss": 1.0696, "step": 9205 }, { "epoch": 0.17, "learning_rate": 4.73419078004392e-06, "loss": 1.0594, "step": 9206 }, { "epoch": 0.17, "learning_rate": 4.734122228112061e-06, "loss": 0.8393, "step": 9207 }, { "epoch": 0.17, "learning_rate": 4.734053667838057e-06, "loss": 0.9788, "step": 9208 }, { "epoch": 0.17, "learning_rate": 4.733985099222166e-06, "loss": 0.9305, "step": 9209 }, { "epoch": 0.17, "learning_rate": 4.733916522264642e-06, "loss": 0.8033, "step": 9210 }, { "epoch": 0.17, "learning_rate": 4.7338479369657435e-06, "loss": 0.9702, "step": 9211 }, { "epoch": 0.17, "learning_rate": 4.733779343325725e-06, "loss": 0.9913, "step": 9212 }, { "epoch": 0.17, "learning_rate": 4.733710741344842e-06, "loss": 1.0031, "step": 9213 }, { "epoch": 0.17, "learning_rate": 4.733642131023353e-06, "loss": 1.1047, "step": 9214 }, { "epoch": 0.17, "learning_rate": 4.733573512361512e-06, "loss": 0.8412, "step": 9215 }, { "epoch": 0.17, "learning_rate": 4.733504885359577e-06, "loss": 0.9838, "step": 9216 }, { "epoch": 0.17, "learning_rate": 4.733436250017802e-06, "loss": 0.9675, "step": 9217 }, { "epoch": 0.17, "learning_rate": 4.733367606336445e-06, "loss": 1.0317, "step": 9218 }, { "epoch": 0.17, "learning_rate": 4.7332989543157615e-06, "loss": 1.0377, "step": 9219 }, { "epoch": 0.17, "learning_rate": 4.733230293956008e-06, "loss": 0.8801, "step": 9220 }, { "epoch": 0.17, "learning_rate": 4.733161625257442e-06, "loss": 0.7654, "step": 9221 }, { "epoch": 0.17, "learning_rate": 4.733092948220318e-06, "loss": 0.7229, "step": 9222 }, { "epoch": 0.17, "learning_rate": 4.733024262844894e-06, "loss": 0.9292, "step": 9223 }, { "epoch": 0.17, "learning_rate": 4.732955569131425e-06, "loss": 1.0271, "step": 9224 }, { "epoch": 0.17, "learning_rate": 4.73288686708017e-06, "loss": 1.0595, "step": 9225 }, { "epoch": 0.17, "learning_rate": 4.732818156691383e-06, "loss": 0.8428, "step": 9226 }, { "epoch": 0.17, "learning_rate": 4.732749437965321e-06, "loss": 0.8318, "step": 9227 }, { "epoch": 0.17, "learning_rate": 4.732680710902242e-06, "loss": 0.8295, "step": 9228 }, { "epoch": 0.17, "learning_rate": 4.732611975502402e-06, "loss": 0.9283, "step": 9229 }, { "epoch": 0.17, "learning_rate": 4.7325432317660556e-06, "loss": 1.1555, "step": 9230 }, { "epoch": 0.17, "learning_rate": 4.732474479693462e-06, "loss": 1.3468, "step": 9231 }, { "epoch": 0.17, "learning_rate": 4.732405719284877e-06, "loss": 0.9604, "step": 9232 }, { "epoch": 0.17, "learning_rate": 4.732336950540558e-06, "loss": 0.8723, "step": 9233 }, { "epoch": 0.17, "learning_rate": 4.732268173460761e-06, "loss": 0.9973, "step": 9234 }, { "epoch": 0.17, "learning_rate": 4.732199388045743e-06, "loss": 0.8423, "step": 9235 }, { "epoch": 0.17, "learning_rate": 4.732130594295762e-06, "loss": 0.9661, "step": 9236 }, { "epoch": 0.17, "learning_rate": 4.7320617922110724e-06, "loss": 0.8355, "step": 9237 }, { "epoch": 0.17, "learning_rate": 4.731992981791933e-06, "loss": 1.0615, "step": 9238 }, { "epoch": 0.17, "learning_rate": 4.7319241630386e-06, "loss": 1.0339, "step": 9239 }, { "epoch": 0.17, "learning_rate": 4.7318553359513305e-06, "loss": 0.9385, "step": 9240 }, { "epoch": 0.17, "learning_rate": 4.731786500530382e-06, "loss": 0.8436, "step": 9241 }, { "epoch": 0.17, "learning_rate": 4.7317176567760105e-06, "loss": 0.9589, "step": 9242 }, { "epoch": 0.17, "learning_rate": 4.7316488046884745e-06, "loss": 1.0682, "step": 9243 }, { "epoch": 0.17, "learning_rate": 4.73157994426803e-06, "loss": 0.9392, "step": 9244 }, { "epoch": 0.17, "learning_rate": 4.731511075514935e-06, "loss": 1.0733, "step": 9245 }, { "epoch": 0.17, "learning_rate": 4.731442198429445e-06, "loss": 0.9477, "step": 9246 }, { "epoch": 0.17, "learning_rate": 4.731373313011819e-06, "loss": 1.1325, "step": 9247 }, { "epoch": 0.17, "learning_rate": 4.731304419262313e-06, "loss": 0.8941, "step": 9248 }, { "epoch": 0.17, "learning_rate": 4.731235517181185e-06, "loss": 1.0375, "step": 9249 }, { "epoch": 0.17, "learning_rate": 4.7311666067686925e-06, "loss": 1.2003, "step": 9250 }, { "epoch": 0.17, "learning_rate": 4.731097688025091e-06, "loss": 0.9798, "step": 9251 }, { "epoch": 0.17, "learning_rate": 4.73102876095064e-06, "loss": 0.9005, "step": 9252 }, { "epoch": 0.17, "learning_rate": 4.7309598255455955e-06, "loss": 1.1046, "step": 9253 }, { "epoch": 0.17, "learning_rate": 4.730890881810216e-06, "loss": 0.78, "step": 9254 }, { "epoch": 0.17, "learning_rate": 4.730821929744759e-06, "loss": 0.8243, "step": 9255 }, { "epoch": 0.17, "learning_rate": 4.7307529693494795e-06, "loss": 1.1075, "step": 9256 }, { "epoch": 0.17, "learning_rate": 4.730684000624638e-06, "loss": 1.0305, "step": 9257 }, { "epoch": 0.17, "learning_rate": 4.73061502357049e-06, "loss": 0.9847, "step": 9258 }, { "epoch": 0.17, "learning_rate": 4.7305460381872944e-06, "loss": 1.0647, "step": 9259 }, { "epoch": 0.17, "learning_rate": 4.730477044475309e-06, "loss": 0.9015, "step": 9260 }, { "epoch": 0.17, "learning_rate": 4.7304080424347894e-06, "loss": 0.8275, "step": 9261 }, { "epoch": 0.17, "learning_rate": 4.730339032065996e-06, "loss": 1.0991, "step": 9262 }, { "epoch": 0.17, "learning_rate": 4.730270013369183e-06, "loss": 0.8688, "step": 9263 }, { "epoch": 0.17, "learning_rate": 4.730200986344613e-06, "loss": 0.8252, "step": 9264 }, { "epoch": 0.17, "learning_rate": 4.7301319509925395e-06, "loss": 0.8971, "step": 9265 }, { "epoch": 0.17, "learning_rate": 4.730062907313221e-06, "loss": 0.8037, "step": 9266 }, { "epoch": 0.17, "learning_rate": 4.7299938553069155e-06, "loss": 0.7635, "step": 9267 }, { "epoch": 0.17, "learning_rate": 4.729924794973883e-06, "loss": 0.9855, "step": 9268 }, { "epoch": 0.17, "learning_rate": 4.729855726314379e-06, "loss": 0.856, "step": 9269 }, { "epoch": 0.17, "learning_rate": 4.729786649328662e-06, "loss": 0.9116, "step": 9270 }, { "epoch": 0.17, "learning_rate": 4.72971756401699e-06, "loss": 0.8409, "step": 9271 }, { "epoch": 0.17, "learning_rate": 4.729648470379621e-06, "loss": 1.0219, "step": 9272 }, { "epoch": 0.17, "learning_rate": 4.729579368416813e-06, "loss": 0.9508, "step": 9273 }, { "epoch": 0.17, "learning_rate": 4.729510258128824e-06, "loss": 0.9101, "step": 9274 }, { "epoch": 0.17, "learning_rate": 4.729441139515912e-06, "loss": 1.1232, "step": 9275 }, { "epoch": 0.18, "learning_rate": 4.729372012578335e-06, "loss": 1.0326, "step": 9276 }, { "epoch": 0.18, "learning_rate": 4.7293028773163515e-06, "loss": 0.7994, "step": 9277 }, { "epoch": 0.18, "learning_rate": 4.729233733730219e-06, "loss": 0.9825, "step": 9278 }, { "epoch": 0.18, "learning_rate": 4.729164581820197e-06, "loss": 0.9155, "step": 9279 }, { "epoch": 0.18, "learning_rate": 4.729095421586543e-06, "loss": 0.8056, "step": 9280 }, { "epoch": 0.18, "learning_rate": 4.729026253029514e-06, "loss": 1.1757, "step": 9281 }, { "epoch": 0.18, "learning_rate": 4.72895707614937e-06, "loss": 1.0013, "step": 9282 }, { "epoch": 0.18, "learning_rate": 4.7288878909463675e-06, "loss": 0.8929, "step": 9283 }, { "epoch": 0.18, "learning_rate": 4.728818697420767e-06, "loss": 1.1395, "step": 9284 }, { "epoch": 0.18, "learning_rate": 4.728749495572825e-06, "loss": 1.1297, "step": 9285 }, { "epoch": 0.18, "learning_rate": 4.728680285402801e-06, "loss": 1.0308, "step": 9286 }, { "epoch": 0.18, "learning_rate": 4.728611066910954e-06, "loss": 1.051, "step": 9287 }, { "epoch": 0.18, "learning_rate": 4.728541840097541e-06, "loss": 1.1763, "step": 9288 }, { "epoch": 0.18, "learning_rate": 4.728472604962821e-06, "loss": 0.8969, "step": 9289 }, { "epoch": 0.18, "learning_rate": 4.728403361507053e-06, "loss": 1.0428, "step": 9290 }, { "epoch": 0.18, "learning_rate": 4.728334109730495e-06, "loss": 1.0175, "step": 9291 }, { "epoch": 0.18, "learning_rate": 4.728264849633405e-06, "loss": 0.897, "step": 9292 }, { "epoch": 0.18, "learning_rate": 4.728195581216043e-06, "loss": 1.1754, "step": 9293 }, { "epoch": 0.18, "learning_rate": 4.728126304478667e-06, "loss": 1.2635, "step": 9294 }, { "epoch": 0.18, "learning_rate": 4.728057019421536e-06, "loss": 0.9828, "step": 9295 }, { "epoch": 0.18, "learning_rate": 4.727987726044908e-06, "loss": 0.8809, "step": 9296 }, { "epoch": 0.18, "learning_rate": 4.727918424349042e-06, "loss": 1.1287, "step": 9297 }, { "epoch": 0.18, "learning_rate": 4.727849114334198e-06, "loss": 0.7343, "step": 9298 }, { "epoch": 0.18, "learning_rate": 4.7277797960006326e-06, "loss": 1.0404, "step": 9299 }, { "epoch": 0.18, "learning_rate": 4.727710469348606e-06, "loss": 1.0764, "step": 9300 }, { "epoch": 0.18, "learning_rate": 4.727641134378377e-06, "loss": 0.8797, "step": 9301 }, { "epoch": 0.18, "learning_rate": 4.727571791090204e-06, "loss": 0.8341, "step": 9302 }, { "epoch": 0.18, "learning_rate": 4.727502439484346e-06, "loss": 1.0432, "step": 9303 }, { "epoch": 0.18, "learning_rate": 4.727433079561063e-06, "loss": 0.9048, "step": 9304 }, { "epoch": 0.18, "learning_rate": 4.727363711320613e-06, "loss": 1.0629, "step": 9305 }, { "epoch": 0.18, "learning_rate": 4.727294334763254e-06, "loss": 0.9724, "step": 9306 }, { "epoch": 0.18, "learning_rate": 4.727224949889247e-06, "loss": 0.9529, "step": 9307 }, { "epoch": 0.18, "learning_rate": 4.727155556698852e-06, "loss": 1.045, "step": 9308 }, { "epoch": 0.18, "learning_rate": 4.727086155192324e-06, "loss": 0.8994, "step": 9309 }, { "epoch": 0.18, "learning_rate": 4.7270167453699254e-06, "loss": 0.8474, "step": 9310 }, { "epoch": 0.18, "learning_rate": 4.726947327231915e-06, "loss": 0.9949, "step": 9311 }, { "epoch": 0.18, "learning_rate": 4.7268779007785515e-06, "loss": 1.1973, "step": 9312 }, { "epoch": 0.18, "learning_rate": 4.7268084660100935e-06, "loss": 1.1866, "step": 9313 }, { "epoch": 0.18, "learning_rate": 4.726739022926802e-06, "loss": 1.0317, "step": 9314 }, { "epoch": 0.18, "learning_rate": 4.726669571528934e-06, "loss": 0.9601, "step": 9315 }, { "epoch": 0.18, "learning_rate": 4.7266001118167505e-06, "loss": 0.9355, "step": 9316 }, { "epoch": 0.18, "learning_rate": 4.726530643790511e-06, "loss": 0.8801, "step": 9317 }, { "epoch": 0.18, "learning_rate": 4.726461167450474e-06, "loss": 0.8648, "step": 9318 }, { "epoch": 0.18, "learning_rate": 4.726391682796899e-06, "loss": 1.1998, "step": 9319 }, { "epoch": 0.18, "learning_rate": 4.7263221898300464e-06, "loss": 0.9108, "step": 9320 }, { "epoch": 0.18, "learning_rate": 4.7262526885501744e-06, "loss": 0.8155, "step": 9321 }, { "epoch": 0.18, "learning_rate": 4.726183178957544e-06, "loss": 0.9009, "step": 9322 }, { "epoch": 0.18, "learning_rate": 4.7261136610524126e-06, "loss": 1.0291, "step": 9323 }, { "epoch": 0.18, "learning_rate": 4.726044134835042e-06, "loss": 1.1536, "step": 9324 }, { "epoch": 0.18, "learning_rate": 4.72597460030569e-06, "loss": 1.0933, "step": 9325 }, { "epoch": 0.18, "learning_rate": 4.725905057464618e-06, "loss": 0.974, "step": 9326 }, { "epoch": 0.18, "learning_rate": 4.725835506312085e-06, "loss": 0.9521, "step": 9327 }, { "epoch": 0.18, "learning_rate": 4.72576594684835e-06, "loss": 0.9946, "step": 9328 }, { "epoch": 0.18, "learning_rate": 4.725696379073672e-06, "loss": 0.9283, "step": 9329 }, { "epoch": 0.18, "learning_rate": 4.7256268029883135e-06, "loss": 0.9189, "step": 9330 }, { "epoch": 0.18, "learning_rate": 4.725557218592532e-06, "loss": 1.141, "step": 9331 }, { "epoch": 0.18, "learning_rate": 4.725487625886589e-06, "loss": 1.164, "step": 9332 }, { "epoch": 0.18, "learning_rate": 4.725418024870743e-06, "loss": 0.9121, "step": 9333 }, { "epoch": 0.18, "learning_rate": 4.725348415545253e-06, "loss": 1.0554, "step": 9334 }, { "epoch": 0.18, "learning_rate": 4.725278797910382e-06, "loss": 0.8361, "step": 9335 }, { "epoch": 0.18, "learning_rate": 4.725209171966387e-06, "loss": 0.9607, "step": 9336 }, { "epoch": 0.18, "learning_rate": 4.72513953771353e-06, "loss": 0.8964, "step": 9337 }, { "epoch": 0.18, "learning_rate": 4.72506989515207e-06, "loss": 1.0556, "step": 9338 }, { "epoch": 0.18, "learning_rate": 4.725000244282267e-06, "loss": 0.9141, "step": 9339 }, { "epoch": 0.18, "learning_rate": 4.724930585104381e-06, "loss": 0.923, "step": 9340 }, { "epoch": 0.18, "learning_rate": 4.7248609176186736e-06, "loss": 0.8776, "step": 9341 }, { "epoch": 0.18, "learning_rate": 4.724791241825403e-06, "loss": 0.9086, "step": 9342 }, { "epoch": 0.18, "learning_rate": 4.72472155772483e-06, "loss": 1.0045, "step": 9343 }, { "epoch": 0.18, "learning_rate": 4.724651865317215e-06, "loss": 1.2339, "step": 9344 }, { "epoch": 0.18, "learning_rate": 4.724582164602819e-06, "loss": 0.9643, "step": 9345 }, { "epoch": 0.18, "learning_rate": 4.7245124555819e-06, "loss": 0.8908, "step": 9346 }, { "epoch": 0.18, "learning_rate": 4.72444273825472e-06, "loss": 1.0649, "step": 9347 }, { "epoch": 0.18, "learning_rate": 4.724373012621539e-06, "loss": 0.9016, "step": 9348 }, { "epoch": 0.18, "learning_rate": 4.724303278682618e-06, "loss": 0.9846, "step": 9349 }, { "epoch": 0.18, "learning_rate": 4.724233536438216e-06, "loss": 1.0322, "step": 9350 }, { "epoch": 0.18, "learning_rate": 4.724163785888595e-06, "loss": 0.8264, "step": 9351 }, { "epoch": 0.18, "learning_rate": 4.724094027034014e-06, "loss": 0.8142, "step": 9352 }, { "epoch": 0.18, "learning_rate": 4.724024259874734e-06, "loss": 0.8616, "step": 9353 }, { "epoch": 0.18, "learning_rate": 4.7239544844110164e-06, "loss": 0.8284, "step": 9354 }, { "epoch": 0.18, "learning_rate": 4.723884700643121e-06, "loss": 0.8785, "step": 9355 }, { "epoch": 0.18, "learning_rate": 4.7238149085713075e-06, "loss": 1.1551, "step": 9356 }, { "epoch": 0.18, "learning_rate": 4.723745108195837e-06, "loss": 0.9563, "step": 9357 }, { "epoch": 0.18, "learning_rate": 4.723675299516972e-06, "loss": 0.8259, "step": 9358 }, { "epoch": 0.18, "learning_rate": 4.72360548253497e-06, "loss": 0.7505, "step": 9359 }, { "epoch": 0.18, "learning_rate": 4.723535657250095e-06, "loss": 0.7284, "step": 9360 }, { "epoch": 0.18, "learning_rate": 4.723465823662604e-06, "loss": 1.0643, "step": 9361 }, { "epoch": 0.18, "learning_rate": 4.723395981772762e-06, "loss": 1.0472, "step": 9362 }, { "epoch": 0.18, "learning_rate": 4.723326131580825e-06, "loss": 1.116, "step": 9363 }, { "epoch": 0.18, "learning_rate": 4.723256273087058e-06, "loss": 1.0581, "step": 9364 }, { "epoch": 0.18, "learning_rate": 4.72318640629172e-06, "loss": 1.0002, "step": 9365 }, { "epoch": 0.18, "learning_rate": 4.723116531195072e-06, "loss": 0.8706, "step": 9366 }, { "epoch": 0.18, "learning_rate": 4.7230466477973755e-06, "loss": 0.9007, "step": 9367 }, { "epoch": 0.18, "learning_rate": 4.7229767560988906e-06, "loss": 1.1381, "step": 9368 }, { "epoch": 0.18, "learning_rate": 4.722906856099878e-06, "loss": 1.1308, "step": 9369 }, { "epoch": 0.18, "learning_rate": 4.7228369478006005e-06, "loss": 1.0449, "step": 9370 }, { "epoch": 0.18, "learning_rate": 4.722767031201317e-06, "loss": 1.0511, "step": 9371 }, { "epoch": 0.18, "learning_rate": 4.722697106302291e-06, "loss": 0.8109, "step": 9372 }, { "epoch": 0.18, "learning_rate": 4.722627173103781e-06, "loss": 0.9935, "step": 9373 }, { "epoch": 0.18, "learning_rate": 4.722557231606049e-06, "loss": 1.1641, "step": 9374 }, { "epoch": 0.18, "learning_rate": 4.722487281809358e-06, "loss": 1.1553, "step": 9375 }, { "epoch": 0.18, "learning_rate": 4.722417323713966e-06, "loss": 0.9488, "step": 9376 }, { "epoch": 0.18, "learning_rate": 4.722347357320136e-06, "loss": 0.7861, "step": 9377 }, { "epoch": 0.18, "learning_rate": 4.722277382628131e-06, "loss": 0.9073, "step": 9378 }, { "epoch": 0.18, "learning_rate": 4.722207399638208e-06, "loss": 0.8818, "step": 9379 }, { "epoch": 0.18, "learning_rate": 4.722137408350632e-06, "loss": 1.1014, "step": 9380 }, { "epoch": 0.18, "learning_rate": 4.722067408765662e-06, "loss": 1.1107, "step": 9381 }, { "epoch": 0.18, "learning_rate": 4.721997400883562e-06, "loss": 0.9109, "step": 9382 }, { "epoch": 0.18, "learning_rate": 4.721927384704591e-06, "loss": 0.8406, "step": 9383 }, { "epoch": 0.18, "learning_rate": 4.7218573602290106e-06, "loss": 0.7395, "step": 9384 }, { "epoch": 0.18, "learning_rate": 4.721787327457083e-06, "loss": 0.9286, "step": 9385 }, { "epoch": 0.18, "learning_rate": 4.721717286389071e-06, "loss": 0.906, "step": 9386 }, { "epoch": 0.18, "learning_rate": 4.721647237025234e-06, "loss": 1.2039, "step": 9387 }, { "epoch": 0.18, "learning_rate": 4.7215771793658345e-06, "loss": 0.9156, "step": 9388 }, { "epoch": 0.18, "learning_rate": 4.721507113411133e-06, "loss": 0.9709, "step": 9389 }, { "epoch": 0.18, "learning_rate": 4.721437039161393e-06, "loss": 0.9355, "step": 9390 }, { "epoch": 0.18, "learning_rate": 4.721366956616875e-06, "loss": 0.9344, "step": 9391 }, { "epoch": 0.18, "learning_rate": 4.721296865777841e-06, "loss": 0.9402, "step": 9392 }, { "epoch": 0.18, "learning_rate": 4.721226766644553e-06, "loss": 0.734, "step": 9393 }, { "epoch": 0.18, "learning_rate": 4.721156659217272e-06, "loss": 1.0593, "step": 9394 }, { "epoch": 0.18, "learning_rate": 4.721086543496259e-06, "loss": 0.9031, "step": 9395 }, { "epoch": 0.18, "learning_rate": 4.7210164194817785e-06, "loss": 1.0876, "step": 9396 }, { "epoch": 0.18, "learning_rate": 4.7209462871740905e-06, "loss": 0.8868, "step": 9397 }, { "epoch": 0.18, "learning_rate": 4.720876146573456e-06, "loss": 0.9932, "step": 9398 }, { "epoch": 0.18, "learning_rate": 4.72080599768014e-06, "loss": 0.9355, "step": 9399 }, { "epoch": 0.18, "learning_rate": 4.720735840494401e-06, "loss": 1.1104, "step": 9400 }, { "epoch": 0.18, "learning_rate": 4.720665675016503e-06, "loss": 0.8751, "step": 9401 }, { "epoch": 0.18, "learning_rate": 4.7205955012467075e-06, "loss": 0.8837, "step": 9402 }, { "epoch": 0.18, "learning_rate": 4.720525319185277e-06, "loss": 0.8453, "step": 9403 }, { "epoch": 0.18, "learning_rate": 4.720455128832471e-06, "loss": 0.8192, "step": 9404 }, { "epoch": 0.18, "learning_rate": 4.720384930188555e-06, "loss": 0.8656, "step": 9405 }, { "epoch": 0.18, "learning_rate": 4.72031472325379e-06, "loss": 0.913, "step": 9406 }, { "epoch": 0.18, "learning_rate": 4.7202445080284385e-06, "loss": 0.9188, "step": 9407 }, { "epoch": 0.18, "learning_rate": 4.72017428451276e-06, "loss": 1.1711, "step": 9408 }, { "epoch": 0.18, "learning_rate": 4.720104052707021e-06, "loss": 0.8083, "step": 9409 }, { "epoch": 0.18, "learning_rate": 4.720033812611481e-06, "loss": 0.9211, "step": 9410 }, { "epoch": 0.18, "learning_rate": 4.719963564226402e-06, "loss": 1.0278, "step": 9411 }, { "epoch": 0.18, "learning_rate": 4.719893307552048e-06, "loss": 1.1718, "step": 9412 }, { "epoch": 0.18, "learning_rate": 4.719823042588679e-06, "loss": 0.9697, "step": 9413 }, { "epoch": 0.18, "learning_rate": 4.71975276933656e-06, "loss": 1.0085, "step": 9414 }, { "epoch": 0.18, "learning_rate": 4.719682487795952e-06, "loss": 0.7305, "step": 9415 }, { "epoch": 0.18, "learning_rate": 4.719612197967117e-06, "loss": 1.0173, "step": 9416 }, { "epoch": 0.18, "learning_rate": 4.719541899850319e-06, "loss": 0.9478, "step": 9417 }, { "epoch": 0.18, "learning_rate": 4.71947159344582e-06, "loss": 0.8096, "step": 9418 }, { "epoch": 0.18, "learning_rate": 4.719401278753881e-06, "loss": 0.9608, "step": 9419 }, { "epoch": 0.18, "learning_rate": 4.719330955774767e-06, "loss": 0.9809, "step": 9420 }, { "epoch": 0.18, "learning_rate": 4.719260624508738e-06, "loss": 0.9979, "step": 9421 }, { "epoch": 0.18, "learning_rate": 4.719190284956058e-06, "loss": 0.7678, "step": 9422 }, { "epoch": 0.18, "learning_rate": 4.7191199371169906e-06, "loss": 1.0657, "step": 9423 }, { "epoch": 0.18, "learning_rate": 4.719049580991796e-06, "loss": 1.0317, "step": 9424 }, { "epoch": 0.18, "learning_rate": 4.718979216580739e-06, "loss": 1.2157, "step": 9425 }, { "epoch": 0.18, "learning_rate": 4.718908843884081e-06, "loss": 0.9792, "step": 9426 }, { "epoch": 0.18, "learning_rate": 4.718838462902086e-06, "loss": 1.0892, "step": 9427 }, { "epoch": 0.18, "learning_rate": 4.7187680736350165e-06, "loss": 0.9338, "step": 9428 }, { "epoch": 0.18, "learning_rate": 4.718697676083135e-06, "loss": 0.8132, "step": 9429 }, { "epoch": 0.18, "learning_rate": 4.718627270246704e-06, "loss": 1.0604, "step": 9430 }, { "epoch": 0.18, "learning_rate": 4.718556856125987e-06, "loss": 1.2731, "step": 9431 }, { "epoch": 0.18, "learning_rate": 4.718486433721247e-06, "loss": 1.1271, "step": 9432 }, { "epoch": 0.18, "learning_rate": 4.718416003032746e-06, "loss": 0.9697, "step": 9433 }, { "epoch": 0.18, "learning_rate": 4.718345564060748e-06, "loss": 0.8783, "step": 9434 }, { "epoch": 0.18, "learning_rate": 4.718275116805515e-06, "loss": 0.8371, "step": 9435 }, { "epoch": 0.18, "learning_rate": 4.718204661267312e-06, "loss": 1.1818, "step": 9436 }, { "epoch": 0.18, "learning_rate": 4.7181341974464e-06, "loss": 1.2776, "step": 9437 }, { "epoch": 0.18, "learning_rate": 4.718063725343043e-06, "loss": 0.9122, "step": 9438 }, { "epoch": 0.18, "learning_rate": 4.717993244957504e-06, "loss": 0.7423, "step": 9439 }, { "epoch": 0.18, "learning_rate": 4.717922756290046e-06, "loss": 0.9127, "step": 9440 }, { "epoch": 0.18, "learning_rate": 4.717852259340934e-06, "loss": 0.9033, "step": 9441 }, { "epoch": 0.18, "learning_rate": 4.717781754110427e-06, "loss": 0.9068, "step": 9442 }, { "epoch": 0.18, "learning_rate": 4.717711240598794e-06, "loss": 1.1808, "step": 9443 }, { "epoch": 0.18, "learning_rate": 4.717640718806292e-06, "loss": 1.066, "step": 9444 }, { "epoch": 0.18, "learning_rate": 4.71757018873319e-06, "loss": 0.8999, "step": 9445 }, { "epoch": 0.18, "learning_rate": 4.717499650379748e-06, "loss": 0.8967, "step": 9446 }, { "epoch": 0.18, "learning_rate": 4.71742910374623e-06, "loss": 0.8823, "step": 9447 }, { "epoch": 0.18, "learning_rate": 4.717358548832901e-06, "loss": 0.9014, "step": 9448 }, { "epoch": 0.18, "learning_rate": 4.717287985640022e-06, "loss": 1.0396, "step": 9449 }, { "epoch": 0.18, "learning_rate": 4.7172174141678576e-06, "loss": 1.0074, "step": 9450 }, { "epoch": 0.18, "learning_rate": 4.717146834416671e-06, "loss": 0.8922, "step": 9451 }, { "epoch": 0.18, "learning_rate": 4.717076246386728e-06, "loss": 0.7307, "step": 9452 }, { "epoch": 0.18, "learning_rate": 4.717005650078289e-06, "loss": 0.8716, "step": 9453 }, { "epoch": 0.18, "learning_rate": 4.716935045491618e-06, "loss": 0.9985, "step": 9454 }, { "epoch": 0.18, "learning_rate": 4.716864432626981e-06, "loss": 0.9707, "step": 9455 }, { "epoch": 0.18, "learning_rate": 4.716793811484639e-06, "loss": 1.0607, "step": 9456 }, { "epoch": 0.18, "learning_rate": 4.716723182064859e-06, "loss": 0.9145, "step": 9457 }, { "epoch": 0.18, "learning_rate": 4.7166525443679e-06, "loss": 0.8321, "step": 9458 }, { "epoch": 0.18, "learning_rate": 4.71658189839403e-06, "loss": 0.9196, "step": 9459 }, { "epoch": 0.18, "learning_rate": 4.7165112441435105e-06, "loss": 0.9247, "step": 9460 }, { "epoch": 0.18, "learning_rate": 4.716440581616606e-06, "loss": 0.8031, "step": 9461 }, { "epoch": 0.18, "learning_rate": 4.71636991081358e-06, "loss": 0.9761, "step": 9462 }, { "epoch": 0.18, "learning_rate": 4.716299231734697e-06, "loss": 0.9882, "step": 9463 }, { "epoch": 0.18, "learning_rate": 4.716228544380221e-06, "loss": 0.9527, "step": 9464 }, { "epoch": 0.18, "learning_rate": 4.7161578487504155e-06, "loss": 1.112, "step": 9465 }, { "epoch": 0.18, "learning_rate": 4.716087144845544e-06, "loss": 0.9566, "step": 9466 }, { "epoch": 0.18, "learning_rate": 4.716016432665872e-06, "loss": 1.0633, "step": 9467 }, { "epoch": 0.18, "learning_rate": 4.7159457122116615e-06, "loss": 1.1722, "step": 9468 }, { "epoch": 0.18, "learning_rate": 4.7158749834831785e-06, "loss": 1.0049, "step": 9469 }, { "epoch": 0.18, "learning_rate": 4.7158042464806854e-06, "loss": 0.908, "step": 9470 }, { "epoch": 0.18, "learning_rate": 4.715733501204448e-06, "loss": 0.867, "step": 9471 }, { "epoch": 0.18, "learning_rate": 4.715662747654729e-06, "loss": 1.037, "step": 9472 }, { "epoch": 0.18, "learning_rate": 4.715591985831793e-06, "loss": 0.9382, "step": 9473 }, { "epoch": 0.18, "learning_rate": 4.715521215735905e-06, "loss": 0.8878, "step": 9474 }, { "epoch": 0.18, "learning_rate": 4.715450437367329e-06, "loss": 1.1411, "step": 9475 }, { "epoch": 0.18, "learning_rate": 4.715379650726329e-06, "loss": 0.7442, "step": 9476 }, { "epoch": 0.18, "learning_rate": 4.715308855813169e-06, "loss": 0.8593, "step": 9477 }, { "epoch": 0.18, "learning_rate": 4.715238052628114e-06, "loss": 0.9512, "step": 9478 }, { "epoch": 0.18, "learning_rate": 4.715167241171428e-06, "loss": 0.8394, "step": 9479 }, { "epoch": 0.18, "learning_rate": 4.715096421443375e-06, "loss": 0.9114, "step": 9480 }, { "epoch": 0.18, "learning_rate": 4.715025593444219e-06, "loss": 0.981, "step": 9481 }, { "epoch": 0.18, "learning_rate": 4.714954757174227e-06, "loss": 1.0235, "step": 9482 }, { "epoch": 0.18, "learning_rate": 4.714883912633661e-06, "loss": 0.8626, "step": 9483 }, { "epoch": 0.18, "learning_rate": 4.714813059822787e-06, "loss": 1.0574, "step": 9484 }, { "epoch": 0.18, "learning_rate": 4.714742198741869e-06, "loss": 0.898, "step": 9485 }, { "epoch": 0.18, "learning_rate": 4.71467132939117e-06, "loss": 0.8474, "step": 9486 }, { "epoch": 0.18, "learning_rate": 4.714600451770957e-06, "loss": 0.9588, "step": 9487 }, { "epoch": 0.18, "learning_rate": 4.714529565881495e-06, "loss": 1.0138, "step": 9488 }, { "epoch": 0.18, "learning_rate": 4.714458671723046e-06, "loss": 0.977, "step": 9489 }, { "epoch": 0.18, "learning_rate": 4.714387769295877e-06, "loss": 1.0696, "step": 9490 }, { "epoch": 0.18, "learning_rate": 4.714316858600252e-06, "loss": 0.9973, "step": 9491 }, { "epoch": 0.18, "learning_rate": 4.714245939636435e-06, "loss": 0.9869, "step": 9492 }, { "epoch": 0.18, "learning_rate": 4.714175012404692e-06, "loss": 0.9597, "step": 9493 }, { "epoch": 0.18, "learning_rate": 4.714104076905287e-06, "loss": 0.9722, "step": 9494 }, { "epoch": 0.18, "learning_rate": 4.7140331331384856e-06, "loss": 0.8178, "step": 9495 }, { "epoch": 0.18, "learning_rate": 4.7139621811045535e-06, "loss": 0.9966, "step": 9496 }, { "epoch": 0.18, "learning_rate": 4.713891220803753e-06, "loss": 0.7953, "step": 9497 }, { "epoch": 0.18, "learning_rate": 4.713820252236351e-06, "loss": 0.8837, "step": 9498 }, { "epoch": 0.18, "learning_rate": 4.713749275402611e-06, "loss": 0.8615, "step": 9499 }, { "epoch": 0.18, "learning_rate": 4.713678290302801e-06, "loss": 1.0092, "step": 9500 }, { "epoch": 0.18, "learning_rate": 4.713607296937183e-06, "loss": 0.9014, "step": 9501 }, { "epoch": 0.18, "learning_rate": 4.713536295306024e-06, "loss": 1.0177, "step": 9502 }, { "epoch": 0.18, "learning_rate": 4.713465285409588e-06, "loss": 0.8416, "step": 9503 }, { "epoch": 0.18, "learning_rate": 4.71339426724814e-06, "loss": 0.9249, "step": 9504 }, { "epoch": 0.18, "learning_rate": 4.713323240821946e-06, "loss": 0.8518, "step": 9505 }, { "epoch": 0.18, "learning_rate": 4.7132522061312705e-06, "loss": 1.043, "step": 9506 }, { "epoch": 0.18, "learning_rate": 4.71318116317638e-06, "loss": 0.9308, "step": 9507 }, { "epoch": 0.18, "learning_rate": 4.713110111957538e-06, "loss": 0.9346, "step": 9508 }, { "epoch": 0.18, "learning_rate": 4.713039052475011e-06, "loss": 0.9635, "step": 9509 }, { "epoch": 0.18, "learning_rate": 4.7129679847290645e-06, "loss": 0.9595, "step": 9510 }, { "epoch": 0.18, "learning_rate": 4.712896908719962e-06, "loss": 0.8665, "step": 9511 }, { "epoch": 0.18, "learning_rate": 4.712825824447972e-06, "loss": 1.2072, "step": 9512 }, { "epoch": 0.18, "learning_rate": 4.7127547319133575e-06, "loss": 1.0516, "step": 9513 }, { "epoch": 0.18, "learning_rate": 4.712683631116385e-06, "loss": 0.9612, "step": 9514 }, { "epoch": 0.18, "learning_rate": 4.7126125220573195e-06, "loss": 1.1548, "step": 9515 }, { "epoch": 0.18, "learning_rate": 4.712541404736426e-06, "loss": 0.8309, "step": 9516 }, { "epoch": 0.18, "learning_rate": 4.712470279153971e-06, "loss": 0.8033, "step": 9517 }, { "epoch": 0.18, "learning_rate": 4.7123991453102205e-06, "loss": 0.8513, "step": 9518 }, { "epoch": 0.18, "learning_rate": 4.712328003205439e-06, "loss": 1.0762, "step": 9519 }, { "epoch": 0.18, "learning_rate": 4.712256852839893e-06, "loss": 0.879, "step": 9520 }, { "epoch": 0.18, "learning_rate": 4.712185694213847e-06, "loss": 0.81, "step": 9521 }, { "epoch": 0.18, "learning_rate": 4.712114527327568e-06, "loss": 0.9671, "step": 9522 }, { "epoch": 0.18, "learning_rate": 4.712043352181321e-06, "loss": 0.8666, "step": 9523 }, { "epoch": 0.18, "learning_rate": 4.711972168775372e-06, "loss": 1.047, "step": 9524 }, { "epoch": 0.18, "learning_rate": 4.711900977109987e-06, "loss": 1.1099, "step": 9525 }, { "epoch": 0.18, "learning_rate": 4.71182977718543e-06, "loss": 1.0539, "step": 9526 }, { "epoch": 0.18, "learning_rate": 4.7117585690019705e-06, "loss": 0.9077, "step": 9527 }, { "epoch": 0.18, "learning_rate": 4.711687352559871e-06, "loss": 0.9433, "step": 9528 }, { "epoch": 0.18, "learning_rate": 4.711616127859399e-06, "loss": 1.0935, "step": 9529 }, { "epoch": 0.18, "learning_rate": 4.7115448949008205e-06, "loss": 1.011, "step": 9530 }, { "epoch": 0.18, "learning_rate": 4.7114736536844015e-06, "loss": 1.1449, "step": 9531 }, { "epoch": 0.18, "learning_rate": 4.7114024042104065e-06, "loss": 0.9606, "step": 9532 }, { "epoch": 0.18, "learning_rate": 4.711331146479104e-06, "loss": 0.8948, "step": 9533 }, { "epoch": 0.18, "learning_rate": 4.7112598804907584e-06, "loss": 1.0515, "step": 9534 }, { "epoch": 0.18, "learning_rate": 4.711188606245636e-06, "loss": 0.9505, "step": 9535 }, { "epoch": 0.18, "learning_rate": 4.711117323744003e-06, "loss": 0.9078, "step": 9536 }, { "epoch": 0.18, "learning_rate": 4.711046032986126e-06, "loss": 1.0443, "step": 9537 }, { "epoch": 0.18, "learning_rate": 4.710974733972271e-06, "loss": 1.0845, "step": 9538 }, { "epoch": 0.18, "learning_rate": 4.710903426702704e-06, "loss": 0.9249, "step": 9539 }, { "epoch": 0.18, "learning_rate": 4.710832111177691e-06, "loss": 1.0657, "step": 9540 }, { "epoch": 0.18, "learning_rate": 4.710760787397499e-06, "loss": 0.967, "step": 9541 }, { "epoch": 0.18, "learning_rate": 4.710689455362394e-06, "loss": 0.9377, "step": 9542 }, { "epoch": 0.18, "learning_rate": 4.710618115072642e-06, "loss": 1.1957, "step": 9543 }, { "epoch": 0.18, "learning_rate": 4.710546766528511e-06, "loss": 1.0609, "step": 9544 }, { "epoch": 0.18, "learning_rate": 4.710475409730265e-06, "loss": 0.9046, "step": 9545 }, { "epoch": 0.18, "learning_rate": 4.7104040446781715e-06, "loss": 0.9902, "step": 9546 }, { "epoch": 0.18, "learning_rate": 4.710332671372497e-06, "loss": 0.8441, "step": 9547 }, { "epoch": 0.18, "learning_rate": 4.710261289813509e-06, "loss": 0.9158, "step": 9548 }, { "epoch": 0.18, "learning_rate": 4.710189900001473e-06, "loss": 0.9824, "step": 9549 }, { "epoch": 0.18, "learning_rate": 4.710118501936655e-06, "loss": 1.0574, "step": 9550 }, { "epoch": 0.18, "learning_rate": 4.710047095619323e-06, "loss": 0.7896, "step": 9551 }, { "epoch": 0.18, "learning_rate": 4.709975681049742e-06, "loss": 1.0425, "step": 9552 }, { "epoch": 0.18, "learning_rate": 4.70990425822818e-06, "loss": 0.8615, "step": 9553 }, { "epoch": 0.18, "learning_rate": 4.709832827154903e-06, "loss": 0.8586, "step": 9554 }, { "epoch": 0.18, "learning_rate": 4.709761387830179e-06, "loss": 1.0212, "step": 9555 }, { "epoch": 0.18, "learning_rate": 4.709689940254273e-06, "loss": 1.1428, "step": 9556 }, { "epoch": 0.18, "learning_rate": 4.709618484427452e-06, "loss": 1.083, "step": 9557 }, { "epoch": 0.18, "learning_rate": 4.709547020349984e-06, "loss": 0.8934, "step": 9558 }, { "epoch": 0.18, "learning_rate": 4.709475548022136e-06, "loss": 0.9777, "step": 9559 }, { "epoch": 0.18, "learning_rate": 4.709404067444172e-06, "loss": 1.0032, "step": 9560 }, { "epoch": 0.18, "learning_rate": 4.709332578616362e-06, "loss": 1.1863, "step": 9561 }, { "epoch": 0.18, "learning_rate": 4.709261081538972e-06, "loss": 1.0268, "step": 9562 }, { "epoch": 0.18, "learning_rate": 4.709189576212269e-06, "loss": 1.0363, "step": 9563 }, { "epoch": 0.18, "learning_rate": 4.70911806263652e-06, "loss": 0.8945, "step": 9564 }, { "epoch": 0.18, "learning_rate": 4.709046540811991e-06, "loss": 0.8557, "step": 9565 }, { "epoch": 0.18, "learning_rate": 4.708975010738951e-06, "loss": 0.8184, "step": 9566 }, { "epoch": 0.18, "learning_rate": 4.708903472417665e-06, "loss": 0.7685, "step": 9567 }, { "epoch": 0.18, "learning_rate": 4.708831925848402e-06, "loss": 1.2271, "step": 9568 }, { "epoch": 0.18, "learning_rate": 4.7087603710314275e-06, "loss": 0.9518, "step": 9569 }, { "epoch": 0.18, "learning_rate": 4.70868880796701e-06, "loss": 0.9274, "step": 9570 }, { "epoch": 0.18, "learning_rate": 4.708617236655416e-06, "loss": 0.9809, "step": 9571 }, { "epoch": 0.18, "learning_rate": 4.708545657096913e-06, "loss": 0.7787, "step": 9572 }, { "epoch": 0.18, "learning_rate": 4.708474069291769e-06, "loss": 0.9411, "step": 9573 }, { "epoch": 0.18, "learning_rate": 4.70840247324025e-06, "loss": 0.8593, "step": 9574 }, { "epoch": 0.18, "learning_rate": 4.708330868942624e-06, "loss": 1.1498, "step": 9575 }, { "epoch": 0.18, "learning_rate": 4.708259256399158e-06, "loss": 0.8052, "step": 9576 }, { "epoch": 0.18, "learning_rate": 4.70818763561012e-06, "loss": 0.8315, "step": 9577 }, { "epoch": 0.18, "learning_rate": 4.708116006575775e-06, "loss": 0.9683, "step": 9578 }, { "epoch": 0.18, "learning_rate": 4.7080443692963954e-06, "loss": 0.9286, "step": 9579 }, { "epoch": 0.18, "learning_rate": 4.707972723772245e-06, "loss": 0.9058, "step": 9580 }, { "epoch": 0.18, "learning_rate": 4.7079010700035916e-06, "loss": 1.0527, "step": 9581 }, { "epoch": 0.18, "learning_rate": 4.707829407990704e-06, "loss": 1.053, "step": 9582 }, { "epoch": 0.18, "learning_rate": 4.707757737733848e-06, "loss": 0.9334, "step": 9583 }, { "epoch": 0.18, "learning_rate": 4.7076860592332925e-06, "loss": 0.7824, "step": 9584 }, { "epoch": 0.18, "learning_rate": 4.707614372489306e-06, "loss": 1.0597, "step": 9585 }, { "epoch": 0.18, "learning_rate": 4.707542677502155e-06, "loss": 0.9729, "step": 9586 }, { "epoch": 0.18, "learning_rate": 4.707470974272106e-06, "loss": 1.3062, "step": 9587 }, { "epoch": 0.18, "learning_rate": 4.707399262799429e-06, "loss": 1.0871, "step": 9588 }, { "epoch": 0.18, "learning_rate": 4.707327543084391e-06, "loss": 0.9992, "step": 9589 }, { "epoch": 0.18, "learning_rate": 4.707255815127259e-06, "loss": 0.9458, "step": 9590 }, { "epoch": 0.18, "learning_rate": 4.707184078928302e-06, "loss": 1.0395, "step": 9591 }, { "epoch": 0.18, "learning_rate": 4.707112334487788e-06, "loss": 0.8591, "step": 9592 }, { "epoch": 0.18, "learning_rate": 4.707040581805983e-06, "loss": 1.1064, "step": 9593 }, { "epoch": 0.18, "learning_rate": 4.706968820883156e-06, "loss": 1.0475, "step": 9594 }, { "epoch": 0.18, "learning_rate": 4.706897051719576e-06, "loss": 0.9802, "step": 9595 }, { "epoch": 0.18, "learning_rate": 4.70682527431551e-06, "loss": 0.8861, "step": 9596 }, { "epoch": 0.18, "learning_rate": 4.7067534886712256e-06, "loss": 0.8234, "step": 9597 }, { "epoch": 0.18, "learning_rate": 4.706681694786991e-06, "loss": 0.878, "step": 9598 }, { "epoch": 0.18, "learning_rate": 4.706609892663075e-06, "loss": 1.3057, "step": 9599 }, { "epoch": 0.18, "learning_rate": 4.706538082299745e-06, "loss": 0.9476, "step": 9600 }, { "epoch": 0.18, "learning_rate": 4.706466263697271e-06, "loss": 0.8135, "step": 9601 }, { "epoch": 0.18, "learning_rate": 4.7063944368559176e-06, "loss": 0.7733, "step": 9602 }, { "epoch": 0.18, "learning_rate": 4.706322601775957e-06, "loss": 0.7986, "step": 9603 }, { "epoch": 0.18, "learning_rate": 4.706250758457653e-06, "loss": 0.9298, "step": 9604 }, { "epoch": 0.18, "learning_rate": 4.706178906901279e-06, "loss": 0.8681, "step": 9605 }, { "epoch": 0.18, "learning_rate": 4.706107047107098e-06, "loss": 1.0748, "step": 9606 }, { "epoch": 0.18, "learning_rate": 4.706035179075383e-06, "loss": 0.817, "step": 9607 }, { "epoch": 0.18, "learning_rate": 4.705963302806399e-06, "loss": 0.7759, "step": 9608 }, { "epoch": 0.18, "learning_rate": 4.7058914183004165e-06, "loss": 0.9275, "step": 9609 }, { "epoch": 0.18, "learning_rate": 4.705819525557703e-06, "loss": 0.9385, "step": 9610 }, { "epoch": 0.18, "learning_rate": 4.705747624578526e-06, "loss": 0.9537, "step": 9611 }, { "epoch": 0.18, "learning_rate": 4.705675715363156e-06, "loss": 0.9148, "step": 9612 }, { "epoch": 0.18, "learning_rate": 4.705603797911861e-06, "loss": 1.1729, "step": 9613 }, { "epoch": 0.18, "learning_rate": 4.705531872224908e-06, "loss": 0.8362, "step": 9614 }, { "epoch": 0.18, "learning_rate": 4.705459938302566e-06, "loss": 0.8736, "step": 9615 }, { "epoch": 0.18, "learning_rate": 4.705387996145106e-06, "loss": 0.9131, "step": 9616 }, { "epoch": 0.18, "learning_rate": 4.705316045752794e-06, "loss": 0.8875, "step": 9617 }, { "epoch": 0.18, "learning_rate": 4.705244087125899e-06, "loss": 0.9423, "step": 9618 }, { "epoch": 0.18, "learning_rate": 4.705172120264691e-06, "loss": 0.8509, "step": 9619 }, { "epoch": 0.18, "learning_rate": 4.705100145169438e-06, "loss": 1.0723, "step": 9620 }, { "epoch": 0.18, "learning_rate": 4.705028161840408e-06, "loss": 1.0346, "step": 9621 }, { "epoch": 0.18, "learning_rate": 4.704956170277871e-06, "loss": 0.8654, "step": 9622 }, { "epoch": 0.18, "learning_rate": 4.704884170482094e-06, "loss": 0.817, "step": 9623 }, { "epoch": 0.18, "learning_rate": 4.704812162453348e-06, "loss": 0.9766, "step": 9624 }, { "epoch": 0.18, "learning_rate": 4.704740146191902e-06, "loss": 1.0547, "step": 9625 }, { "epoch": 0.18, "learning_rate": 4.704668121698023e-06, "loss": 0.8047, "step": 9626 }, { "epoch": 0.18, "learning_rate": 4.70459608897198e-06, "loss": 0.8963, "step": 9627 }, { "epoch": 0.18, "learning_rate": 4.704524048014044e-06, "loss": 0.8651, "step": 9628 }, { "epoch": 0.18, "learning_rate": 4.704451998824482e-06, "loss": 0.7629, "step": 9629 }, { "epoch": 0.18, "learning_rate": 4.704379941403565e-06, "loss": 1.1127, "step": 9630 }, { "epoch": 0.18, "learning_rate": 4.7043078757515595e-06, "loss": 1.0069, "step": 9631 }, { "epoch": 0.18, "learning_rate": 4.704235801868737e-06, "loss": 1.1368, "step": 9632 }, { "epoch": 0.18, "learning_rate": 4.7041637197553645e-06, "loss": 0.8703, "step": 9633 }, { "epoch": 0.18, "learning_rate": 4.7040916294117135e-06, "loss": 0.9676, "step": 9634 }, { "epoch": 0.18, "learning_rate": 4.704019530838051e-06, "loss": 0.8893, "step": 9635 }, { "epoch": 0.18, "learning_rate": 4.703947424034647e-06, "loss": 1.0361, "step": 9636 }, { "epoch": 0.18, "learning_rate": 4.703875309001772e-06, "loss": 0.9788, "step": 9637 }, { "epoch": 0.18, "learning_rate": 4.703803185739694e-06, "loss": 0.9844, "step": 9638 }, { "epoch": 0.18, "learning_rate": 4.703731054248681e-06, "loss": 0.9001, "step": 9639 }, { "epoch": 0.18, "learning_rate": 4.703658914529005e-06, "loss": 1.0097, "step": 9640 }, { "epoch": 0.18, "learning_rate": 4.703586766580934e-06, "loss": 0.8178, "step": 9641 }, { "epoch": 0.18, "learning_rate": 4.703514610404738e-06, "loss": 0.897, "step": 9642 }, { "epoch": 0.18, "learning_rate": 4.703442446000686e-06, "loss": 1.1487, "step": 9643 }, { "epoch": 0.18, "learning_rate": 4.703370273369047e-06, "loss": 1.0317, "step": 9644 }, { "epoch": 0.18, "learning_rate": 4.703298092510091e-06, "loss": 1.0803, "step": 9645 }, { "epoch": 0.18, "learning_rate": 4.703225903424087e-06, "loss": 0.9172, "step": 9646 }, { "epoch": 0.18, "learning_rate": 4.703153706111306e-06, "loss": 0.9357, "step": 9647 }, { "epoch": 0.18, "learning_rate": 4.703081500572016e-06, "loss": 0.8419, "step": 9648 }, { "epoch": 0.18, "learning_rate": 4.703009286806488e-06, "loss": 1.0155, "step": 9649 }, { "epoch": 0.18, "learning_rate": 4.70293706481499e-06, "loss": 1.1004, "step": 9650 }, { "epoch": 0.18, "learning_rate": 4.702864834597792e-06, "loss": 0.9237, "step": 9651 }, { "epoch": 0.18, "learning_rate": 4.702792596155165e-06, "loss": 0.8401, "step": 9652 }, { "epoch": 0.18, "learning_rate": 4.7027203494873784e-06, "loss": 0.7589, "step": 9653 }, { "epoch": 0.18, "learning_rate": 4.702648094594701e-06, "loss": 0.8535, "step": 9654 }, { "epoch": 0.18, "learning_rate": 4.702575831477404e-06, "loss": 1.116, "step": 9655 }, { "epoch": 0.18, "learning_rate": 4.702503560135755e-06, "loss": 1.0794, "step": 9656 }, { "epoch": 0.18, "learning_rate": 4.702431280570026e-06, "loss": 0.9816, "step": 9657 }, { "epoch": 0.18, "learning_rate": 4.702358992780486e-06, "loss": 0.8568, "step": 9658 }, { "epoch": 0.18, "learning_rate": 4.702286696767405e-06, "loss": 0.8346, "step": 9659 }, { "epoch": 0.18, "learning_rate": 4.702214392531053e-06, "loss": 0.9677, "step": 9660 }, { "epoch": 0.18, "learning_rate": 4.7021420800717e-06, "loss": 0.8955, "step": 9661 }, { "epoch": 0.18, "learning_rate": 4.702069759389617e-06, "loss": 0.9787, "step": 9662 }, { "epoch": 0.18, "learning_rate": 4.7019974304850715e-06, "loss": 1.1584, "step": 9663 }, { "epoch": 0.18, "learning_rate": 4.701925093358336e-06, "loss": 0.9928, "step": 9664 }, { "epoch": 0.18, "learning_rate": 4.70185274800968e-06, "loss": 0.9099, "step": 9665 }, { "epoch": 0.18, "learning_rate": 4.701780394439372e-06, "loss": 0.83, "step": 9666 }, { "epoch": 0.18, "learning_rate": 4.701708032647685e-06, "loss": 1.033, "step": 9667 }, { "epoch": 0.18, "learning_rate": 4.701635662634887e-06, "loss": 1.0552, "step": 9668 }, { "epoch": 0.18, "learning_rate": 4.701563284401248e-06, "loss": 1.1908, "step": 9669 }, { "epoch": 0.18, "learning_rate": 4.7014908979470406e-06, "loss": 1.1175, "step": 9670 }, { "epoch": 0.18, "learning_rate": 4.701418503272533e-06, "loss": 0.8949, "step": 9671 }, { "epoch": 0.18, "learning_rate": 4.701346100377997e-06, "loss": 0.7774, "step": 9672 }, { "epoch": 0.18, "learning_rate": 4.701273689263701e-06, "loss": 0.8306, "step": 9673 }, { "epoch": 0.18, "learning_rate": 4.701201269929918e-06, "loss": 1.1357, "step": 9674 }, { "epoch": 0.18, "learning_rate": 4.701128842376915e-06, "loss": 1.0818, "step": 9675 }, { "epoch": 0.18, "learning_rate": 4.7010564066049656e-06, "loss": 1.0651, "step": 9676 }, { "epoch": 0.18, "learning_rate": 4.700983962614339e-06, "loss": 0.9529, "step": 9677 }, { "epoch": 0.18, "learning_rate": 4.700911510405306e-06, "loss": 0.989, "step": 9678 }, { "epoch": 0.18, "learning_rate": 4.700839049978136e-06, "loss": 0.9266, "step": 9679 }, { "epoch": 0.18, "learning_rate": 4.700766581333101e-06, "loss": 1.0702, "step": 9680 }, { "epoch": 0.18, "learning_rate": 4.700694104470472e-06, "loss": 1.0338, "step": 9681 }, { "epoch": 0.18, "learning_rate": 4.700621619390517e-06, "loss": 0.9304, "step": 9682 }, { "epoch": 0.18, "learning_rate": 4.70054912609351e-06, "loss": 0.9594, "step": 9683 }, { "epoch": 0.18, "learning_rate": 4.7004766245797196e-06, "loss": 0.9731, "step": 9684 }, { "epoch": 0.18, "learning_rate": 4.700404114849416e-06, "loss": 0.8345, "step": 9685 }, { "epoch": 0.18, "learning_rate": 4.7003315969028714e-06, "loss": 0.8916, "step": 9686 }, { "epoch": 0.18, "learning_rate": 4.7002590707403564e-06, "loss": 1.1656, "step": 9687 }, { "epoch": 0.18, "learning_rate": 4.700186536362141e-06, "loss": 1.1154, "step": 9688 }, { "epoch": 0.18, "learning_rate": 4.700113993768497e-06, "loss": 0.9094, "step": 9689 }, { "epoch": 0.18, "learning_rate": 4.700041442959694e-06, "loss": 0.7912, "step": 9690 }, { "epoch": 0.18, "learning_rate": 4.699968883936005e-06, "loss": 0.7807, "step": 9691 }, { "epoch": 0.18, "learning_rate": 4.699896316697699e-06, "loss": 0.9266, "step": 9692 }, { "epoch": 0.18, "learning_rate": 4.699823741245047e-06, "loss": 1.2192, "step": 9693 }, { "epoch": 0.18, "learning_rate": 4.699751157578321e-06, "loss": 1.0746, "step": 9694 }, { "epoch": 0.18, "learning_rate": 4.699678565697792e-06, "loss": 0.8346, "step": 9695 }, { "epoch": 0.18, "learning_rate": 4.6996059656037306e-06, "loss": 0.8061, "step": 9696 }, { "epoch": 0.18, "learning_rate": 4.699533357296408e-06, "loss": 1.0039, "step": 9697 }, { "epoch": 0.18, "learning_rate": 4.699460740776095e-06, "loss": 0.856, "step": 9698 }, { "epoch": 0.18, "learning_rate": 4.699388116043063e-06, "loss": 0.9568, "step": 9699 }, { "epoch": 0.18, "learning_rate": 4.699315483097583e-06, "loss": 0.9604, "step": 9700 }, { "epoch": 0.18, "learning_rate": 4.699242841939928e-06, "loss": 1.0946, "step": 9701 }, { "epoch": 0.18, "learning_rate": 4.699170192570365e-06, "loss": 1.1409, "step": 9702 }, { "epoch": 0.18, "learning_rate": 4.6990975349891695e-06, "loss": 0.9153, "step": 9703 }, { "epoch": 0.18, "learning_rate": 4.699024869196611e-06, "loss": 1.0056, "step": 9704 }, { "epoch": 0.18, "learning_rate": 4.6989521951929615e-06, "loss": 0.8849, "step": 9705 }, { "epoch": 0.18, "learning_rate": 4.698879512978491e-06, "loss": 0.8517, "step": 9706 }, { "epoch": 0.18, "learning_rate": 4.698806822553472e-06, "loss": 0.8606, "step": 9707 }, { "epoch": 0.18, "learning_rate": 4.698734123918177e-06, "loss": 0.8799, "step": 9708 }, { "epoch": 0.18, "learning_rate": 4.698661417072875e-06, "loss": 0.9627, "step": 9709 }, { "epoch": 0.18, "learning_rate": 4.698588702017839e-06, "loss": 1.0247, "step": 9710 }, { "epoch": 0.18, "learning_rate": 4.69851597875334e-06, "loss": 0.9406, "step": 9711 }, { "epoch": 0.18, "learning_rate": 4.69844324727965e-06, "loss": 0.9453, "step": 9712 }, { "epoch": 0.18, "learning_rate": 4.69837050759704e-06, "loss": 0.9602, "step": 9713 }, { "epoch": 0.18, "learning_rate": 4.698297759705782e-06, "loss": 0.8597, "step": 9714 }, { "epoch": 0.18, "learning_rate": 4.698225003606148e-06, "loss": 0.944, "step": 9715 }, { "epoch": 0.18, "learning_rate": 4.698152239298409e-06, "loss": 1.0145, "step": 9716 }, { "epoch": 0.18, "learning_rate": 4.698079466782837e-06, "loss": 0.8524, "step": 9717 }, { "epoch": 0.18, "learning_rate": 4.698006686059704e-06, "loss": 1.168, "step": 9718 }, { "epoch": 0.18, "learning_rate": 4.69793389712928e-06, "loss": 0.9382, "step": 9719 }, { "epoch": 0.18, "learning_rate": 4.697861099991839e-06, "loss": 0.962, "step": 9720 }, { "epoch": 0.18, "learning_rate": 4.697788294647653e-06, "loss": 0.9247, "step": 9721 }, { "epoch": 0.18, "learning_rate": 4.6977154810969926e-06, "loss": 0.8714, "step": 9722 }, { "epoch": 0.18, "learning_rate": 4.697642659340129e-06, "loss": 0.8596, "step": 9723 }, { "epoch": 0.18, "learning_rate": 4.697569829377336e-06, "loss": 1.0982, "step": 9724 }, { "epoch": 0.18, "learning_rate": 4.697496991208884e-06, "loss": 1.1179, "step": 9725 }, { "epoch": 0.18, "learning_rate": 4.697424144835045e-06, "loss": 0.8641, "step": 9726 }, { "epoch": 0.18, "learning_rate": 4.697351290256093e-06, "loss": 0.7064, "step": 9727 }, { "epoch": 0.18, "learning_rate": 4.6972784274722985e-06, "loss": 1.0075, "step": 9728 }, { "epoch": 0.18, "learning_rate": 4.697205556483933e-06, "loss": 0.9571, "step": 9729 }, { "epoch": 0.18, "learning_rate": 4.697132677291269e-06, "loss": 0.8308, "step": 9730 }, { "epoch": 0.18, "learning_rate": 4.69705978989458e-06, "loss": 1.1241, "step": 9731 }, { "epoch": 0.18, "learning_rate": 4.6969868942941375e-06, "loss": 0.938, "step": 9732 }, { "epoch": 0.18, "learning_rate": 4.696913990490212e-06, "loss": 0.7854, "step": 9733 }, { "epoch": 0.18, "learning_rate": 4.696841078483078e-06, "loss": 1.0441, "step": 9734 }, { "epoch": 0.18, "learning_rate": 4.696768158273006e-06, "loss": 0.9471, "step": 9735 }, { "epoch": 0.18, "learning_rate": 4.696695229860269e-06, "loss": 0.9182, "step": 9736 }, { "epoch": 0.18, "learning_rate": 4.69662229324514e-06, "loss": 1.2906, "step": 9737 }, { "epoch": 0.18, "learning_rate": 4.69654934842789e-06, "loss": 0.7954, "step": 9738 }, { "epoch": 0.18, "learning_rate": 4.696476395408793e-06, "loss": 0.852, "step": 9739 }, { "epoch": 0.18, "learning_rate": 4.69640343418812e-06, "loss": 0.7724, "step": 9740 }, { "epoch": 0.18, "learning_rate": 4.696330464766144e-06, "loss": 1.0032, "step": 9741 }, { "epoch": 0.18, "learning_rate": 4.6962574871431374e-06, "loss": 0.8909, "step": 9742 }, { "epoch": 0.18, "learning_rate": 4.6961845013193725e-06, "loss": 1.0074, "step": 9743 }, { "epoch": 0.18, "learning_rate": 4.6961115072951225e-06, "loss": 1.0465, "step": 9744 }, { "epoch": 0.18, "learning_rate": 4.6960385050706585e-06, "loss": 0.8762, "step": 9745 }, { "epoch": 0.18, "learning_rate": 4.695965494646255e-06, "loss": 0.9937, "step": 9746 }, { "epoch": 0.18, "learning_rate": 4.695892476022183e-06, "loss": 0.8785, "step": 9747 }, { "epoch": 0.18, "learning_rate": 4.695819449198716e-06, "loss": 1.1268, "step": 9748 }, { "epoch": 0.18, "learning_rate": 4.695746414176127e-06, "loss": 1.2209, "step": 9749 }, { "epoch": 0.18, "learning_rate": 4.695673370954688e-06, "loss": 1.1183, "step": 9750 }, { "epoch": 0.18, "learning_rate": 4.695600319534671e-06, "loss": 0.8417, "step": 9751 }, { "epoch": 0.18, "learning_rate": 4.695527259916351e-06, "loss": 0.9196, "step": 9752 }, { "epoch": 0.18, "learning_rate": 4.695454192099998e-06, "loss": 0.9933, "step": 9753 }, { "epoch": 0.18, "learning_rate": 4.695381116085889e-06, "loss": 0.9126, "step": 9754 }, { "epoch": 0.18, "learning_rate": 4.695308031874292e-06, "loss": 0.9313, "step": 9755 }, { "epoch": 0.18, "learning_rate": 4.695234939465483e-06, "loss": 0.9657, "step": 9756 }, { "epoch": 0.18, "learning_rate": 4.695161838859733e-06, "loss": 1.0801, "step": 9757 }, { "epoch": 0.18, "learning_rate": 4.695088730057317e-06, "loss": 0.8426, "step": 9758 }, { "epoch": 0.18, "learning_rate": 4.695015613058507e-06, "loss": 0.8, "step": 9759 }, { "epoch": 0.18, "learning_rate": 4.694942487863576e-06, "loss": 0.8711, "step": 9760 }, { "epoch": 0.18, "learning_rate": 4.694869354472796e-06, "loss": 0.9312, "step": 9761 }, { "epoch": 0.18, "learning_rate": 4.694796212886442e-06, "loss": 1.0839, "step": 9762 }, { "epoch": 0.18, "learning_rate": 4.694723063104787e-06, "loss": 1.0211, "step": 9763 }, { "epoch": 0.18, "learning_rate": 4.694649905128102e-06, "loss": 0.9308, "step": 9764 }, { "epoch": 0.18, "learning_rate": 4.694576738956662e-06, "loss": 0.8863, "step": 9765 }, { "epoch": 0.18, "learning_rate": 4.69450356459074e-06, "loss": 0.8727, "step": 9766 }, { "epoch": 0.18, "learning_rate": 4.694430382030609e-06, "loss": 1.1091, "step": 9767 }, { "epoch": 0.18, "learning_rate": 4.694357191276542e-06, "loss": 1.002, "step": 9768 }, { "epoch": 0.18, "learning_rate": 4.694283992328813e-06, "loss": 1.0047, "step": 9769 }, { "epoch": 0.18, "learning_rate": 4.6942107851876935e-06, "loss": 1.0168, "step": 9770 }, { "epoch": 0.18, "learning_rate": 4.694137569853459e-06, "loss": 0.8223, "step": 9771 }, { "epoch": 0.18, "learning_rate": 4.694064346326383e-06, "loss": 1.0098, "step": 9772 }, { "epoch": 0.18, "learning_rate": 4.6939911146067365e-06, "loss": 1.0624, "step": 9773 }, { "epoch": 0.18, "learning_rate": 4.693917874694795e-06, "loss": 1.1154, "step": 9774 }, { "epoch": 0.18, "learning_rate": 4.693844626590832e-06, "loss": 0.9264, "step": 9775 }, { "epoch": 0.18, "learning_rate": 4.693771370295121e-06, "loss": 0.9785, "step": 9776 }, { "epoch": 0.18, "learning_rate": 4.693698105807934e-06, "loss": 1.0448, "step": 9777 }, { "epoch": 0.18, "learning_rate": 4.693624833129544e-06, "loss": 0.9355, "step": 9778 }, { "epoch": 0.18, "learning_rate": 4.693551552260228e-06, "loss": 0.9103, "step": 9779 }, { "epoch": 0.18, "learning_rate": 4.693478263200258e-06, "loss": 1.025, "step": 9780 }, { "epoch": 0.18, "learning_rate": 4.693404965949907e-06, "loss": 1.1109, "step": 9781 }, { "epoch": 0.18, "learning_rate": 4.6933316605094485e-06, "loss": 1.0635, "step": 9782 }, { "epoch": 0.18, "learning_rate": 4.6932583468791574e-06, "loss": 0.8943, "step": 9783 }, { "epoch": 0.18, "learning_rate": 4.693185025059307e-06, "loss": 1.0743, "step": 9784 }, { "epoch": 0.18, "learning_rate": 4.6931116950501695e-06, "loss": 0.8572, "step": 9785 }, { "epoch": 0.18, "learning_rate": 4.693038356852022e-06, "loss": 0.8389, "step": 9786 }, { "epoch": 0.18, "learning_rate": 4.692965010465136e-06, "loss": 1.0793, "step": 9787 }, { "epoch": 0.18, "learning_rate": 4.6928916558897856e-06, "loss": 0.9171, "step": 9788 }, { "epoch": 0.18, "learning_rate": 4.6928182931262456e-06, "loss": 0.8456, "step": 9789 }, { "epoch": 0.18, "learning_rate": 4.692744922174789e-06, "loss": 0.8618, "step": 9790 }, { "epoch": 0.18, "learning_rate": 4.6926715430356895e-06, "loss": 0.8854, "step": 9791 }, { "epoch": 0.18, "learning_rate": 4.692598155709222e-06, "loss": 0.8883, "step": 9792 }, { "epoch": 0.18, "learning_rate": 4.692524760195661e-06, "loss": 0.9704, "step": 9793 }, { "epoch": 0.18, "learning_rate": 4.692451356495279e-06, "loss": 0.9407, "step": 9794 }, { "epoch": 0.18, "learning_rate": 4.692377944608351e-06, "loss": 0.7158, "step": 9795 }, { "epoch": 0.18, "learning_rate": 4.692304524535151e-06, "loss": 0.9305, "step": 9796 }, { "epoch": 0.18, "learning_rate": 4.692231096275953e-06, "loss": 0.6911, "step": 9797 }, { "epoch": 0.18, "learning_rate": 4.692157659831031e-06, "loss": 0.7866, "step": 9798 }, { "epoch": 0.18, "learning_rate": 4.692084215200661e-06, "loss": 0.959, "step": 9799 }, { "epoch": 0.18, "learning_rate": 4.692010762385114e-06, "loss": 1.0892, "step": 9800 }, { "epoch": 0.18, "learning_rate": 4.691937301384667e-06, "loss": 0.8617, "step": 9801 }, { "epoch": 0.18, "learning_rate": 4.691863832199592e-06, "loss": 0.8967, "step": 9802 }, { "epoch": 0.18, "learning_rate": 4.691790354830167e-06, "loss": 1.0102, "step": 9803 }, { "epoch": 0.18, "learning_rate": 4.6917168692766626e-06, "loss": 0.9235, "step": 9804 }, { "epoch": 0.18, "learning_rate": 4.691643375539355e-06, "loss": 1.1188, "step": 9805 }, { "epoch": 0.19, "learning_rate": 4.691569873618517e-06, "loss": 1.1155, "step": 9806 }, { "epoch": 0.19, "learning_rate": 4.691496363514425e-06, "loss": 0.9199, "step": 9807 }, { "epoch": 0.19, "learning_rate": 4.691422845227353e-06, "loss": 0.7766, "step": 9808 }, { "epoch": 0.19, "learning_rate": 4.691349318757575e-06, "loss": 0.9074, "step": 9809 }, { "epoch": 0.19, "learning_rate": 4.691275784105367e-06, "loss": 0.8752, "step": 9810 }, { "epoch": 0.19, "learning_rate": 4.6912022412710015e-06, "loss": 1.0463, "step": 9811 }, { "epoch": 0.19, "learning_rate": 4.691128690254754e-06, "loss": 1.0861, "step": 9812 }, { "epoch": 0.19, "learning_rate": 4.691055131056899e-06, "loss": 0.9915, "step": 9813 }, { "epoch": 0.19, "learning_rate": 4.690981563677712e-06, "loss": 0.7844, "step": 9814 }, { "epoch": 0.19, "learning_rate": 4.690907988117466e-06, "loss": 1.0117, "step": 9815 }, { "epoch": 0.19, "learning_rate": 4.6908344043764374e-06, "loss": 0.8376, "step": 9816 }, { "epoch": 0.19, "learning_rate": 4.6907608124549e-06, "loss": 0.7974, "step": 9817 }, { "epoch": 0.19, "learning_rate": 4.6906872123531285e-06, "loss": 1.0936, "step": 9818 }, { "epoch": 0.19, "learning_rate": 4.690613604071399e-06, "loss": 0.9711, "step": 9819 }, { "epoch": 0.19, "learning_rate": 4.690539987609985e-06, "loss": 1.0107, "step": 9820 }, { "epoch": 0.19, "learning_rate": 4.690466362969162e-06, "loss": 0.9462, "step": 9821 }, { "epoch": 0.19, "learning_rate": 4.690392730149205e-06, "loss": 1.0422, "step": 9822 }, { "epoch": 0.19, "learning_rate": 4.690319089150389e-06, "loss": 0.9156, "step": 9823 }, { "epoch": 0.19, "learning_rate": 4.690245439972988e-06, "loss": 0.8835, "step": 9824 }, { "epoch": 0.19, "learning_rate": 4.690171782617278e-06, "loss": 0.9974, "step": 9825 }, { "epoch": 0.19, "learning_rate": 4.690098117083534e-06, "loss": 0.923, "step": 9826 }, { "epoch": 0.19, "learning_rate": 4.69002444337203e-06, "loss": 0.8807, "step": 9827 }, { "epoch": 0.19, "learning_rate": 4.689950761483042e-06, "loss": 0.9456, "step": 9828 }, { "epoch": 0.19, "learning_rate": 4.689877071416845e-06, "loss": 0.8823, "step": 9829 }, { "epoch": 0.19, "learning_rate": 4.689803373173714e-06, "loss": 0.9435, "step": 9830 }, { "epoch": 0.19, "learning_rate": 4.6897296667539246e-06, "loss": 1.15, "step": 9831 }, { "epoch": 0.19, "learning_rate": 4.689655952157752e-06, "loss": 1.0757, "step": 9832 }, { "epoch": 0.19, "learning_rate": 4.689582229385472e-06, "loss": 0.8995, "step": 9833 }, { "epoch": 0.19, "learning_rate": 4.689508498437358e-06, "loss": 0.8658, "step": 9834 }, { "epoch": 0.19, "learning_rate": 4.689434759313687e-06, "loss": 0.9486, "step": 9835 }, { "epoch": 0.19, "learning_rate": 4.689361012014732e-06, "loss": 0.9343, "step": 9836 }, { "epoch": 0.19, "learning_rate": 4.689287256540772e-06, "loss": 1.1428, "step": 9837 }, { "epoch": 0.19, "learning_rate": 4.68921349289208e-06, "loss": 0.8647, "step": 9838 }, { "epoch": 0.19, "learning_rate": 4.689139721068932e-06, "loss": 0.7855, "step": 9839 }, { "epoch": 0.19, "learning_rate": 4.689065941071604e-06, "loss": 0.9064, "step": 9840 }, { "epoch": 0.19, "learning_rate": 4.688992152900369e-06, "loss": 1.0012, "step": 9841 }, { "epoch": 0.19, "learning_rate": 4.6889183565555064e-06, "loss": 0.8291, "step": 9842 }, { "epoch": 0.19, "learning_rate": 4.688844552037289e-06, "loss": 0.9633, "step": 9843 }, { "epoch": 0.19, "learning_rate": 4.688770739345992e-06, "loss": 1.168, "step": 9844 }, { "epoch": 0.19, "learning_rate": 4.6886969184818946e-06, "loss": 0.9875, "step": 9845 }, { "epoch": 0.19, "learning_rate": 4.688623089445268e-06, "loss": 0.7213, "step": 9846 }, { "epoch": 0.19, "learning_rate": 4.68854925223639e-06, "loss": 0.8123, "step": 9847 }, { "epoch": 0.19, "learning_rate": 4.688475406855537e-06, "loss": 1.1482, "step": 9848 }, { "epoch": 0.19, "learning_rate": 4.6884015533029836e-06, "loss": 1.1713, "step": 9849 }, { "epoch": 0.19, "learning_rate": 4.6883276915790066e-06, "loss": 1.0043, "step": 9850 }, { "epoch": 0.19, "learning_rate": 4.688253821683881e-06, "loss": 0.8466, "step": 9851 }, { "epoch": 0.19, "learning_rate": 4.688179943617882e-06, "loss": 0.9556, "step": 9852 }, { "epoch": 0.19, "learning_rate": 4.688106057381286e-06, "loss": 1.0747, "step": 9853 }, { "epoch": 0.19, "learning_rate": 4.688032162974369e-06, "loss": 0.9455, "step": 9854 }, { "epoch": 0.19, "learning_rate": 4.687958260397408e-06, "loss": 0.9151, "step": 9855 }, { "epoch": 0.19, "learning_rate": 4.6878843496506775e-06, "loss": 1.097, "step": 9856 }, { "epoch": 0.19, "learning_rate": 4.687810430734453e-06, "loss": 1.1715, "step": 9857 }, { "epoch": 0.19, "learning_rate": 4.687736503649013e-06, "loss": 0.8161, "step": 9858 }, { "epoch": 0.19, "learning_rate": 4.687662568394631e-06, "loss": 0.9236, "step": 9859 }, { "epoch": 0.19, "learning_rate": 4.687588624971584e-06, "loss": 0.998, "step": 9860 }, { "epoch": 0.19, "learning_rate": 4.687514673380149e-06, "loss": 0.975, "step": 9861 }, { "epoch": 0.19, "learning_rate": 4.6874407136206e-06, "loss": 1.1548, "step": 9862 }, { "epoch": 0.19, "learning_rate": 4.687366745693216e-06, "loss": 1.1078, "step": 9863 }, { "epoch": 0.19, "learning_rate": 4.687292769598271e-06, "loss": 0.9377, "step": 9864 }, { "epoch": 0.19, "learning_rate": 4.6872187853360405e-06, "loss": 0.8416, "step": 9865 }, { "epoch": 0.19, "learning_rate": 4.687144792906804e-06, "loss": 1.0721, "step": 9866 }, { "epoch": 0.19, "learning_rate": 4.687070792310835e-06, "loss": 0.8475, "step": 9867 }, { "epoch": 0.19, "learning_rate": 4.686996783548411e-06, "loss": 0.8192, "step": 9868 }, { "epoch": 0.19, "learning_rate": 4.686922766619808e-06, "loss": 1.2213, "step": 9869 }, { "epoch": 0.19, "learning_rate": 4.686848741525302e-06, "loss": 1.0276, "step": 9870 }, { "epoch": 0.19, "learning_rate": 4.68677470826517e-06, "loss": 1.0757, "step": 9871 }, { "epoch": 0.19, "learning_rate": 4.686700666839689e-06, "loss": 0.9309, "step": 9872 }, { "epoch": 0.19, "learning_rate": 4.686626617249135e-06, "loss": 0.9073, "step": 9873 }, { "epoch": 0.19, "learning_rate": 4.686552559493783e-06, "loss": 0.9877, "step": 9874 }, { "epoch": 0.19, "learning_rate": 4.686478493573911e-06, "loss": 1.0798, "step": 9875 }, { "epoch": 0.19, "learning_rate": 4.6864044194897966e-06, "loss": 1.0129, "step": 9876 }, { "epoch": 0.19, "learning_rate": 4.686330337241713e-06, "loss": 0.7762, "step": 9877 }, { "epoch": 0.19, "learning_rate": 4.686256246829941e-06, "loss": 0.7641, "step": 9878 }, { "epoch": 0.19, "learning_rate": 4.686182148254755e-06, "loss": 0.7728, "step": 9879 }, { "epoch": 0.19, "learning_rate": 4.686108041516431e-06, "loss": 0.864, "step": 9880 }, { "epoch": 0.19, "learning_rate": 4.686033926615246e-06, "loss": 1.1567, "step": 9881 }, { "epoch": 0.19, "learning_rate": 4.685959803551478e-06, "loss": 1.2135, "step": 9882 }, { "epoch": 0.19, "learning_rate": 4.685885672325403e-06, "loss": 0.8992, "step": 9883 }, { "epoch": 0.19, "learning_rate": 4.685811532937299e-06, "loss": 1.0309, "step": 9884 }, { "epoch": 0.19, "learning_rate": 4.685737385387441e-06, "loss": 0.8712, "step": 9885 }, { "epoch": 0.19, "learning_rate": 4.685663229676106e-06, "loss": 1.0445, "step": 9886 }, { "epoch": 0.19, "learning_rate": 4.685589065803573e-06, "loss": 0.8374, "step": 9887 }, { "epoch": 0.19, "learning_rate": 4.685514893770116e-06, "loss": 0.8459, "step": 9888 }, { "epoch": 0.19, "learning_rate": 4.685440713576014e-06, "loss": 0.8408, "step": 9889 }, { "epoch": 0.19, "learning_rate": 4.685366525221543e-06, "loss": 0.8713, "step": 9890 }, { "epoch": 0.19, "learning_rate": 4.685292328706981e-06, "loss": 0.8819, "step": 9891 }, { "epoch": 0.19, "learning_rate": 4.6852181240326046e-06, "loss": 0.9944, "step": 9892 }, { "epoch": 0.19, "learning_rate": 4.685143911198689e-06, "loss": 1.2151, "step": 9893 }, { "epoch": 0.19, "learning_rate": 4.685069690205515e-06, "loss": 1.023, "step": 9894 }, { "epoch": 0.19, "learning_rate": 4.6849954610533576e-06, "loss": 0.7577, "step": 9895 }, { "epoch": 0.19, "learning_rate": 4.684921223742493e-06, "loss": 0.6262, "step": 9896 }, { "epoch": 0.19, "learning_rate": 4.684846978273201e-06, "loss": 0.8919, "step": 9897 }, { "epoch": 0.19, "learning_rate": 4.684772724645756e-06, "loss": 0.8438, "step": 9898 }, { "epoch": 0.19, "learning_rate": 4.684698462860437e-06, "loss": 1.0014, "step": 9899 }, { "epoch": 0.19, "learning_rate": 4.684624192917522e-06, "loss": 1.0957, "step": 9900 }, { "epoch": 0.19, "learning_rate": 4.684549914817285e-06, "loss": 0.8692, "step": 9901 }, { "epoch": 0.19, "learning_rate": 4.684475628560008e-06, "loss": 0.9205, "step": 9902 }, { "epoch": 0.19, "learning_rate": 4.6844013341459645e-06, "loss": 0.808, "step": 9903 }, { "epoch": 0.19, "learning_rate": 4.684327031575434e-06, "loss": 0.8467, "step": 9904 }, { "epoch": 0.19, "learning_rate": 4.684252720848693e-06, "loss": 1.0256, "step": 9905 }, { "epoch": 0.19, "learning_rate": 4.68417840196602e-06, "loss": 1.0848, "step": 9906 }, { "epoch": 0.19, "learning_rate": 4.684104074927691e-06, "loss": 1.105, "step": 9907 }, { "epoch": 0.19, "learning_rate": 4.684029739733985e-06, "loss": 0.8291, "step": 9908 }, { "epoch": 0.19, "learning_rate": 4.683955396385178e-06, "loss": 1.0904, "step": 9909 }, { "epoch": 0.19, "learning_rate": 4.68388104488155e-06, "loss": 0.7419, "step": 9910 }, { "epoch": 0.19, "learning_rate": 4.683806685223376e-06, "loss": 0.862, "step": 9911 }, { "epoch": 0.19, "learning_rate": 4.6837323174109355e-06, "loss": 1.0981, "step": 9912 }, { "epoch": 0.19, "learning_rate": 4.683657941444504e-06, "loss": 1.0609, "step": 9913 }, { "epoch": 0.19, "learning_rate": 4.683583557324362e-06, "loss": 1.069, "step": 9914 }, { "epoch": 0.19, "learning_rate": 4.683509165050786e-06, "loss": 1.0103, "step": 9915 }, { "epoch": 0.19, "learning_rate": 4.683434764624053e-06, "loss": 0.9266, "step": 9916 }, { "epoch": 0.19, "learning_rate": 4.683360356044442e-06, "loss": 0.8441, "step": 9917 }, { "epoch": 0.19, "learning_rate": 4.6832859393122295e-06, "loss": 0.8963, "step": 9918 }, { "epoch": 0.19, "learning_rate": 4.683211514427696e-06, "loss": 1.1516, "step": 9919 }, { "epoch": 0.19, "learning_rate": 4.683137081391116e-06, "loss": 0.9659, "step": 9920 }, { "epoch": 0.19, "learning_rate": 4.6830626402027705e-06, "loss": 0.8698, "step": 9921 }, { "epoch": 0.19, "learning_rate": 4.682988190862935e-06, "loss": 1.2036, "step": 9922 }, { "epoch": 0.19, "learning_rate": 4.682913733371889e-06, "loss": 0.8707, "step": 9923 }, { "epoch": 0.19, "learning_rate": 4.682839267729909e-06, "loss": 1.1781, "step": 9924 }, { "epoch": 0.19, "learning_rate": 4.682764793937276e-06, "loss": 1.0604, "step": 9925 }, { "epoch": 0.19, "learning_rate": 4.682690311994264e-06, "loss": 1.1324, "step": 9926 }, { "epoch": 0.19, "learning_rate": 4.682615821901155e-06, "loss": 0.8647, "step": 9927 }, { "epoch": 0.19, "learning_rate": 4.682541323658225e-06, "loss": 1.0647, "step": 9928 }, { "epoch": 0.19, "learning_rate": 4.682466817265753e-06, "loss": 0.7765, "step": 9929 }, { "epoch": 0.19, "learning_rate": 4.682392302724016e-06, "loss": 0.968, "step": 9930 }, { "epoch": 0.19, "learning_rate": 4.682317780033293e-06, "loss": 1.0972, "step": 9931 }, { "epoch": 0.19, "learning_rate": 4.682243249193863e-06, "loss": 1.1044, "step": 9932 }, { "epoch": 0.19, "learning_rate": 4.6821687102060035e-06, "loss": 1.0379, "step": 9933 }, { "epoch": 0.19, "learning_rate": 4.682094163069993e-06, "loss": 0.8474, "step": 9934 }, { "epoch": 0.19, "learning_rate": 4.682019607786109e-06, "loss": 0.8875, "step": 9935 }, { "epoch": 0.19, "learning_rate": 4.681945044354631e-06, "loss": 0.9982, "step": 9936 }, { "epoch": 0.19, "learning_rate": 4.681870472775838e-06, "loss": 0.9464, "step": 9937 }, { "epoch": 0.19, "learning_rate": 4.681795893050006e-06, "loss": 1.2219, "step": 9938 }, { "epoch": 0.19, "learning_rate": 4.681721305177416e-06, "loss": 0.8398, "step": 9939 }, { "epoch": 0.19, "learning_rate": 4.681646709158345e-06, "loss": 0.8813, "step": 9940 }, { "epoch": 0.19, "learning_rate": 4.681572104993073e-06, "loss": 0.8337, "step": 9941 }, { "epoch": 0.19, "learning_rate": 4.681497492681877e-06, "loss": 0.9764, "step": 9942 }, { "epoch": 0.19, "learning_rate": 4.681422872225037e-06, "loss": 1.1108, "step": 9943 }, { "epoch": 0.19, "learning_rate": 4.68134824362283e-06, "loss": 0.8928, "step": 9944 }, { "epoch": 0.19, "learning_rate": 4.681273606875536e-06, "loss": 0.7388, "step": 9945 }, { "epoch": 0.19, "learning_rate": 4.681198961983433e-06, "loss": 0.8768, "step": 9946 }, { "epoch": 0.19, "learning_rate": 4.6811243089468e-06, "loss": 0.9764, "step": 9947 }, { "epoch": 0.19, "learning_rate": 4.681049647765916e-06, "loss": 0.8135, "step": 9948 }, { "epoch": 0.19, "learning_rate": 4.68097497844106e-06, "loss": 0.8914, "step": 9949 }, { "epoch": 0.19, "learning_rate": 4.680900300972508e-06, "loss": 1.0701, "step": 9950 }, { "epoch": 0.19, "learning_rate": 4.680825615360543e-06, "loss": 1.0487, "step": 9951 }, { "epoch": 0.19, "learning_rate": 4.6807509216054425e-06, "loss": 0.6875, "step": 9952 }, { "epoch": 0.19, "learning_rate": 4.680676219707484e-06, "loss": 0.9194, "step": 9953 }, { "epoch": 0.19, "learning_rate": 4.680601509666947e-06, "loss": 0.9484, "step": 9954 }, { "epoch": 0.19, "learning_rate": 4.680526791484111e-06, "loss": 1.0832, "step": 9955 }, { "epoch": 0.19, "learning_rate": 4.680452065159255e-06, "loss": 1.2261, "step": 9956 }, { "epoch": 0.19, "learning_rate": 4.6803773306926585e-06, "loss": 0.8179, "step": 9957 }, { "epoch": 0.19, "learning_rate": 4.6803025880845995e-06, "loss": 0.7916, "step": 9958 }, { "epoch": 0.19, "learning_rate": 4.680227837335357e-06, "loss": 1.1382, "step": 9959 }, { "epoch": 0.19, "learning_rate": 4.680153078445211e-06, "loss": 0.7875, "step": 9960 }, { "epoch": 0.19, "learning_rate": 4.680078311414441e-06, "loss": 0.9615, "step": 9961 }, { "epoch": 0.19, "learning_rate": 4.680003536243324e-06, "loss": 0.8082, "step": 9962 }, { "epoch": 0.19, "learning_rate": 4.679928752932141e-06, "loss": 0.8932, "step": 9963 }, { "epoch": 0.19, "learning_rate": 4.6798539614811715e-06, "loss": 0.7043, "step": 9964 }, { "epoch": 0.19, "learning_rate": 4.679779161890694e-06, "loss": 1.1002, "step": 9965 }, { "epoch": 0.19, "learning_rate": 4.679704354160988e-06, "loss": 0.8847, "step": 9966 }, { "epoch": 0.19, "learning_rate": 4.679629538292332e-06, "loss": 0.8593, "step": 9967 }, { "epoch": 0.19, "learning_rate": 4.679554714285006e-06, "loss": 1.1326, "step": 9968 }, { "epoch": 0.19, "learning_rate": 4.679479882139291e-06, "loss": 1.0715, "step": 9969 }, { "epoch": 0.19, "learning_rate": 4.679405041855464e-06, "loss": 0.8488, "step": 9970 }, { "epoch": 0.19, "learning_rate": 4.679330193433805e-06, "loss": 0.993, "step": 9971 }, { "epoch": 0.19, "learning_rate": 4.6792553368745946e-06, "loss": 0.9861, "step": 9972 }, { "epoch": 0.19, "learning_rate": 4.679180472178111e-06, "loss": 0.7441, "step": 9973 }, { "epoch": 0.19, "learning_rate": 4.679105599344635e-06, "loss": 1.1392, "step": 9974 }, { "epoch": 0.19, "learning_rate": 4.679030718374446e-06, "loss": 1.1799, "step": 9975 }, { "epoch": 0.19, "learning_rate": 4.678955829267822e-06, "loss": 0.9821, "step": 9976 }, { "epoch": 0.19, "learning_rate": 4.678880932025044e-06, "loss": 0.988, "step": 9977 }, { "epoch": 0.19, "learning_rate": 4.678806026646391e-06, "loss": 1.1088, "step": 9978 }, { "epoch": 0.19, "learning_rate": 4.678731113132143e-06, "loss": 1.0625, "step": 9979 }, { "epoch": 0.19, "learning_rate": 4.6786561914825816e-06, "loss": 0.9076, "step": 9980 }, { "epoch": 0.19, "learning_rate": 4.678581261697983e-06, "loss": 1.231, "step": 9981 }, { "epoch": 0.19, "learning_rate": 4.678506323778629e-06, "loss": 1.0271, "step": 9982 }, { "epoch": 0.19, "learning_rate": 4.6784313777248e-06, "loss": 0.8309, "step": 9983 }, { "epoch": 0.19, "learning_rate": 4.678356423536774e-06, "loss": 0.9253, "step": 9984 }, { "epoch": 0.19, "learning_rate": 4.678281461214833e-06, "loss": 0.8517, "step": 9985 }, { "epoch": 0.19, "learning_rate": 4.678206490759255e-06, "loss": 0.8956, "step": 9986 }, { "epoch": 0.19, "learning_rate": 4.678131512170321e-06, "loss": 1.0178, "step": 9987 }, { "epoch": 0.19, "learning_rate": 4.678056525448311e-06, "loss": 1.0362, "step": 9988 }, { "epoch": 0.19, "learning_rate": 4.677981530593504e-06, "loss": 0.7458, "step": 9989 }, { "epoch": 0.19, "learning_rate": 4.677906527606181e-06, "loss": 0.89, "step": 9990 }, { "epoch": 0.19, "learning_rate": 4.677831516486622e-06, "loss": 0.8196, "step": 9991 }, { "epoch": 0.19, "learning_rate": 4.677756497235107e-06, "loss": 0.9906, "step": 9992 }, { "epoch": 0.19, "learning_rate": 4.677681469851916e-06, "loss": 1.0438, "step": 9993 }, { "epoch": 0.19, "learning_rate": 4.677606434337329e-06, "loss": 1.0913, "step": 9994 }, { "epoch": 0.19, "learning_rate": 4.677531390691626e-06, "loss": 1.0414, "step": 9995 }, { "epoch": 0.19, "learning_rate": 4.677456338915088e-06, "loss": 1.0541, "step": 9996 }, { "epoch": 0.19, "learning_rate": 4.677381279007995e-06, "loss": 0.7279, "step": 9997 }, { "epoch": 0.19, "learning_rate": 4.6773062109706265e-06, "loss": 0.8293, "step": 9998 }, { "epoch": 0.19, "learning_rate": 4.677231134803264e-06, "loss": 0.9447, "step": 9999 }, { "epoch": 0.19, "learning_rate": 4.677156050506186e-06, "loss": 1.1297, "step": 10000 }, { "epoch": 0.19, "learning_rate": 4.6770809580796756e-06, "loss": 0.9211, "step": 10001 }, { "epoch": 0.19, "learning_rate": 4.677005857524011e-06, "loss": 0.7148, "step": 10002 }, { "epoch": 0.19, "learning_rate": 4.676930748839473e-06, "loss": 0.8578, "step": 10003 }, { "epoch": 0.19, "learning_rate": 4.676855632026343e-06, "loss": 0.7584, "step": 10004 }, { "epoch": 0.19, "learning_rate": 4.6767805070849e-06, "loss": 0.979, "step": 10005 }, { "epoch": 0.19, "learning_rate": 4.676705374015425e-06, "loss": 1.1712, "step": 10006 }, { "epoch": 0.19, "learning_rate": 4.6766302328182e-06, "loss": 1.2516, "step": 10007 }, { "epoch": 0.19, "learning_rate": 4.676555083493504e-06, "loss": 0.641, "step": 10008 }, { "epoch": 0.19, "learning_rate": 4.676479926041618e-06, "loss": 0.8873, "step": 10009 }, { "epoch": 0.19, "learning_rate": 4.676404760462823e-06, "loss": 0.9808, "step": 10010 }, { "epoch": 0.19, "learning_rate": 4.676329586757399e-06, "loss": 0.9946, "step": 10011 }, { "epoch": 0.19, "learning_rate": 4.676254404925627e-06, "loss": 1.2775, "step": 10012 }, { "epoch": 0.19, "learning_rate": 4.676179214967789e-06, "loss": 0.9983, "step": 10013 }, { "epoch": 0.19, "learning_rate": 4.676104016884163e-06, "loss": 0.8162, "step": 10014 }, { "epoch": 0.19, "learning_rate": 4.676028810675032e-06, "loss": 0.9471, "step": 10015 }, { "epoch": 0.19, "learning_rate": 4.675953596340675e-06, "loss": 0.9432, "step": 10016 }, { "epoch": 0.19, "learning_rate": 4.675878373881376e-06, "loss": 0.8209, "step": 10017 }, { "epoch": 0.19, "learning_rate": 4.675803143297413e-06, "loss": 1.072, "step": 10018 }, { "epoch": 0.19, "learning_rate": 4.675727904589067e-06, "loss": 1.1456, "step": 10019 }, { "epoch": 0.19, "learning_rate": 4.67565265775662e-06, "loss": 0.8301, "step": 10020 }, { "epoch": 0.19, "learning_rate": 4.675577402800353e-06, "loss": 0.8943, "step": 10021 }, { "epoch": 0.19, "learning_rate": 4.675502139720547e-06, "loss": 1.0847, "step": 10022 }, { "epoch": 0.19, "learning_rate": 4.675426868517482e-06, "loss": 0.8228, "step": 10023 }, { "epoch": 0.19, "learning_rate": 4.67535158919144e-06, "loss": 0.9487, "step": 10024 }, { "epoch": 0.19, "learning_rate": 4.6752763017427025e-06, "loss": 1.1374, "step": 10025 }, { "epoch": 0.19, "learning_rate": 4.675201006171549e-06, "loss": 0.9409, "step": 10026 }, { "epoch": 0.19, "learning_rate": 4.6751257024782625e-06, "loss": 0.857, "step": 10027 }, { "epoch": 0.19, "learning_rate": 4.675050390663123e-06, "loss": 0.8409, "step": 10028 }, { "epoch": 0.19, "learning_rate": 4.674975070726412e-06, "loss": 1.0638, "step": 10029 }, { "epoch": 0.19, "learning_rate": 4.674899742668411e-06, "loss": 0.8226, "step": 10030 }, { "epoch": 0.19, "learning_rate": 4.674824406489401e-06, "loss": 1.2339, "step": 10031 }, { "epoch": 0.19, "learning_rate": 4.674749062189663e-06, "loss": 0.9647, "step": 10032 }, { "epoch": 0.19, "learning_rate": 4.674673709769478e-06, "loss": 0.9284, "step": 10033 }, { "epoch": 0.19, "learning_rate": 4.674598349229129e-06, "loss": 0.7006, "step": 10034 }, { "epoch": 0.19, "learning_rate": 4.674522980568896e-06, "loss": 0.8908, "step": 10035 }, { "epoch": 0.19, "learning_rate": 4.674447603789062e-06, "loss": 0.9775, "step": 10036 }, { "epoch": 0.19, "learning_rate": 4.674372218889907e-06, "loss": 1.1182, "step": 10037 }, { "epoch": 0.19, "learning_rate": 4.674296825871711e-06, "loss": 1.1092, "step": 10038 }, { "epoch": 0.19, "learning_rate": 4.6742214247347594e-06, "loss": 0.8417, "step": 10039 }, { "epoch": 0.19, "learning_rate": 4.6741460154793305e-06, "loss": 0.9465, "step": 10040 }, { "epoch": 0.19, "learning_rate": 4.674070598105708e-06, "loss": 0.9404, "step": 10041 }, { "epoch": 0.19, "learning_rate": 4.673995172614171e-06, "loss": 0.9644, "step": 10042 }, { "epoch": 0.19, "learning_rate": 4.673919739005004e-06, "loss": 1.1557, "step": 10043 }, { "epoch": 0.19, "learning_rate": 4.673844297278487e-06, "loss": 0.9857, "step": 10044 }, { "epoch": 0.19, "learning_rate": 4.673768847434902e-06, "loss": 0.9333, "step": 10045 }, { "epoch": 0.19, "learning_rate": 4.673693389474531e-06, "loss": 0.9742, "step": 10046 }, { "epoch": 0.19, "learning_rate": 4.673617923397655e-06, "loss": 0.9026, "step": 10047 }, { "epoch": 0.19, "learning_rate": 4.673542449204556e-06, "loss": 1.0099, "step": 10048 }, { "epoch": 0.19, "learning_rate": 4.673466966895518e-06, "loss": 1.1145, "step": 10049 }, { "epoch": 0.19, "learning_rate": 4.673391476470819e-06, "loss": 1.1738, "step": 10050 }, { "epoch": 0.19, "learning_rate": 4.673315977930744e-06, "loss": 1.0569, "step": 10051 }, { "epoch": 0.19, "learning_rate": 4.673240471275573e-06, "loss": 0.8442, "step": 10052 }, { "epoch": 0.19, "learning_rate": 4.673164956505589e-06, "loss": 0.9542, "step": 10053 }, { "epoch": 0.19, "learning_rate": 4.6730894336210745e-06, "loss": 0.809, "step": 10054 }, { "epoch": 0.19, "learning_rate": 4.67301390262231e-06, "loss": 0.8362, "step": 10055 }, { "epoch": 0.19, "learning_rate": 4.6729383635095785e-06, "loss": 1.2172, "step": 10056 }, { "epoch": 0.19, "learning_rate": 4.672862816283161e-06, "loss": 1.0012, "step": 10057 }, { "epoch": 0.19, "learning_rate": 4.672787260943341e-06, "loss": 0.8313, "step": 10058 }, { "epoch": 0.19, "learning_rate": 4.6727116974904e-06, "loss": 0.7455, "step": 10059 }, { "epoch": 0.19, "learning_rate": 4.67263612592462e-06, "loss": 0.9125, "step": 10060 }, { "epoch": 0.19, "learning_rate": 4.672560546246283e-06, "loss": 0.8601, "step": 10061 }, { "epoch": 0.19, "learning_rate": 4.672484958455672e-06, "loss": 1.0981, "step": 10062 }, { "epoch": 0.19, "learning_rate": 4.672409362553069e-06, "loss": 0.9941, "step": 10063 }, { "epoch": 0.19, "learning_rate": 4.672333758538755e-06, "loss": 1.0154, "step": 10064 }, { "epoch": 0.19, "learning_rate": 4.672258146413014e-06, "loss": 0.9532, "step": 10065 }, { "epoch": 0.19, "learning_rate": 4.672182526176128e-06, "loss": 0.8254, "step": 10066 }, { "epoch": 0.19, "learning_rate": 4.672106897828378e-06, "loss": 0.9904, "step": 10067 }, { "epoch": 0.19, "learning_rate": 4.6720312613700485e-06, "loss": 1.1927, "step": 10068 }, { "epoch": 0.19, "learning_rate": 4.6719556168014205e-06, "loss": 0.9693, "step": 10069 }, { "epoch": 0.19, "learning_rate": 4.671879964122777e-06, "loss": 0.9555, "step": 10070 }, { "epoch": 0.19, "learning_rate": 4.6718043033344e-06, "loss": 0.9508, "step": 10071 }, { "epoch": 0.19, "learning_rate": 4.671728634436573e-06, "loss": 0.8587, "step": 10072 }, { "epoch": 0.19, "learning_rate": 4.671652957429576e-06, "loss": 0.8219, "step": 10073 }, { "epoch": 0.19, "learning_rate": 4.671577272313695e-06, "loss": 0.9583, "step": 10074 }, { "epoch": 0.19, "learning_rate": 4.671501579089211e-06, "loss": 1.169, "step": 10075 }, { "epoch": 0.19, "learning_rate": 4.671425877756407e-06, "loss": 0.808, "step": 10076 }, { "epoch": 0.19, "learning_rate": 4.671350168315565e-06, "loss": 0.8139, "step": 10077 }, { "epoch": 0.19, "learning_rate": 4.671274450766968e-06, "loss": 1.0308, "step": 10078 }, { "epoch": 0.19, "learning_rate": 4.671198725110898e-06, "loss": 0.9429, "step": 10079 }, { "epoch": 0.19, "learning_rate": 4.671122991347639e-06, "loss": 1.084, "step": 10080 }, { "epoch": 0.19, "learning_rate": 4.671047249477474e-06, "loss": 1.1912, "step": 10081 }, { "epoch": 0.19, "learning_rate": 4.670971499500685e-06, "loss": 1.0654, "step": 10082 }, { "epoch": 0.19, "learning_rate": 4.670895741417555e-06, "loss": 1.0153, "step": 10083 }, { "epoch": 0.19, "learning_rate": 4.6708199752283655e-06, "loss": 1.1442, "step": 10084 }, { "epoch": 0.19, "learning_rate": 4.670744200933403e-06, "loss": 0.8405, "step": 10085 }, { "epoch": 0.19, "learning_rate": 4.670668418532947e-06, "loss": 0.8725, "step": 10086 }, { "epoch": 0.19, "learning_rate": 4.670592628027281e-06, "loss": 1.0604, "step": 10087 }, { "epoch": 0.19, "learning_rate": 4.670516829416689e-06, "loss": 1.1014, "step": 10088 }, { "epoch": 0.19, "learning_rate": 4.670441022701454e-06, "loss": 0.8986, "step": 10089 }, { "epoch": 0.19, "learning_rate": 4.670365207881859e-06, "loss": 0.9107, "step": 10090 }, { "epoch": 0.19, "learning_rate": 4.670289384958186e-06, "loss": 1.084, "step": 10091 }, { "epoch": 0.19, "learning_rate": 4.67021355393072e-06, "loss": 0.7085, "step": 10092 }, { "epoch": 0.19, "learning_rate": 4.670137714799744e-06, "loss": 0.9585, "step": 10093 }, { "epoch": 0.19, "learning_rate": 4.670061867565539e-06, "loss": 0.9285, "step": 10094 }, { "epoch": 0.19, "learning_rate": 4.669986012228389e-06, "loss": 0.858, "step": 10095 }, { "epoch": 0.19, "learning_rate": 4.669910148788579e-06, "loss": 0.6745, "step": 10096 }, { "epoch": 0.19, "learning_rate": 4.66983427724639e-06, "loss": 0.9392, "step": 10097 }, { "epoch": 0.19, "learning_rate": 4.669758397602107e-06, "loss": 0.7408, "step": 10098 }, { "epoch": 0.19, "learning_rate": 4.669682509856012e-06, "loss": 1.0538, "step": 10099 }, { "epoch": 0.19, "learning_rate": 4.66960661400839e-06, "loss": 1.1418, "step": 10100 }, { "epoch": 0.19, "learning_rate": 4.6695307100595224e-06, "loss": 1.0538, "step": 10101 }, { "epoch": 0.19, "learning_rate": 4.669454798009695e-06, "loss": 0.7414, "step": 10102 }, { "epoch": 0.19, "learning_rate": 4.669378877859189e-06, "loss": 0.8824, "step": 10103 }, { "epoch": 0.19, "learning_rate": 4.669302949608288e-06, "loss": 0.9075, "step": 10104 }, { "epoch": 0.19, "learning_rate": 4.669227013257277e-06, "loss": 0.8206, "step": 10105 }, { "epoch": 0.19, "learning_rate": 4.669151068806439e-06, "loss": 1.0658, "step": 10106 }, { "epoch": 0.19, "learning_rate": 4.669075116256058e-06, "loss": 0.8346, "step": 10107 }, { "epoch": 0.19, "learning_rate": 4.668999155606416e-06, "loss": 0.7094, "step": 10108 }, { "epoch": 0.19, "learning_rate": 4.668923186857797e-06, "loss": 0.8184, "step": 10109 }, { "epoch": 0.19, "learning_rate": 4.668847210010488e-06, "loss": 1.0101, "step": 10110 }, { "epoch": 0.19, "learning_rate": 4.668771225064768e-06, "loss": 1.0603, "step": 10111 }, { "epoch": 0.19, "learning_rate": 4.668695232020923e-06, "loss": 1.1747, "step": 10112 }, { "epoch": 0.19, "learning_rate": 4.6686192308792365e-06, "loss": 0.9143, "step": 10113 }, { "epoch": 0.19, "learning_rate": 4.668543221639993e-06, "loss": 0.8531, "step": 10114 }, { "epoch": 0.19, "learning_rate": 4.6684672043034744e-06, "loss": 0.8005, "step": 10115 }, { "epoch": 0.19, "learning_rate": 4.668391178869966e-06, "loss": 0.921, "step": 10116 }, { "epoch": 0.19, "learning_rate": 4.668315145339753e-06, "loss": 0.8032, "step": 10117 }, { "epoch": 0.19, "learning_rate": 4.668239103713116e-06, "loss": 1.0341, "step": 10118 }, { "epoch": 0.19, "learning_rate": 4.668163053990341e-06, "loss": 0.9341, "step": 10119 }, { "epoch": 0.19, "learning_rate": 4.668086996171712e-06, "loss": 0.9028, "step": 10120 }, { "epoch": 0.19, "learning_rate": 4.668010930257513e-06, "loss": 0.888, "step": 10121 }, { "epoch": 0.19, "learning_rate": 4.6679348562480265e-06, "loss": 1.0219, "step": 10122 }, { "epoch": 0.19, "learning_rate": 4.667858774143539e-06, "loss": 0.8666, "step": 10123 }, { "epoch": 0.19, "learning_rate": 4.667782683944332e-06, "loss": 1.1021, "step": 10124 }, { "epoch": 0.19, "learning_rate": 4.667706585650691e-06, "loss": 1.0548, "step": 10125 }, { "epoch": 0.19, "learning_rate": 4.667630479262901e-06, "loss": 1.0701, "step": 10126 }, { "epoch": 0.19, "learning_rate": 4.667554364781245e-06, "loss": 0.8138, "step": 10127 }, { "epoch": 0.19, "learning_rate": 4.667478242206007e-06, "loss": 0.9673, "step": 10128 }, { "epoch": 0.19, "learning_rate": 4.667402111537472e-06, "loss": 0.9061, "step": 10129 }, { "epoch": 0.19, "learning_rate": 4.6673259727759245e-06, "loss": 0.9998, "step": 10130 }, { "epoch": 0.19, "learning_rate": 4.667249825921648e-06, "loss": 1.1196, "step": 10131 }, { "epoch": 0.19, "learning_rate": 4.667173670974927e-06, "loss": 1.0034, "step": 10132 }, { "epoch": 0.19, "learning_rate": 4.667097507936045e-06, "loss": 0.8502, "step": 10133 }, { "epoch": 0.19, "learning_rate": 4.6670213368052885e-06, "loss": 0.9224, "step": 10134 }, { "epoch": 0.19, "learning_rate": 4.66694515758294e-06, "loss": 0.8116, "step": 10135 }, { "epoch": 0.19, "learning_rate": 4.666868970269285e-06, "loss": 1.1763, "step": 10136 }, { "epoch": 0.19, "learning_rate": 4.666792774864608e-06, "loss": 1.1276, "step": 10137 }, { "epoch": 0.19, "learning_rate": 4.6667165713691935e-06, "loss": 0.9319, "step": 10138 }, { "epoch": 0.19, "learning_rate": 4.666640359783326e-06, "loss": 0.9931, "step": 10139 }, { "epoch": 0.19, "learning_rate": 4.666564140107289e-06, "loss": 0.8163, "step": 10140 }, { "epoch": 0.19, "learning_rate": 4.666487912341367e-06, "loss": 0.8363, "step": 10141 }, { "epoch": 0.19, "learning_rate": 4.6664116764858474e-06, "loss": 0.7736, "step": 10142 }, { "epoch": 0.19, "learning_rate": 4.666335432541013e-06, "loss": 1.0369, "step": 10143 }, { "epoch": 0.19, "learning_rate": 4.666259180507147e-06, "loss": 0.9884, "step": 10144 }, { "epoch": 0.19, "learning_rate": 4.666182920384536e-06, "loss": 0.924, "step": 10145 }, { "epoch": 0.19, "learning_rate": 4.666106652173466e-06, "loss": 0.9155, "step": 10146 }, { "epoch": 0.19, "learning_rate": 4.666030375874219e-06, "loss": 0.8511, "step": 10147 }, { "epoch": 0.19, "learning_rate": 4.665954091487081e-06, "loss": 0.9094, "step": 10148 }, { "epoch": 0.19, "learning_rate": 4.665877799012336e-06, "loss": 0.9152, "step": 10149 }, { "epoch": 0.19, "learning_rate": 4.6658014984502704e-06, "loss": 1.0937, "step": 10150 }, { "epoch": 0.19, "learning_rate": 4.665725189801169e-06, "loss": 1.019, "step": 10151 }, { "epoch": 0.19, "learning_rate": 4.665648873065316e-06, "loss": 0.8864, "step": 10152 }, { "epoch": 0.19, "learning_rate": 4.665572548242996e-06, "loss": 1.0292, "step": 10153 }, { "epoch": 0.19, "learning_rate": 4.665496215334495e-06, "loss": 0.7939, "step": 10154 }, { "epoch": 0.19, "learning_rate": 4.6654198743400966e-06, "loss": 1.0413, "step": 10155 }, { "epoch": 0.19, "learning_rate": 4.665343525260088e-06, "loss": 1.2245, "step": 10156 }, { "epoch": 0.19, "learning_rate": 4.665267168094753e-06, "loss": 0.9711, "step": 10157 }, { "epoch": 0.19, "learning_rate": 4.665190802844375e-06, "loss": 0.8481, "step": 10158 }, { "epoch": 0.19, "learning_rate": 4.665114429509242e-06, "loss": 0.7289, "step": 10159 }, { "epoch": 0.19, "learning_rate": 4.665038048089639e-06, "loss": 0.8336, "step": 10160 }, { "epoch": 0.19, "learning_rate": 4.664961658585849e-06, "loss": 1.0001, "step": 10161 }, { "epoch": 0.19, "learning_rate": 4.66488526099816e-06, "loss": 1.1495, "step": 10162 }, { "epoch": 0.19, "learning_rate": 4.664808855326854e-06, "loss": 1.1559, "step": 10163 }, { "epoch": 0.19, "learning_rate": 4.66473244157222e-06, "loss": 1.0533, "step": 10164 }, { "epoch": 0.19, "learning_rate": 4.66465601973454e-06, "loss": 1.0397, "step": 10165 }, { "epoch": 0.19, "learning_rate": 4.664579589814101e-06, "loss": 0.8964, "step": 10166 }, { "epoch": 0.19, "learning_rate": 4.664503151811189e-06, "loss": 0.9868, "step": 10167 }, { "epoch": 0.19, "learning_rate": 4.664426705726088e-06, "loss": 0.8871, "step": 10168 }, { "epoch": 0.19, "learning_rate": 4.664350251559085e-06, "loss": 1.0474, "step": 10169 }, { "epoch": 0.19, "learning_rate": 4.664273789310463e-06, "loss": 1.1572, "step": 10170 }, { "epoch": 0.19, "learning_rate": 4.664197318980509e-06, "loss": 1.0685, "step": 10171 }, { "epoch": 0.19, "learning_rate": 4.6641208405695095e-06, "loss": 0.9472, "step": 10172 }, { "epoch": 0.19, "learning_rate": 4.6640443540777495e-06, "loss": 0.9452, "step": 10173 }, { "epoch": 0.19, "learning_rate": 4.663967859505514e-06, "loss": 0.9077, "step": 10174 }, { "epoch": 0.19, "learning_rate": 4.6638913568530875e-06, "loss": 0.804, "step": 10175 }, { "epoch": 0.19, "learning_rate": 4.663814846120758e-06, "loss": 1.0803, "step": 10176 }, { "epoch": 0.19, "learning_rate": 4.66373832730881e-06, "loss": 1.1, "step": 10177 }, { "epoch": 0.19, "learning_rate": 4.66366180041753e-06, "loss": 0.9114, "step": 10178 }, { "epoch": 0.19, "learning_rate": 4.663585265447203e-06, "loss": 0.8672, "step": 10179 }, { "epoch": 0.19, "learning_rate": 4.663508722398114e-06, "loss": 0.9483, "step": 10180 }, { "epoch": 0.19, "learning_rate": 4.663432171270551e-06, "loss": 1.2188, "step": 10181 }, { "epoch": 0.19, "learning_rate": 4.6633556120647985e-06, "loss": 1.1183, "step": 10182 }, { "epoch": 0.19, "learning_rate": 4.663279044781142e-06, "loss": 0.967, "step": 10183 }, { "epoch": 0.19, "learning_rate": 4.6632024694198675e-06, "loss": 0.9431, "step": 10184 }, { "epoch": 0.19, "learning_rate": 4.663125885981262e-06, "loss": 0.9127, "step": 10185 }, { "epoch": 0.19, "learning_rate": 4.66304929446561e-06, "loss": 1.017, "step": 10186 }, { "epoch": 0.19, "learning_rate": 4.662972694873199e-06, "loss": 0.9606, "step": 10187 }, { "epoch": 0.19, "learning_rate": 4.662896087204314e-06, "loss": 1.0317, "step": 10188 }, { "epoch": 0.19, "learning_rate": 4.6628194714592414e-06, "loss": 0.7035, "step": 10189 }, { "epoch": 0.19, "learning_rate": 4.662742847638268e-06, "loss": 1.0267, "step": 10190 }, { "epoch": 0.19, "learning_rate": 4.662666215741678e-06, "loss": 1.028, "step": 10191 }, { "epoch": 0.19, "learning_rate": 4.662589575769759e-06, "loss": 0.8634, "step": 10192 }, { "epoch": 0.19, "learning_rate": 4.662512927722797e-06, "loss": 1.0237, "step": 10193 }, { "epoch": 0.19, "learning_rate": 4.662436271601077e-06, "loss": 0.9044, "step": 10194 }, { "epoch": 0.19, "learning_rate": 4.662359607404888e-06, "loss": 0.9199, "step": 10195 }, { "epoch": 0.19, "learning_rate": 4.662282935134514e-06, "loss": 1.0822, "step": 10196 }, { "epoch": 0.19, "learning_rate": 4.662206254790241e-06, "loss": 1.0934, "step": 10197 }, { "epoch": 0.19, "learning_rate": 4.662129566372356e-06, "loss": 0.8282, "step": 10198 }, { "epoch": 0.19, "learning_rate": 4.662052869881146e-06, "loss": 1.122, "step": 10199 }, { "epoch": 0.19, "learning_rate": 4.661976165316897e-06, "loss": 1.2295, "step": 10200 }, { "epoch": 0.19, "learning_rate": 4.661899452679896e-06, "loss": 0.9716, "step": 10201 }, { "epoch": 0.19, "learning_rate": 4.661822731970428e-06, "loss": 0.8187, "step": 10202 }, { "epoch": 0.19, "learning_rate": 4.66174600318878e-06, "loss": 0.8763, "step": 10203 }, { "epoch": 0.19, "learning_rate": 4.661669266335239e-06, "loss": 0.9465, "step": 10204 }, { "epoch": 0.19, "learning_rate": 4.661592521410091e-06, "loss": 0.9348, "step": 10205 }, { "epoch": 0.19, "learning_rate": 4.661515768413623e-06, "loss": 1.0463, "step": 10206 }, { "epoch": 0.19, "learning_rate": 4.661439007346121e-06, "loss": 0.985, "step": 10207 }, { "epoch": 0.19, "learning_rate": 4.6613622382078725e-06, "loss": 0.9329, "step": 10208 }, { "epoch": 0.19, "learning_rate": 4.661285460999163e-06, "loss": 0.9354, "step": 10209 }, { "epoch": 0.19, "learning_rate": 4.661208675720281e-06, "loss": 0.8301, "step": 10210 }, { "epoch": 0.19, "learning_rate": 4.661131882371512e-06, "loss": 1.2296, "step": 10211 }, { "epoch": 0.19, "learning_rate": 4.6610550809531414e-06, "loss": 0.9893, "step": 10212 }, { "epoch": 0.19, "learning_rate": 4.6609782714654586e-06, "loss": 0.9767, "step": 10213 }, { "epoch": 0.19, "learning_rate": 4.660901453908748e-06, "loss": 1.0954, "step": 10214 }, { "epoch": 0.19, "learning_rate": 4.660824628283299e-06, "loss": 1.0288, "step": 10215 }, { "epoch": 0.19, "learning_rate": 4.6607477945893965e-06, "loss": 0.7706, "step": 10216 }, { "epoch": 0.19, "learning_rate": 4.660670952827328e-06, "loss": 0.8269, "step": 10217 }, { "epoch": 0.19, "learning_rate": 4.66059410299738e-06, "loss": 1.1453, "step": 10218 }, { "epoch": 0.19, "learning_rate": 4.66051724509984e-06, "loss": 1.2697, "step": 10219 }, { "epoch": 0.19, "learning_rate": 4.660440379134996e-06, "loss": 0.9513, "step": 10220 }, { "epoch": 0.19, "learning_rate": 4.6603635051031326e-06, "loss": 0.9507, "step": 10221 }, { "epoch": 0.19, "learning_rate": 4.660286623004539e-06, "loss": 0.8445, "step": 10222 }, { "epoch": 0.19, "learning_rate": 4.660209732839501e-06, "loss": 0.9359, "step": 10223 }, { "epoch": 0.19, "learning_rate": 4.660132834608306e-06, "loss": 0.8527, "step": 10224 }, { "epoch": 0.19, "learning_rate": 4.660055928311241e-06, "loss": 1.0143, "step": 10225 }, { "epoch": 0.19, "learning_rate": 4.659979013948593e-06, "loss": 0.8372, "step": 10226 }, { "epoch": 0.19, "learning_rate": 4.659902091520651e-06, "loss": 0.8933, "step": 10227 }, { "epoch": 0.19, "learning_rate": 4.6598251610277e-06, "loss": 0.9774, "step": 10228 }, { "epoch": 0.19, "learning_rate": 4.659748222470027e-06, "loss": 0.8194, "step": 10229 }, { "epoch": 0.19, "learning_rate": 4.659671275847922e-06, "loss": 0.9868, "step": 10230 }, { "epoch": 0.19, "learning_rate": 4.65959432116167e-06, "loss": 1.031, "step": 10231 }, { "epoch": 0.19, "learning_rate": 4.6595173584115594e-06, "loss": 1.0977, "step": 10232 }, { "epoch": 0.19, "learning_rate": 4.659440387597876e-06, "loss": 0.6754, "step": 10233 }, { "epoch": 0.19, "learning_rate": 4.659363408720911e-06, "loss": 1.0051, "step": 10234 }, { "epoch": 0.19, "learning_rate": 4.659286421780947e-06, "loss": 0.8466, "step": 10235 }, { "epoch": 0.19, "learning_rate": 4.659209426778274e-06, "loss": 0.8584, "step": 10236 }, { "epoch": 0.19, "learning_rate": 4.659132423713179e-06, "loss": 1.3392, "step": 10237 }, { "epoch": 0.19, "learning_rate": 4.659055412585951e-06, "loss": 0.8854, "step": 10238 }, { "epoch": 0.19, "learning_rate": 4.658978393396875e-06, "loss": 0.9094, "step": 10239 }, { "epoch": 0.19, "learning_rate": 4.658901366146241e-06, "loss": 0.7303, "step": 10240 }, { "epoch": 0.19, "learning_rate": 4.658824330834334e-06, "loss": 0.8896, "step": 10241 }, { "epoch": 0.19, "learning_rate": 4.658747287461445e-06, "loss": 0.8833, "step": 10242 }, { "epoch": 0.19, "learning_rate": 4.658670236027858e-06, "loss": 1.1648, "step": 10243 }, { "epoch": 0.19, "learning_rate": 4.658593176533864e-06, "loss": 1.1633, "step": 10244 }, { "epoch": 0.19, "learning_rate": 4.6585161089797485e-06, "loss": 0.8979, "step": 10245 }, { "epoch": 0.19, "learning_rate": 4.6584390333658e-06, "loss": 0.8887, "step": 10246 }, { "epoch": 0.19, "learning_rate": 4.658361949692306e-06, "loss": 0.989, "step": 10247 }, { "epoch": 0.19, "learning_rate": 4.658284857959556e-06, "loss": 0.808, "step": 10248 }, { "epoch": 0.19, "learning_rate": 4.6582077581678355e-06, "loss": 0.8943, "step": 10249 }, { "epoch": 0.19, "learning_rate": 4.658130650317433e-06, "loss": 1.1792, "step": 10250 }, { "epoch": 0.19, "learning_rate": 4.658053534408637e-06, "loss": 0.9881, "step": 10251 }, { "epoch": 0.19, "learning_rate": 4.657976410441736e-06, "loss": 0.9038, "step": 10252 }, { "epoch": 0.19, "learning_rate": 4.657899278417017e-06, "loss": 0.8774, "step": 10253 }, { "epoch": 0.19, "learning_rate": 4.657822138334768e-06, "loss": 0.9585, "step": 10254 }, { "epoch": 0.19, "learning_rate": 4.657744990195278e-06, "loss": 1.1311, "step": 10255 }, { "epoch": 0.19, "learning_rate": 4.657667833998833e-06, "loss": 1.1399, "step": 10256 }, { "epoch": 0.19, "learning_rate": 4.6575906697457244e-06, "loss": 1.0507, "step": 10257 }, { "epoch": 0.19, "learning_rate": 4.657513497436237e-06, "loss": 0.8208, "step": 10258 }, { "epoch": 0.19, "learning_rate": 4.65743631707066e-06, "loss": 0.7966, "step": 10259 }, { "epoch": 0.19, "learning_rate": 4.6573591286492826e-06, "loss": 0.7989, "step": 10260 }, { "epoch": 0.19, "learning_rate": 4.657281932172393e-06, "loss": 0.8365, "step": 10261 }, { "epoch": 0.19, "learning_rate": 4.657204727640277e-06, "loss": 1.1339, "step": 10262 }, { "epoch": 0.19, "learning_rate": 4.6571275150532265e-06, "loss": 1.2929, "step": 10263 }, { "epoch": 0.19, "learning_rate": 4.657050294411527e-06, "loss": 0.7802, "step": 10264 }, { "epoch": 0.19, "learning_rate": 4.656973065715468e-06, "loss": 0.8565, "step": 10265 }, { "epoch": 0.19, "learning_rate": 4.656895828965338e-06, "loss": 0.8998, "step": 10266 }, { "epoch": 0.19, "learning_rate": 4.6568185841614255e-06, "loss": 1.0389, "step": 10267 }, { "epoch": 0.19, "learning_rate": 4.656741331304018e-06, "loss": 0.9237, "step": 10268 }, { "epoch": 0.19, "learning_rate": 4.656664070393404e-06, "loss": 1.0592, "step": 10269 }, { "epoch": 0.19, "learning_rate": 4.656586801429873e-06, "loss": 0.8706, "step": 10270 }, { "epoch": 0.19, "learning_rate": 4.656509524413713e-06, "loss": 0.7217, "step": 10271 }, { "epoch": 0.19, "learning_rate": 4.656432239345213e-06, "loss": 1.028, "step": 10272 }, { "epoch": 0.19, "learning_rate": 4.65635494622466e-06, "loss": 0.7847, "step": 10273 }, { "epoch": 0.19, "learning_rate": 4.656277645052345e-06, "loss": 0.9304, "step": 10274 }, { "epoch": 0.19, "learning_rate": 4.6562003358285545e-06, "loss": 1.0786, "step": 10275 }, { "epoch": 0.19, "learning_rate": 4.656123018553579e-06, "loss": 0.9342, "step": 10276 }, { "epoch": 0.19, "learning_rate": 4.656045693227706e-06, "loss": 0.8687, "step": 10277 }, { "epoch": 0.19, "learning_rate": 4.6559683598512224e-06, "loss": 0.7901, "step": 10278 }, { "epoch": 0.19, "learning_rate": 4.655891018424422e-06, "loss": 0.8933, "step": 10279 }, { "epoch": 0.19, "learning_rate": 4.655813668947589e-06, "loss": 0.9272, "step": 10280 }, { "epoch": 0.19, "learning_rate": 4.655736311421014e-06, "loss": 1.1656, "step": 10281 }, { "epoch": 0.19, "learning_rate": 4.655658945844986e-06, "loss": 1.1246, "step": 10282 }, { "epoch": 0.19, "learning_rate": 4.655581572219794e-06, "loss": 1.0065, "step": 10283 }, { "epoch": 0.19, "learning_rate": 4.6555041905457254e-06, "loss": 0.9579, "step": 10284 }, { "epoch": 0.19, "learning_rate": 4.655426800823071e-06, "loss": 1.0056, "step": 10285 }, { "epoch": 0.19, "learning_rate": 4.655349403052119e-06, "loss": 0.9287, "step": 10286 }, { "epoch": 0.19, "learning_rate": 4.655271997233159e-06, "loss": 1.0265, "step": 10287 }, { "epoch": 0.19, "learning_rate": 4.655194583366478e-06, "loss": 1.0362, "step": 10288 }, { "epoch": 0.19, "learning_rate": 4.655117161452367e-06, "loss": 1.0388, "step": 10289 }, { "epoch": 0.19, "learning_rate": 4.655039731491115e-06, "loss": 0.9989, "step": 10290 }, { "epoch": 0.19, "learning_rate": 4.654962293483011e-06, "loss": 0.8036, "step": 10291 }, { "epoch": 0.19, "learning_rate": 4.654884847428343e-06, "loss": 0.9299, "step": 10292 }, { "epoch": 0.19, "learning_rate": 4.654807393327402e-06, "loss": 1.0713, "step": 10293 }, { "epoch": 0.19, "learning_rate": 4.6547299311804755e-06, "loss": 1.1481, "step": 10294 }, { "epoch": 0.19, "learning_rate": 4.654652460987854e-06, "loss": 0.7463, "step": 10295 }, { "epoch": 0.19, "learning_rate": 4.654574982749825e-06, "loss": 0.7747, "step": 10296 }, { "epoch": 0.19, "learning_rate": 4.654497496466681e-06, "loss": 0.9928, "step": 10297 }, { "epoch": 0.19, "learning_rate": 4.654420002138709e-06, "loss": 0.9318, "step": 10298 }, { "epoch": 0.19, "learning_rate": 4.654342499766198e-06, "loss": 0.86, "step": 10299 }, { "epoch": 0.19, "learning_rate": 4.654264989349439e-06, "loss": 1.119, "step": 10300 }, { "epoch": 0.19, "learning_rate": 4.654187470888719e-06, "loss": 1.0532, "step": 10301 }, { "epoch": 0.19, "learning_rate": 4.65410994438433e-06, "loss": 0.9404, "step": 10302 }, { "epoch": 0.19, "learning_rate": 4.654032409836561e-06, "loss": 1.0302, "step": 10303 }, { "epoch": 0.19, "learning_rate": 4.6539548672457e-06, "loss": 0.8924, "step": 10304 }, { "epoch": 0.19, "learning_rate": 4.653877316612039e-06, "loss": 0.9608, "step": 10305 }, { "epoch": 0.19, "learning_rate": 4.653799757935865e-06, "loss": 1.14, "step": 10306 }, { "epoch": 0.19, "learning_rate": 4.653722191217469e-06, "loss": 1.0478, "step": 10307 }, { "epoch": 0.19, "learning_rate": 4.65364461645714e-06, "loss": 0.9166, "step": 10308 }, { "epoch": 0.19, "learning_rate": 4.653567033655169e-06, "loss": 1.0656, "step": 10309 }, { "epoch": 0.19, "learning_rate": 4.653489442811844e-06, "loss": 0.8943, "step": 10310 }, { "epoch": 0.19, "learning_rate": 4.653411843927455e-06, "loss": 0.9202, "step": 10311 }, { "epoch": 0.19, "learning_rate": 4.653334237002294e-06, "loss": 0.9028, "step": 10312 }, { "epoch": 0.19, "learning_rate": 4.653256622036647e-06, "loss": 0.9706, "step": 10313 }, { "epoch": 0.19, "learning_rate": 4.653178999030807e-06, "loss": 1.0287, "step": 10314 }, { "epoch": 0.19, "learning_rate": 4.653101367985062e-06, "loss": 0.8493, "step": 10315 }, { "epoch": 0.19, "learning_rate": 4.653023728899703e-06, "loss": 0.9299, "step": 10316 }, { "epoch": 0.19, "learning_rate": 4.65294608177502e-06, "loss": 0.7801, "step": 10317 }, { "epoch": 0.19, "learning_rate": 4.652868426611301e-06, "loss": 1.0179, "step": 10318 }, { "epoch": 0.19, "learning_rate": 4.652790763408838e-06, "loss": 1.1808, "step": 10319 }, { "epoch": 0.19, "learning_rate": 4.65271309216792e-06, "loss": 0.9218, "step": 10320 }, { "epoch": 0.19, "learning_rate": 4.652635412888837e-06, "loss": 0.8315, "step": 10321 }, { "epoch": 0.19, "learning_rate": 4.652557725571879e-06, "loss": 0.9533, "step": 10322 }, { "epoch": 0.19, "learning_rate": 4.652480030217338e-06, "loss": 0.8246, "step": 10323 }, { "epoch": 0.19, "learning_rate": 4.652402326825501e-06, "loss": 1.0121, "step": 10324 }, { "epoch": 0.19, "learning_rate": 4.652324615396661e-06, "loss": 1.1929, "step": 10325 }, { "epoch": 0.19, "learning_rate": 4.6522468959311066e-06, "loss": 0.9044, "step": 10326 }, { "epoch": 0.19, "learning_rate": 4.652169168429128e-06, "loss": 0.8066, "step": 10327 }, { "epoch": 0.19, "learning_rate": 4.652091432891016e-06, "loss": 0.8931, "step": 10328 }, { "epoch": 0.19, "learning_rate": 4.652013689317059e-06, "loss": 1.048, "step": 10329 }, { "epoch": 0.19, "learning_rate": 4.651935937707551e-06, "loss": 0.8771, "step": 10330 }, { "epoch": 0.19, "learning_rate": 4.6518581780627795e-06, "loss": 1.162, "step": 10331 }, { "epoch": 0.19, "learning_rate": 4.651780410383036e-06, "loss": 1.1107, "step": 10332 }, { "epoch": 0.19, "learning_rate": 4.65170263466861e-06, "loss": 0.9567, "step": 10333 }, { "epoch": 0.19, "learning_rate": 4.651624850919791e-06, "loss": 1.0305, "step": 10334 }, { "epoch": 0.19, "learning_rate": 4.651547059136873e-06, "loss": 0.9891, "step": 10335 }, { "epoch": 0.2, "learning_rate": 4.651469259320143e-06, "loss": 0.892, "step": 10336 }, { "epoch": 0.2, "learning_rate": 4.651391451469893e-06, "loss": 1.1265, "step": 10337 }, { "epoch": 0.2, "learning_rate": 4.651313635586413e-06, "loss": 1.0798, "step": 10338 }, { "epoch": 0.2, "learning_rate": 4.651235811669994e-06, "loss": 1.0744, "step": 10339 }, { "epoch": 0.2, "learning_rate": 4.651157979720927e-06, "loss": 0.8379, "step": 10340 }, { "epoch": 0.2, "learning_rate": 4.651080139739501e-06, "loss": 0.8683, "step": 10341 }, { "epoch": 0.2, "learning_rate": 4.651002291726009e-06, "loss": 0.722, "step": 10342 }, { "epoch": 0.2, "learning_rate": 4.65092443568074e-06, "loss": 1.2055, "step": 10343 }, { "epoch": 0.2, "learning_rate": 4.6508465716039845e-06, "loss": 1.2003, "step": 10344 }, { "epoch": 0.2, "learning_rate": 4.650768699496034e-06, "loss": 0.922, "step": 10345 }, { "epoch": 0.2, "learning_rate": 4.6506908193571794e-06, "loss": 0.9789, "step": 10346 }, { "epoch": 0.2, "learning_rate": 4.650612931187711e-06, "loss": 0.7634, "step": 10347 }, { "epoch": 0.2, "learning_rate": 4.6505350349879195e-06, "loss": 0.9819, "step": 10348 }, { "epoch": 0.2, "learning_rate": 4.650457130758097e-06, "loss": 0.9819, "step": 10349 }, { "epoch": 0.2, "learning_rate": 4.650379218498533e-06, "loss": 1.1541, "step": 10350 }, { "epoch": 0.2, "learning_rate": 4.650301298209518e-06, "loss": 0.668, "step": 10351 }, { "epoch": 0.2, "learning_rate": 4.650223369891346e-06, "loss": 0.9233, "step": 10352 }, { "epoch": 0.2, "learning_rate": 4.650145433544305e-06, "loss": 1.0187, "step": 10353 }, { "epoch": 0.2, "learning_rate": 4.650067489168686e-06, "loss": 0.8037, "step": 10354 }, { "epoch": 0.2, "learning_rate": 4.6499895367647815e-06, "loss": 0.8563, "step": 10355 }, { "epoch": 0.2, "learning_rate": 4.649911576332882e-06, "loss": 1.1123, "step": 10356 }, { "epoch": 0.2, "learning_rate": 4.6498336078732795e-06, "loss": 0.9551, "step": 10357 }, { "epoch": 0.2, "learning_rate": 4.649755631386263e-06, "loss": 0.9359, "step": 10358 }, { "epoch": 0.2, "learning_rate": 4.649677646872125e-06, "loss": 0.6225, "step": 10359 }, { "epoch": 0.2, "learning_rate": 4.649599654331157e-06, "loss": 1.0317, "step": 10360 }, { "epoch": 0.2, "learning_rate": 4.649521653763649e-06, "loss": 0.835, "step": 10361 }, { "epoch": 0.2, "learning_rate": 4.649443645169894e-06, "loss": 0.9091, "step": 10362 }, { "epoch": 0.2, "learning_rate": 4.649365628550182e-06, "loss": 0.9075, "step": 10363 }, { "epoch": 0.2, "learning_rate": 4.649287603904805e-06, "loss": 0.9855, "step": 10364 }, { "epoch": 0.2, "learning_rate": 4.649209571234053e-06, "loss": 0.9305, "step": 10365 }, { "epoch": 0.2, "learning_rate": 4.64913153053822e-06, "loss": 0.8244, "step": 10366 }, { "epoch": 0.2, "learning_rate": 4.6490534818175945e-06, "loss": 0.8872, "step": 10367 }, { "epoch": 0.2, "learning_rate": 4.64897542507247e-06, "loss": 1.0577, "step": 10368 }, { "epoch": 0.2, "learning_rate": 4.6488973603031355e-06, "loss": 0.9734, "step": 10369 }, { "epoch": 0.2, "learning_rate": 4.6488192875098855e-06, "loss": 0.6812, "step": 10370 }, { "epoch": 0.2, "learning_rate": 4.64874120669301e-06, "loss": 0.7254, "step": 10371 }, { "epoch": 0.2, "learning_rate": 4.6486631178528e-06, "loss": 0.9761, "step": 10372 }, { "epoch": 0.2, "learning_rate": 4.648585020989549e-06, "loss": 0.8528, "step": 10373 }, { "epoch": 0.2, "learning_rate": 4.648506916103547e-06, "loss": 1.0029, "step": 10374 }, { "epoch": 0.2, "learning_rate": 4.648428803195085e-06, "loss": 1.1882, "step": 10375 }, { "epoch": 0.2, "learning_rate": 4.648350682264457e-06, "loss": 1.1761, "step": 10376 }, { "epoch": 0.2, "learning_rate": 4.648272553311954e-06, "loss": 0.9188, "step": 10377 }, { "epoch": 0.2, "learning_rate": 4.648194416337865e-06, "loss": 0.8233, "step": 10378 }, { "epoch": 0.2, "learning_rate": 4.648116271342486e-06, "loss": 0.8613, "step": 10379 }, { "epoch": 0.2, "learning_rate": 4.648038118326105e-06, "loss": 0.9228, "step": 10380 }, { "epoch": 0.2, "learning_rate": 4.647959957289017e-06, "loss": 1.1851, "step": 10381 }, { "epoch": 0.2, "learning_rate": 4.6478817882315115e-06, "loss": 0.7791, "step": 10382 }, { "epoch": 0.2, "learning_rate": 4.647803611153881e-06, "loss": 0.8695, "step": 10383 }, { "epoch": 0.2, "learning_rate": 4.6477254260564184e-06, "loss": 0.8645, "step": 10384 }, { "epoch": 0.2, "learning_rate": 4.647647232939414e-06, "loss": 0.8505, "step": 10385 }, { "epoch": 0.2, "learning_rate": 4.647569031803162e-06, "loss": 1.0057, "step": 10386 }, { "epoch": 0.2, "learning_rate": 4.647490822647952e-06, "loss": 1.0849, "step": 10387 }, { "epoch": 0.2, "learning_rate": 4.647412605474077e-06, "loss": 0.9545, "step": 10388 }, { "epoch": 0.2, "learning_rate": 4.647334380281831e-06, "loss": 0.845, "step": 10389 }, { "epoch": 0.2, "learning_rate": 4.647256147071502e-06, "loss": 0.8535, "step": 10390 }, { "epoch": 0.2, "learning_rate": 4.6471779058433856e-06, "loss": 0.9274, "step": 10391 }, { "epoch": 0.2, "learning_rate": 4.647099656597772e-06, "loss": 0.9324, "step": 10392 }, { "epoch": 0.2, "learning_rate": 4.647021399334955e-06, "loss": 1.1303, "step": 10393 }, { "epoch": 0.2, "learning_rate": 4.646943134055226e-06, "loss": 1.162, "step": 10394 }, { "epoch": 0.2, "learning_rate": 4.646864860758876e-06, "loss": 1.0918, "step": 10395 }, { "epoch": 0.2, "learning_rate": 4.646786579446199e-06, "loss": 0.9737, "step": 10396 }, { "epoch": 0.2, "learning_rate": 4.646708290117487e-06, "loss": 0.8621, "step": 10397 }, { "epoch": 0.2, "learning_rate": 4.646629992773032e-06, "loss": 1.0649, "step": 10398 }, { "epoch": 0.2, "learning_rate": 4.646551687413127e-06, "loss": 0.9735, "step": 10399 }, { "epoch": 0.2, "learning_rate": 4.646473374038063e-06, "loss": 1.0181, "step": 10400 }, { "epoch": 0.2, "learning_rate": 4.646395052648133e-06, "loss": 0.8253, "step": 10401 }, { "epoch": 0.2, "learning_rate": 4.64631672324363e-06, "loss": 0.9012, "step": 10402 }, { "epoch": 0.2, "learning_rate": 4.646238385824846e-06, "loss": 0.8713, "step": 10403 }, { "epoch": 0.2, "learning_rate": 4.646160040392073e-06, "loss": 0.926, "step": 10404 }, { "epoch": 0.2, "learning_rate": 4.646081686945606e-06, "loss": 0.9792, "step": 10405 }, { "epoch": 0.2, "learning_rate": 4.6460033254857354e-06, "loss": 1.1055, "step": 10406 }, { "epoch": 0.2, "learning_rate": 4.645924956012753e-06, "loss": 0.8315, "step": 10407 }, { "epoch": 0.2, "learning_rate": 4.645846578526953e-06, "loss": 0.8318, "step": 10408 }, { "epoch": 0.2, "learning_rate": 4.645768193028628e-06, "loss": 0.9178, "step": 10409 }, { "epoch": 0.2, "learning_rate": 4.64568979951807e-06, "loss": 0.9155, "step": 10410 }, { "epoch": 0.2, "learning_rate": 4.645611397995573e-06, "loss": 0.8641, "step": 10411 }, { "epoch": 0.2, "learning_rate": 4.6455329884614285e-06, "loss": 1.1202, "step": 10412 }, { "epoch": 0.2, "learning_rate": 4.64545457091593e-06, "loss": 0.9543, "step": 10413 }, { "epoch": 0.2, "learning_rate": 4.645376145359368e-06, "loss": 0.8047, "step": 10414 }, { "epoch": 0.2, "learning_rate": 4.6452977117920386e-06, "loss": 0.951, "step": 10415 }, { "epoch": 0.2, "learning_rate": 4.645219270214233e-06, "loss": 0.9646, "step": 10416 }, { "epoch": 0.2, "learning_rate": 4.6451408206262446e-06, "loss": 0.8033, "step": 10417 }, { "epoch": 0.2, "learning_rate": 4.645062363028366e-06, "loss": 1.0668, "step": 10418 }, { "epoch": 0.2, "learning_rate": 4.644983897420891e-06, "loss": 1.0396, "step": 10419 }, { "epoch": 0.2, "learning_rate": 4.644905423804111e-06, "loss": 0.9619, "step": 10420 }, { "epoch": 0.2, "learning_rate": 4.6448269421783204e-06, "loss": 0.8258, "step": 10421 }, { "epoch": 0.2, "learning_rate": 4.644748452543811e-06, "loss": 0.9373, "step": 10422 }, { "epoch": 0.2, "learning_rate": 4.644669954900878e-06, "loss": 0.8941, "step": 10423 }, { "epoch": 0.2, "learning_rate": 4.644591449249812e-06, "loss": 0.9196, "step": 10424 }, { "epoch": 0.2, "learning_rate": 4.644512935590908e-06, "loss": 0.9808, "step": 10425 }, { "epoch": 0.2, "learning_rate": 4.644434413924458e-06, "loss": 0.8558, "step": 10426 }, { "epoch": 0.2, "learning_rate": 4.644355884250756e-06, "loss": 0.974, "step": 10427 }, { "epoch": 0.2, "learning_rate": 4.644277346570095e-06, "loss": 1.0171, "step": 10428 }, { "epoch": 0.2, "learning_rate": 4.644198800882768e-06, "loss": 0.7911, "step": 10429 }, { "epoch": 0.2, "learning_rate": 4.6441202471890675e-06, "loss": 0.9899, "step": 10430 }, { "epoch": 0.2, "learning_rate": 4.644041685489289e-06, "loss": 1.3428, "step": 10431 }, { "epoch": 0.2, "learning_rate": 4.643963115783723e-06, "loss": 0.9568, "step": 10432 }, { "epoch": 0.2, "learning_rate": 4.643884538072666e-06, "loss": 0.8967, "step": 10433 }, { "epoch": 0.2, "learning_rate": 4.643805952356409e-06, "loss": 1.058, "step": 10434 }, { "epoch": 0.2, "learning_rate": 4.643727358635247e-06, "loss": 0.742, "step": 10435 }, { "epoch": 0.2, "learning_rate": 4.643648756909472e-06, "loss": 1.1145, "step": 10436 }, { "epoch": 0.2, "learning_rate": 4.64357014717938e-06, "loss": 1.14, "step": 10437 }, { "epoch": 0.2, "learning_rate": 4.643491529445261e-06, "loss": 1.0912, "step": 10438 }, { "epoch": 0.2, "learning_rate": 4.643412903707411e-06, "loss": 0.9777, "step": 10439 }, { "epoch": 0.2, "learning_rate": 4.643334269966122e-06, "loss": 0.8307, "step": 10440 }, { "epoch": 0.2, "learning_rate": 4.64325562822169e-06, "loss": 0.7819, "step": 10441 }, { "epoch": 0.2, "learning_rate": 4.643176978474406e-06, "loss": 0.9673, "step": 10442 }, { "epoch": 0.2, "learning_rate": 4.643098320724566e-06, "loss": 1.2065, "step": 10443 }, { "epoch": 0.2, "learning_rate": 4.643019654972461e-06, "loss": 1.0936, "step": 10444 }, { "epoch": 0.2, "learning_rate": 4.6429409812183875e-06, "loss": 0.7727, "step": 10445 }, { "epoch": 0.2, "learning_rate": 4.642862299462638e-06, "loss": 0.8215, "step": 10446 }, { "epoch": 0.2, "learning_rate": 4.6427836097055064e-06, "loss": 0.9371, "step": 10447 }, { "epoch": 0.2, "learning_rate": 4.642704911947287e-06, "loss": 0.8962, "step": 10448 }, { "epoch": 0.2, "learning_rate": 4.642626206188272e-06, "loss": 0.7767, "step": 10449 }, { "epoch": 0.2, "learning_rate": 4.642547492428757e-06, "loss": 1.0829, "step": 10450 }, { "epoch": 0.2, "learning_rate": 4.642468770669035e-06, "loss": 0.9719, "step": 10451 }, { "epoch": 0.2, "learning_rate": 4.642390040909401e-06, "loss": 1.0283, "step": 10452 }, { "epoch": 0.2, "learning_rate": 4.642311303150148e-06, "loss": 0.7441, "step": 10453 }, { "epoch": 0.2, "learning_rate": 4.64223255739157e-06, "loss": 0.8831, "step": 10454 }, { "epoch": 0.2, "learning_rate": 4.642153803633961e-06, "loss": 0.8267, "step": 10455 }, { "epoch": 0.2, "learning_rate": 4.642075041877616e-06, "loss": 1.0291, "step": 10456 }, { "epoch": 0.2, "learning_rate": 4.641996272122828e-06, "loss": 1.0988, "step": 10457 }, { "epoch": 0.2, "learning_rate": 4.641917494369892e-06, "loss": 0.8109, "step": 10458 }, { "epoch": 0.2, "learning_rate": 4.641838708619102e-06, "loss": 0.9082, "step": 10459 }, { "epoch": 0.2, "learning_rate": 4.641759914870752e-06, "loss": 1.045, "step": 10460 }, { "epoch": 0.2, "learning_rate": 4.641681113125135e-06, "loss": 1.095, "step": 10461 }, { "epoch": 0.2, "learning_rate": 4.641602303382547e-06, "loss": 1.1379, "step": 10462 }, { "epoch": 0.2, "learning_rate": 4.6415234856432825e-06, "loss": 1.0168, "step": 10463 }, { "epoch": 0.2, "learning_rate": 4.641444659907634e-06, "loss": 1.0104, "step": 10464 }, { "epoch": 0.2, "learning_rate": 4.641365826175898e-06, "loss": 0.974, "step": 10465 }, { "epoch": 0.2, "learning_rate": 4.641286984448365e-06, "loss": 1.246, "step": 10466 }, { "epoch": 0.2, "learning_rate": 4.6412081347253344e-06, "loss": 0.8745, "step": 10467 }, { "epoch": 0.2, "learning_rate": 4.641129277007098e-06, "loss": 1.0349, "step": 10468 }, { "epoch": 0.2, "learning_rate": 4.64105041129395e-06, "loss": 0.9692, "step": 10469 }, { "epoch": 0.2, "learning_rate": 4.6409715375861854e-06, "loss": 1.0494, "step": 10470 }, { "epoch": 0.2, "learning_rate": 4.640892655884099e-06, "loss": 0.8569, "step": 10471 }, { "epoch": 0.2, "learning_rate": 4.640813766187985e-06, "loss": 1.0305, "step": 10472 }, { "epoch": 0.2, "learning_rate": 4.640734868498138e-06, "loss": 0.9675, "step": 10473 }, { "epoch": 0.2, "learning_rate": 4.640655962814853e-06, "loss": 1.1621, "step": 10474 }, { "epoch": 0.2, "learning_rate": 4.640577049138424e-06, "loss": 1.0183, "step": 10475 }, { "epoch": 0.2, "learning_rate": 4.640498127469145e-06, "loss": 1.0658, "step": 10476 }, { "epoch": 0.2, "learning_rate": 4.640419197807314e-06, "loss": 1.0245, "step": 10477 }, { "epoch": 0.2, "learning_rate": 4.640340260153221e-06, "loss": 1.0726, "step": 10478 }, { "epoch": 0.2, "learning_rate": 4.640261314507164e-06, "loss": 0.8816, "step": 10479 }, { "epoch": 0.2, "learning_rate": 4.6401823608694366e-06, "loss": 0.7955, "step": 10480 }, { "epoch": 0.2, "learning_rate": 4.640103399240334e-06, "loss": 1.1153, "step": 10481 }, { "epoch": 0.2, "learning_rate": 4.640024429620151e-06, "loss": 0.993, "step": 10482 }, { "epoch": 0.2, "learning_rate": 4.639945452009182e-06, "loss": 1.1207, "step": 10483 }, { "epoch": 0.2, "learning_rate": 4.639866466407723e-06, "loss": 0.9491, "step": 10484 }, { "epoch": 0.2, "learning_rate": 4.639787472816068e-06, "loss": 0.7675, "step": 10485 }, { "epoch": 0.2, "learning_rate": 4.639708471234512e-06, "loss": 0.7632, "step": 10486 }, { "epoch": 0.2, "learning_rate": 4.63962946166335e-06, "loss": 1.2644, "step": 10487 }, { "epoch": 0.2, "learning_rate": 4.639550444102878e-06, "loss": 0.827, "step": 10488 }, { "epoch": 0.2, "learning_rate": 4.639471418553389e-06, "loss": 0.8668, "step": 10489 }, { "epoch": 0.2, "learning_rate": 4.63939238501518e-06, "loss": 1.0186, "step": 10490 }, { "epoch": 0.2, "learning_rate": 4.639313343488545e-06, "loss": 0.9443, "step": 10491 }, { "epoch": 0.2, "learning_rate": 4.6392342939737814e-06, "loss": 0.9284, "step": 10492 }, { "epoch": 0.2, "learning_rate": 4.639155236471181e-06, "loss": 0.9978, "step": 10493 }, { "epoch": 0.2, "learning_rate": 4.63907617098104e-06, "loss": 1.2121, "step": 10494 }, { "epoch": 0.2, "learning_rate": 4.638997097503655e-06, "loss": 0.9045, "step": 10495 }, { "epoch": 0.2, "learning_rate": 4.63891801603932e-06, "loss": 0.8987, "step": 10496 }, { "epoch": 0.2, "learning_rate": 4.638838926588332e-06, "loss": 0.9506, "step": 10497 }, { "epoch": 0.2, "learning_rate": 4.638759829150983e-06, "loss": 0.7943, "step": 10498 }, { "epoch": 0.2, "learning_rate": 4.6386807237275714e-06, "loss": 0.9039, "step": 10499 }, { "epoch": 0.2, "learning_rate": 4.638601610318392e-06, "loss": 1.075, "step": 10500 }, { "epoch": 0.2, "learning_rate": 4.638522488923739e-06, "loss": 0.8415, "step": 10501 }, { "epoch": 0.2, "learning_rate": 4.638443359543909e-06, "loss": 0.9017, "step": 10502 }, { "epoch": 0.2, "learning_rate": 4.638364222179197e-06, "loss": 0.8687, "step": 10503 }, { "epoch": 0.2, "learning_rate": 4.638285076829898e-06, "loss": 0.9536, "step": 10504 }, { "epoch": 0.2, "learning_rate": 4.638205923496309e-06, "loss": 0.9246, "step": 10505 }, { "epoch": 0.2, "learning_rate": 4.638126762178724e-06, "loss": 1.1334, "step": 10506 }, { "epoch": 0.2, "learning_rate": 4.638047592877439e-06, "loss": 0.8014, "step": 10507 }, { "epoch": 0.2, "learning_rate": 4.637968415592751e-06, "loss": 0.7507, "step": 10508 }, { "epoch": 0.2, "learning_rate": 4.637889230324953e-06, "loss": 0.9401, "step": 10509 }, { "epoch": 0.2, "learning_rate": 4.637810037074344e-06, "loss": 1.0582, "step": 10510 }, { "epoch": 0.2, "learning_rate": 4.637730835841216e-06, "loss": 0.9995, "step": 10511 }, { "epoch": 0.2, "learning_rate": 4.637651626625868e-06, "loss": 1.178, "step": 10512 }, { "epoch": 0.2, "learning_rate": 4.637572409428593e-06, "loss": 0.9636, "step": 10513 }, { "epoch": 0.2, "learning_rate": 4.637493184249689e-06, "loss": 0.9495, "step": 10514 }, { "epoch": 0.2, "learning_rate": 4.637413951089451e-06, "loss": 0.9763, "step": 10515 }, { "epoch": 0.2, "learning_rate": 4.6373347099481755e-06, "loss": 0.9304, "step": 10516 }, { "epoch": 0.2, "learning_rate": 4.637255460826156e-06, "loss": 1.097, "step": 10517 }, { "epoch": 0.2, "learning_rate": 4.637176203723692e-06, "loss": 1.0755, "step": 10518 }, { "epoch": 0.2, "learning_rate": 4.637096938641077e-06, "loss": 0.8462, "step": 10519 }, { "epoch": 0.2, "learning_rate": 4.637017665578607e-06, "loss": 0.8202, "step": 10520 }, { "epoch": 0.2, "learning_rate": 4.636938384536579e-06, "loss": 1.0345, "step": 10521 }, { "epoch": 0.2, "learning_rate": 4.636859095515288e-06, "loss": 0.8979, "step": 10522 }, { "epoch": 0.2, "learning_rate": 4.636779798515031e-06, "loss": 0.8268, "step": 10523 }, { "epoch": 0.2, "learning_rate": 4.636700493536104e-06, "loss": 1.0394, "step": 10524 }, { "epoch": 0.2, "learning_rate": 4.636621180578802e-06, "loss": 1.166, "step": 10525 }, { "epoch": 0.2, "learning_rate": 4.636541859643423e-06, "loss": 1.2295, "step": 10526 }, { "epoch": 0.2, "learning_rate": 4.6364625307302625e-06, "loss": 1.1157, "step": 10527 }, { "epoch": 0.2, "learning_rate": 4.636383193839615e-06, "loss": 0.8806, "step": 10528 }, { "epoch": 0.2, "learning_rate": 4.636303848971779e-06, "loss": 0.9277, "step": 10529 }, { "epoch": 0.2, "learning_rate": 4.636224496127051e-06, "loss": 1.0966, "step": 10530 }, { "epoch": 0.2, "learning_rate": 4.636145135305725e-06, "loss": 1.2283, "step": 10531 }, { "epoch": 0.2, "learning_rate": 4.636065766508098e-06, "loss": 1.0043, "step": 10532 }, { "epoch": 0.2, "learning_rate": 4.635986389734468e-06, "loss": 1.0135, "step": 10533 }, { "epoch": 0.2, "learning_rate": 4.635907004985129e-06, "loss": 0.9407, "step": 10534 }, { "epoch": 0.2, "learning_rate": 4.635827612260381e-06, "loss": 0.713, "step": 10535 }, { "epoch": 0.2, "learning_rate": 4.6357482115605164e-06, "loss": 0.9744, "step": 10536 }, { "epoch": 0.2, "learning_rate": 4.635668802885834e-06, "loss": 0.9677, "step": 10537 }, { "epoch": 0.2, "learning_rate": 4.63558938623663e-06, "loss": 1.2675, "step": 10538 }, { "epoch": 0.2, "learning_rate": 4.6355099616132e-06, "loss": 0.9174, "step": 10539 }, { "epoch": 0.2, "learning_rate": 4.635430529015842e-06, "loss": 0.8901, "step": 10540 }, { "epoch": 0.2, "learning_rate": 4.635351088444852e-06, "loss": 0.9957, "step": 10541 }, { "epoch": 0.2, "learning_rate": 4.635271639900525e-06, "loss": 0.9334, "step": 10542 }, { "epoch": 0.2, "learning_rate": 4.635192183383161e-06, "loss": 1.0722, "step": 10543 }, { "epoch": 0.2, "learning_rate": 4.635112718893054e-06, "loss": 1.0557, "step": 10544 }, { "epoch": 0.2, "learning_rate": 4.635033246430501e-06, "loss": 0.8011, "step": 10545 }, { "epoch": 0.2, "learning_rate": 4.6349537659958e-06, "loss": 0.7335, "step": 10546 }, { "epoch": 0.2, "learning_rate": 4.634874277589248e-06, "loss": 0.8793, "step": 10547 }, { "epoch": 0.2, "learning_rate": 4.63479478121114e-06, "loss": 0.9246, "step": 10548 }, { "epoch": 0.2, "learning_rate": 4.634715276861773e-06, "loss": 0.9218, "step": 10549 }, { "epoch": 0.2, "learning_rate": 4.634635764541446e-06, "loss": 1.0822, "step": 10550 }, { "epoch": 0.2, "learning_rate": 4.634556244250453e-06, "loss": 1.0538, "step": 10551 }, { "epoch": 0.2, "learning_rate": 4.634476715989094e-06, "loss": 0.8336, "step": 10552 }, { "epoch": 0.2, "learning_rate": 4.6343971797576634e-06, "loss": 0.8821, "step": 10553 }, { "epoch": 0.2, "learning_rate": 4.634317635556459e-06, "loss": 0.9731, "step": 10554 }, { "epoch": 0.2, "learning_rate": 4.634238083385778e-06, "loss": 0.8965, "step": 10555 }, { "epoch": 0.2, "learning_rate": 4.634158523245918e-06, "loss": 1.0724, "step": 10556 }, { "epoch": 0.2, "learning_rate": 4.6340789551371755e-06, "loss": 0.9828, "step": 10557 }, { "epoch": 0.2, "learning_rate": 4.633999379059848e-06, "loss": 0.9902, "step": 10558 }, { "epoch": 0.2, "learning_rate": 4.6339197950142316e-06, "loss": 0.8633, "step": 10559 }, { "epoch": 0.2, "learning_rate": 4.633840203000624e-06, "loss": 0.8556, "step": 10560 }, { "epoch": 0.2, "learning_rate": 4.6337606030193224e-06, "loss": 0.9608, "step": 10561 }, { "epoch": 0.2, "learning_rate": 4.633680995070626e-06, "loss": 1.0505, "step": 10562 }, { "epoch": 0.2, "learning_rate": 4.6336013791548275e-06, "loss": 1.0947, "step": 10563 }, { "epoch": 0.2, "learning_rate": 4.633521755272228e-06, "loss": 0.7487, "step": 10564 }, { "epoch": 0.2, "learning_rate": 4.633442123423124e-06, "loss": 0.9869, "step": 10565 }, { "epoch": 0.2, "learning_rate": 4.633362483607811e-06, "loss": 0.8126, "step": 10566 }, { "epoch": 0.2, "learning_rate": 4.6332828358265905e-06, "loss": 0.7973, "step": 10567 }, { "epoch": 0.2, "learning_rate": 4.633203180079756e-06, "loss": 1.1495, "step": 10568 }, { "epoch": 0.2, "learning_rate": 4.6331235163676054e-06, "loss": 0.9552, "step": 10569 }, { "epoch": 0.2, "learning_rate": 4.633043844690438e-06, "loss": 1.0077, "step": 10570 }, { "epoch": 0.2, "learning_rate": 4.63296416504855e-06, "loss": 1.0261, "step": 10571 }, { "epoch": 0.2, "learning_rate": 4.632884477442239e-06, "loss": 0.9864, "step": 10572 }, { "epoch": 0.2, "learning_rate": 4.632804781871804e-06, "loss": 0.9473, "step": 10573 }, { "epoch": 0.2, "learning_rate": 4.6327250783375395e-06, "loss": 1.092, "step": 10574 }, { "epoch": 0.2, "learning_rate": 4.632645366839746e-06, "loss": 1.1515, "step": 10575 }, { "epoch": 0.2, "learning_rate": 4.632565647378719e-06, "loss": 1.1011, "step": 10576 }, { "epoch": 0.2, "learning_rate": 4.632485919954759e-06, "loss": 0.844, "step": 10577 }, { "epoch": 0.2, "learning_rate": 4.632406184568161e-06, "loss": 0.839, "step": 10578 }, { "epoch": 0.2, "learning_rate": 4.632326441219223e-06, "loss": 0.9824, "step": 10579 }, { "epoch": 0.2, "learning_rate": 4.632246689908245e-06, "loss": 0.9828, "step": 10580 }, { "epoch": 0.2, "learning_rate": 4.6321669306355225e-06, "loss": 1.261, "step": 10581 }, { "epoch": 0.2, "learning_rate": 4.632087163401354e-06, "loss": 0.7913, "step": 10582 }, { "epoch": 0.2, "learning_rate": 4.632007388206037e-06, "loss": 0.9941, "step": 10583 }, { "epoch": 0.2, "learning_rate": 4.6319276050498705e-06, "loss": 0.9185, "step": 10584 }, { "epoch": 0.2, "learning_rate": 4.631847813933152e-06, "loss": 0.9308, "step": 10585 }, { "epoch": 0.2, "learning_rate": 4.631768014856178e-06, "loss": 0.9215, "step": 10586 }, { "epoch": 0.2, "learning_rate": 4.631688207819248e-06, "loss": 1.0777, "step": 10587 }, { "epoch": 0.2, "learning_rate": 4.631608392822659e-06, "loss": 1.0254, "step": 10588 }, { "epoch": 0.2, "learning_rate": 4.6315285698667114e-06, "loss": 0.9203, "step": 10589 }, { "epoch": 0.2, "learning_rate": 4.6314487389517e-06, "loss": 0.7776, "step": 10590 }, { "epoch": 0.2, "learning_rate": 4.631368900077924e-06, "loss": 0.8921, "step": 10591 }, { "epoch": 0.2, "learning_rate": 4.631289053245684e-06, "loss": 0.921, "step": 10592 }, { "epoch": 0.2, "learning_rate": 4.631209198455275e-06, "loss": 1.227, "step": 10593 }, { "epoch": 0.2, "learning_rate": 4.6311293357069945e-06, "loss": 1.0552, "step": 10594 }, { "epoch": 0.2, "learning_rate": 4.631049465001144e-06, "loss": 0.955, "step": 10595 }, { "epoch": 0.2, "learning_rate": 4.63096958633802e-06, "loss": 0.9115, "step": 10596 }, { "epoch": 0.2, "learning_rate": 4.6308896997179206e-06, "loss": 1.0392, "step": 10597 }, { "epoch": 0.2, "learning_rate": 4.630809805141144e-06, "loss": 0.9581, "step": 10598 }, { "epoch": 0.2, "learning_rate": 4.63072990260799e-06, "loss": 1.034, "step": 10599 }, { "epoch": 0.2, "learning_rate": 4.630649992118755e-06, "loss": 1.1719, "step": 10600 }, { "epoch": 0.2, "learning_rate": 4.630570073673739e-06, "loss": 0.8501, "step": 10601 }, { "epoch": 0.2, "learning_rate": 4.630490147273239e-06, "loss": 0.7612, "step": 10602 }, { "epoch": 0.2, "learning_rate": 4.630410212917554e-06, "loss": 0.9501, "step": 10603 }, { "epoch": 0.2, "learning_rate": 4.630330270606983e-06, "loss": 0.9541, "step": 10604 }, { "epoch": 0.2, "learning_rate": 4.630250320341825e-06, "loss": 1.0543, "step": 10605 }, { "epoch": 0.2, "learning_rate": 4.630170362122377e-06, "loss": 1.0154, "step": 10606 }, { "epoch": 0.2, "learning_rate": 4.630090395948938e-06, "loss": 0.9767, "step": 10607 }, { "epoch": 0.2, "learning_rate": 4.630010421821806e-06, "loss": 0.8167, "step": 10608 }, { "epoch": 0.2, "learning_rate": 4.629930439741281e-06, "loss": 0.971, "step": 10609 }, { "epoch": 0.2, "learning_rate": 4.629850449707661e-06, "loss": 0.8698, "step": 10610 }, { "epoch": 0.2, "learning_rate": 4.629770451721245e-06, "loss": 0.9218, "step": 10611 }, { "epoch": 0.2, "learning_rate": 4.629690445782331e-06, "loss": 0.9066, "step": 10612 }, { "epoch": 0.2, "learning_rate": 4.629610431891218e-06, "loss": 1.1105, "step": 10613 }, { "epoch": 0.2, "learning_rate": 4.629530410048207e-06, "loss": 0.8439, "step": 10614 }, { "epoch": 0.2, "learning_rate": 4.629450380253592e-06, "loss": 0.8796, "step": 10615 }, { "epoch": 0.2, "learning_rate": 4.629370342507675e-06, "loss": 0.8622, "step": 10616 }, { "epoch": 0.2, "learning_rate": 4.629290296810756e-06, "loss": 0.8819, "step": 10617 }, { "epoch": 0.2, "learning_rate": 4.629210243163131e-06, "loss": 1.4316, "step": 10618 }, { "epoch": 0.2, "learning_rate": 4.629130181565101e-06, "loss": 1.0188, "step": 10619 }, { "epoch": 0.2, "learning_rate": 4.629050112016964e-06, "loss": 0.9547, "step": 10620 }, { "epoch": 0.2, "learning_rate": 4.628970034519019e-06, "loss": 1.072, "step": 10621 }, { "epoch": 0.2, "learning_rate": 4.628889949071565e-06, "loss": 0.8829, "step": 10622 }, { "epoch": 0.2, "learning_rate": 4.628809855674901e-06, "loss": 0.8569, "step": 10623 }, { "epoch": 0.2, "learning_rate": 4.628729754329327e-06, "loss": 0.8695, "step": 10624 }, { "epoch": 0.2, "learning_rate": 4.628649645035141e-06, "loss": 1.0333, "step": 10625 }, { "epoch": 0.2, "learning_rate": 4.6285695277926426e-06, "loss": 0.7558, "step": 10626 }, { "epoch": 0.2, "learning_rate": 4.6284894026021304e-06, "loss": 0.8319, "step": 10627 }, { "epoch": 0.2, "learning_rate": 4.628409269463904e-06, "loss": 0.9113, "step": 10628 }, { "epoch": 0.2, "learning_rate": 4.628329128378263e-06, "loss": 0.9068, "step": 10629 }, { "epoch": 0.2, "learning_rate": 4.628248979345506e-06, "loss": 1.048, "step": 10630 }, { "epoch": 0.2, "learning_rate": 4.628168822365934e-06, "loss": 1.0629, "step": 10631 }, { "epoch": 0.2, "learning_rate": 4.6280886574398435e-06, "loss": 0.8866, "step": 10632 }, { "epoch": 0.2, "learning_rate": 4.628008484567535e-06, "loss": 0.9407, "step": 10633 }, { "epoch": 0.2, "learning_rate": 4.627928303749308e-06, "loss": 1.0007, "step": 10634 }, { "epoch": 0.2, "learning_rate": 4.627848114985463e-06, "loss": 0.8246, "step": 10635 }, { "epoch": 0.2, "learning_rate": 4.627767918276298e-06, "loss": 0.7468, "step": 10636 }, { "epoch": 0.2, "learning_rate": 4.627687713622113e-06, "loss": 0.9219, "step": 10637 }, { "epoch": 0.2, "learning_rate": 4.6276075010232065e-06, "loss": 1.0582, "step": 10638 }, { "epoch": 0.2, "learning_rate": 4.627527280479879e-06, "loss": 0.8856, "step": 10639 }, { "epoch": 0.2, "learning_rate": 4.627447051992431e-06, "loss": 0.9612, "step": 10640 }, { "epoch": 0.2, "learning_rate": 4.62736681556116e-06, "loss": 0.909, "step": 10641 }, { "epoch": 0.2, "learning_rate": 4.627286571186367e-06, "loss": 0.8149, "step": 10642 }, { "epoch": 0.2, "learning_rate": 4.62720631886835e-06, "loss": 1.1536, "step": 10643 }, { "epoch": 0.2, "learning_rate": 4.62712605860741e-06, "loss": 1.2324, "step": 10644 }, { "epoch": 0.2, "learning_rate": 4.627045790403848e-06, "loss": 1.0547, "step": 10645 }, { "epoch": 0.2, "learning_rate": 4.626965514257961e-06, "loss": 0.9878, "step": 10646 }, { "epoch": 0.2, "learning_rate": 4.626885230170051e-06, "loss": 0.7506, "step": 10647 }, { "epoch": 0.2, "learning_rate": 4.6268049381404154e-06, "loss": 0.97, "step": 10648 }, { "epoch": 0.2, "learning_rate": 4.6267246381693565e-06, "loss": 1.0969, "step": 10649 }, { "epoch": 0.2, "learning_rate": 4.626644330257173e-06, "loss": 1.1544, "step": 10650 }, { "epoch": 0.2, "learning_rate": 4.626564014404164e-06, "loss": 1.0031, "step": 10651 }, { "epoch": 0.2, "learning_rate": 4.626483690610631e-06, "loss": 0.7974, "step": 10652 }, { "epoch": 0.2, "learning_rate": 4.626403358876872e-06, "loss": 0.9053, "step": 10653 }, { "epoch": 0.2, "learning_rate": 4.6263230192031895e-06, "loss": 0.8318, "step": 10654 }, { "epoch": 0.2, "learning_rate": 4.6262426715898815e-06, "loss": 1.1213, "step": 10655 }, { "epoch": 0.2, "learning_rate": 4.626162316037247e-06, "loss": 1.2078, "step": 10656 }, { "epoch": 0.2, "learning_rate": 4.626081952545589e-06, "loss": 0.864, "step": 10657 }, { "epoch": 0.2, "learning_rate": 4.626001581115207e-06, "loss": 1.0085, "step": 10658 }, { "epoch": 0.2, "learning_rate": 4.6259212017464e-06, "loss": 0.9213, "step": 10659 }, { "epoch": 0.2, "learning_rate": 4.625840814439467e-06, "loss": 0.9428, "step": 10660 }, { "epoch": 0.2, "learning_rate": 4.62576041919471e-06, "loss": 0.9191, "step": 10661 }, { "epoch": 0.2, "learning_rate": 4.625680016012429e-06, "loss": 1.1364, "step": 10662 }, { "epoch": 0.2, "learning_rate": 4.625599604892924e-06, "loss": 0.9804, "step": 10663 }, { "epoch": 0.2, "learning_rate": 4.6255191858364955e-06, "loss": 0.8003, "step": 10664 }, { "epoch": 0.2, "learning_rate": 4.625438758843443e-06, "loss": 0.9623, "step": 10665 }, { "epoch": 0.2, "learning_rate": 4.625358323914068e-06, "loss": 1.0198, "step": 10666 }, { "epoch": 0.2, "learning_rate": 4.625277881048671e-06, "loss": 0.9724, "step": 10667 }, { "epoch": 0.2, "learning_rate": 4.62519743024755e-06, "loss": 1.0766, "step": 10668 }, { "epoch": 0.2, "learning_rate": 4.625116971511008e-06, "loss": 1.2148, "step": 10669 }, { "epoch": 0.2, "learning_rate": 4.625036504839343e-06, "loss": 0.8275, "step": 10670 }, { "epoch": 0.2, "learning_rate": 4.6249560302328575e-06, "loss": 0.9094, "step": 10671 }, { "epoch": 0.2, "learning_rate": 4.624875547691851e-06, "loss": 1.0076, "step": 10672 }, { "epoch": 0.2, "learning_rate": 4.624795057216626e-06, "loss": 0.744, "step": 10673 }, { "epoch": 0.2, "learning_rate": 4.62471455880748e-06, "loss": 1.1088, "step": 10674 }, { "epoch": 0.2, "learning_rate": 4.624634052464715e-06, "loss": 0.9812, "step": 10675 }, { "epoch": 0.2, "learning_rate": 4.624553538188632e-06, "loss": 0.8968, "step": 10676 }, { "epoch": 0.2, "learning_rate": 4.624473015979531e-06, "loss": 0.9269, "step": 10677 }, { "epoch": 0.2, "learning_rate": 4.624392485837713e-06, "loss": 0.8591, "step": 10678 }, { "epoch": 0.2, "learning_rate": 4.624311947763479e-06, "loss": 0.8625, "step": 10679 }, { "epoch": 0.2, "learning_rate": 4.6242314017571284e-06, "loss": 1.0332, "step": 10680 }, { "epoch": 0.2, "learning_rate": 4.624150847818964e-06, "loss": 1.0801, "step": 10681 }, { "epoch": 0.2, "learning_rate": 4.624070285949285e-06, "loss": 1.0786, "step": 10682 }, { "epoch": 0.2, "learning_rate": 4.623989716148392e-06, "loss": 1.069, "step": 10683 }, { "epoch": 0.2, "learning_rate": 4.623909138416587e-06, "loss": 0.8932, "step": 10684 }, { "epoch": 0.2, "learning_rate": 4.62382855275417e-06, "loss": 0.9691, "step": 10685 }, { "epoch": 0.2, "learning_rate": 4.623747959161443e-06, "loss": 0.8812, "step": 10686 }, { "epoch": 0.2, "learning_rate": 4.6236673576387056e-06, "loss": 1.0599, "step": 10687 }, { "epoch": 0.2, "learning_rate": 4.623586748186261e-06, "loss": 0.9279, "step": 10688 }, { "epoch": 0.2, "learning_rate": 4.623506130804407e-06, "loss": 0.9088, "step": 10689 }, { "epoch": 0.2, "learning_rate": 4.623425505493446e-06, "loss": 0.8871, "step": 10690 }, { "epoch": 0.2, "learning_rate": 4.62334487225368e-06, "loss": 1.0751, "step": 10691 }, { "epoch": 0.2, "learning_rate": 4.6232642310854095e-06, "loss": 0.9622, "step": 10692 }, { "epoch": 0.2, "learning_rate": 4.623183581988935e-06, "loss": 1.0606, "step": 10693 }, { "epoch": 0.2, "learning_rate": 4.623102924964558e-06, "loss": 0.9725, "step": 10694 }, { "epoch": 0.2, "learning_rate": 4.6230222600125805e-06, "loss": 0.984, "step": 10695 }, { "epoch": 0.2, "learning_rate": 4.622941587133302e-06, "loss": 0.8652, "step": 10696 }, { "epoch": 0.2, "learning_rate": 4.6228609063270255e-06, "loss": 0.8294, "step": 10697 }, { "epoch": 0.2, "learning_rate": 4.622780217594051e-06, "loss": 0.9954, "step": 10698 }, { "epoch": 0.2, "learning_rate": 4.62269952093468e-06, "loss": 1.1416, "step": 10699 }, { "epoch": 0.2, "learning_rate": 4.622618816349215e-06, "loss": 0.9498, "step": 10700 }, { "epoch": 0.2, "learning_rate": 4.622538103837955e-06, "loss": 0.9417, "step": 10701 }, { "epoch": 0.2, "learning_rate": 4.622457383401204e-06, "loss": 0.7843, "step": 10702 }, { "epoch": 0.2, "learning_rate": 4.622376655039262e-06, "loss": 0.9005, "step": 10703 }, { "epoch": 0.2, "learning_rate": 4.622295918752431e-06, "loss": 1.0191, "step": 10704 }, { "epoch": 0.2, "learning_rate": 4.6222151745410116e-06, "loss": 0.9416, "step": 10705 }, { "epoch": 0.2, "learning_rate": 4.622134422405306e-06, "loss": 1.0466, "step": 10706 }, { "epoch": 0.2, "learning_rate": 4.622053662345616e-06, "loss": 0.9196, "step": 10707 }, { "epoch": 0.2, "learning_rate": 4.621972894362241e-06, "loss": 0.766, "step": 10708 }, { "epoch": 0.2, "learning_rate": 4.621892118455486e-06, "loss": 0.9402, "step": 10709 }, { "epoch": 0.2, "learning_rate": 4.62181133462565e-06, "loss": 0.9749, "step": 10710 }, { "epoch": 0.2, "learning_rate": 4.621730542873036e-06, "loss": 1.1268, "step": 10711 }, { "epoch": 0.2, "learning_rate": 4.621649743197945e-06, "loss": 0.9912, "step": 10712 }, { "epoch": 0.2, "learning_rate": 4.621568935600679e-06, "loss": 0.9341, "step": 10713 }, { "epoch": 0.2, "learning_rate": 4.6214881200815394e-06, "loss": 1.027, "step": 10714 }, { "epoch": 0.2, "learning_rate": 4.621407296640828e-06, "loss": 0.896, "step": 10715 }, { "epoch": 0.2, "learning_rate": 4.621326465278847e-06, "loss": 1.0219, "step": 10716 }, { "epoch": 0.2, "learning_rate": 4.621245625995899e-06, "loss": 0.8297, "step": 10717 }, { "epoch": 0.2, "learning_rate": 4.621164778792284e-06, "loss": 0.9897, "step": 10718 }, { "epoch": 0.2, "learning_rate": 4.621083923668305e-06, "loss": 0.9341, "step": 10719 }, { "epoch": 0.2, "learning_rate": 4.621003060624263e-06, "loss": 0.6997, "step": 10720 }, { "epoch": 0.2, "learning_rate": 4.620922189660461e-06, "loss": 0.8151, "step": 10721 }, { "epoch": 0.2, "learning_rate": 4.620841310777201e-06, "loss": 0.976, "step": 10722 }, { "epoch": 0.2, "learning_rate": 4.620760423974784e-06, "loss": 0.627, "step": 10723 }, { "epoch": 0.2, "learning_rate": 4.620679529253513e-06, "loss": 1.004, "step": 10724 }, { "epoch": 0.2, "learning_rate": 4.620598626613689e-06, "loss": 1.1603, "step": 10725 }, { "epoch": 0.2, "learning_rate": 4.620517716055616e-06, "loss": 0.9607, "step": 10726 }, { "epoch": 0.2, "learning_rate": 4.6204367975795935e-06, "loss": 1.0509, "step": 10727 }, { "epoch": 0.2, "learning_rate": 4.620355871185925e-06, "loss": 0.8513, "step": 10728 }, { "epoch": 0.2, "learning_rate": 4.620274936874914e-06, "loss": 0.8135, "step": 10729 }, { "epoch": 0.2, "learning_rate": 4.620193994646861e-06, "loss": 0.8918, "step": 10730 }, { "epoch": 0.2, "learning_rate": 4.620113044502068e-06, "loss": 1.2597, "step": 10731 }, { "epoch": 0.2, "learning_rate": 4.620032086440838e-06, "loss": 1.1716, "step": 10732 }, { "epoch": 0.2, "learning_rate": 4.619951120463474e-06, "loss": 0.8946, "step": 10733 }, { "epoch": 0.2, "learning_rate": 4.619870146570276e-06, "loss": 0.8612, "step": 10734 }, { "epoch": 0.2, "learning_rate": 4.619789164761549e-06, "loss": 0.8523, "step": 10735 }, { "epoch": 0.2, "learning_rate": 4.619708175037594e-06, "loss": 0.8625, "step": 10736 }, { "epoch": 0.2, "learning_rate": 4.619627177398714e-06, "loss": 1.0451, "step": 10737 }, { "epoch": 0.2, "learning_rate": 4.61954617184521e-06, "loss": 0.9834, "step": 10738 }, { "epoch": 0.2, "learning_rate": 4.6194651583773875e-06, "loss": 1.103, "step": 10739 }, { "epoch": 0.2, "learning_rate": 4.619384136995546e-06, "loss": 0.968, "step": 10740 }, { "epoch": 0.2, "learning_rate": 4.619303107699989e-06, "loss": 0.8332, "step": 10741 }, { "epoch": 0.2, "learning_rate": 4.619222070491019e-06, "loss": 0.7501, "step": 10742 }, { "epoch": 0.2, "learning_rate": 4.619141025368939e-06, "loss": 1.0703, "step": 10743 }, { "epoch": 0.2, "learning_rate": 4.619059972334052e-06, "loss": 1.0545, "step": 10744 }, { "epoch": 0.2, "learning_rate": 4.618978911386659e-06, "loss": 0.9012, "step": 10745 }, { "epoch": 0.2, "learning_rate": 4.618897842527064e-06, "loss": 0.9589, "step": 10746 }, { "epoch": 0.2, "learning_rate": 4.61881676575557e-06, "loss": 0.8479, "step": 10747 }, { "epoch": 0.2, "learning_rate": 4.6187356810724786e-06, "loss": 0.927, "step": 10748 }, { "epoch": 0.2, "learning_rate": 4.618654588478093e-06, "loss": 1.0853, "step": 10749 }, { "epoch": 0.2, "learning_rate": 4.618573487972716e-06, "loss": 0.9555, "step": 10750 }, { "epoch": 0.2, "learning_rate": 4.618492379556652e-06, "loss": 0.8828, "step": 10751 }, { "epoch": 0.2, "learning_rate": 4.618411263230201e-06, "loss": 0.9283, "step": 10752 }, { "epoch": 0.2, "learning_rate": 4.618330138993667e-06, "loss": 0.9524, "step": 10753 }, { "epoch": 0.2, "learning_rate": 4.618249006847354e-06, "loss": 0.8916, "step": 10754 }, { "epoch": 0.2, "learning_rate": 4.618167866791564e-06, "loss": 0.8534, "step": 10755 }, { "epoch": 0.2, "learning_rate": 4.618086718826601e-06, "loss": 0.9077, "step": 10756 }, { "epoch": 0.2, "learning_rate": 4.618005562952766e-06, "loss": 0.8314, "step": 10757 }, { "epoch": 0.2, "learning_rate": 4.617924399170364e-06, "loss": 0.915, "step": 10758 }, { "epoch": 0.2, "learning_rate": 4.617843227479696e-06, "loss": 0.92, "step": 10759 }, { "epoch": 0.2, "learning_rate": 4.617762047881067e-06, "loss": 0.9529, "step": 10760 }, { "epoch": 0.2, "learning_rate": 4.617680860374779e-06, "loss": 0.9175, "step": 10761 }, { "epoch": 0.2, "learning_rate": 4.617599664961137e-06, "loss": 1.2497, "step": 10762 }, { "epoch": 0.2, "learning_rate": 4.617518461640441e-06, "loss": 1.1713, "step": 10763 }, { "epoch": 0.2, "learning_rate": 4.6174372504129974e-06, "loss": 0.9299, "step": 10764 }, { "epoch": 0.2, "learning_rate": 4.617356031279107e-06, "loss": 0.9296, "step": 10765 }, { "epoch": 0.2, "learning_rate": 4.6172748042390745e-06, "loss": 0.9473, "step": 10766 }, { "epoch": 0.2, "learning_rate": 4.617193569293203e-06, "loss": 0.7683, "step": 10767 }, { "epoch": 0.2, "learning_rate": 4.617112326441796e-06, "loss": 1.2416, "step": 10768 }, { "epoch": 0.2, "learning_rate": 4.617031075685156e-06, "loss": 1.1901, "step": 10769 }, { "epoch": 0.2, "learning_rate": 4.616949817023587e-06, "loss": 0.9763, "step": 10770 }, { "epoch": 0.2, "learning_rate": 4.616868550457392e-06, "loss": 1.0816, "step": 10771 }, { "epoch": 0.2, "learning_rate": 4.616787275986874e-06, "loss": 0.8418, "step": 10772 }, { "epoch": 0.2, "learning_rate": 4.616705993612338e-06, "loss": 0.8419, "step": 10773 }, { "epoch": 0.2, "learning_rate": 4.616624703334087e-06, "loss": 0.9485, "step": 10774 }, { "epoch": 0.2, "learning_rate": 4.616543405152424e-06, "loss": 1.0966, "step": 10775 }, { "epoch": 0.2, "learning_rate": 4.616462099067654e-06, "loss": 0.8579, "step": 10776 }, { "epoch": 0.2, "learning_rate": 4.616380785080077e-06, "loss": 0.8341, "step": 10777 }, { "epoch": 0.2, "learning_rate": 4.61629946319e-06, "loss": 0.6254, "step": 10778 }, { "epoch": 0.2, "learning_rate": 4.616218133397727e-06, "loss": 0.7746, "step": 10779 }, { "epoch": 0.2, "learning_rate": 4.6161367957035594e-06, "loss": 1.0122, "step": 10780 }, { "epoch": 0.2, "learning_rate": 4.616055450107802e-06, "loss": 1.0967, "step": 10781 }, { "epoch": 0.2, "learning_rate": 4.615974096610758e-06, "loss": 1.0436, "step": 10782 }, { "epoch": 0.2, "learning_rate": 4.615892735212731e-06, "loss": 0.8718, "step": 10783 }, { "epoch": 0.2, "learning_rate": 4.615811365914027e-06, "loss": 0.8358, "step": 10784 }, { "epoch": 0.2, "learning_rate": 4.615729988714948e-06, "loss": 0.8133, "step": 10785 }, { "epoch": 0.2, "learning_rate": 4.615648603615797e-06, "loss": 0.9845, "step": 10786 }, { "epoch": 0.2, "learning_rate": 4.61556721061688e-06, "loss": 1.083, "step": 10787 }, { "epoch": 0.2, "learning_rate": 4.6154858097185e-06, "loss": 1.0388, "step": 10788 }, { "epoch": 0.2, "learning_rate": 4.61540440092096e-06, "loss": 1.0146, "step": 10789 }, { "epoch": 0.2, "learning_rate": 4.615322984224565e-06, "loss": 1.0643, "step": 10790 }, { "epoch": 0.2, "learning_rate": 4.615241559629619e-06, "loss": 0.9073, "step": 10791 }, { "epoch": 0.2, "learning_rate": 4.615160127136426e-06, "loss": 0.9202, "step": 10792 }, { "epoch": 0.2, "learning_rate": 4.61507868674529e-06, "loss": 1.2117, "step": 10793 }, { "epoch": 0.2, "learning_rate": 4.6149972384565146e-06, "loss": 1.0936, "step": 10794 }, { "epoch": 0.2, "learning_rate": 4.614915782270405e-06, "loss": 0.9492, "step": 10795 }, { "epoch": 0.2, "learning_rate": 4.614834318187263e-06, "loss": 1.0522, "step": 10796 }, { "epoch": 0.2, "learning_rate": 4.6147528462073965e-06, "loss": 0.9572, "step": 10797 }, { "epoch": 0.2, "learning_rate": 4.6146713663311074e-06, "loss": 0.6994, "step": 10798 }, { "epoch": 0.2, "learning_rate": 4.614589878558699e-06, "loss": 0.9741, "step": 10799 }, { "epoch": 0.2, "learning_rate": 4.614508382890479e-06, "loss": 1.0984, "step": 10800 }, { "epoch": 0.2, "learning_rate": 4.614426879326748e-06, "loss": 0.7186, "step": 10801 }, { "epoch": 0.2, "learning_rate": 4.6143453678678115e-06, "loss": 0.7054, "step": 10802 }, { "epoch": 0.2, "learning_rate": 4.6142638485139755e-06, "loss": 0.7831, "step": 10803 }, { "epoch": 0.2, "learning_rate": 4.614182321265543e-06, "loss": 0.977, "step": 10804 }, { "epoch": 0.2, "learning_rate": 4.614100786122817e-06, "loss": 0.952, "step": 10805 }, { "epoch": 0.2, "learning_rate": 4.614019243086105e-06, "loss": 1.0714, "step": 10806 }, { "epoch": 0.2, "learning_rate": 4.613937692155709e-06, "loss": 1.1366, "step": 10807 }, { "epoch": 0.2, "learning_rate": 4.613856133331934e-06, "loss": 1.0856, "step": 10808 }, { "epoch": 0.2, "learning_rate": 4.6137745666150866e-06, "loss": 0.9744, "step": 10809 }, { "epoch": 0.2, "learning_rate": 4.61369299200547e-06, "loss": 0.798, "step": 10810 }, { "epoch": 0.2, "learning_rate": 4.613611409503387e-06, "loss": 1.1016, "step": 10811 }, { "epoch": 0.2, "learning_rate": 4.613529819109145e-06, "loss": 1.229, "step": 10812 }, { "epoch": 0.2, "learning_rate": 4.613448220823046e-06, "loss": 0.9768, "step": 10813 }, { "epoch": 0.2, "learning_rate": 4.6133666146453976e-06, "loss": 0.9579, "step": 10814 }, { "epoch": 0.2, "learning_rate": 4.613285000576503e-06, "loss": 1.0101, "step": 10815 }, { "epoch": 0.2, "learning_rate": 4.6132033786166666e-06, "loss": 0.888, "step": 10816 }, { "epoch": 0.2, "learning_rate": 4.613121748766193e-06, "loss": 0.8367, "step": 10817 }, { "epoch": 0.2, "learning_rate": 4.613040111025388e-06, "loss": 1.1486, "step": 10818 }, { "epoch": 0.2, "learning_rate": 4.612958465394556e-06, "loss": 1.061, "step": 10819 }, { "epoch": 0.2, "learning_rate": 4.612876811874002e-06, "loss": 1.0153, "step": 10820 }, { "epoch": 0.2, "learning_rate": 4.6127951504640314e-06, "loss": 0.9936, "step": 10821 }, { "epoch": 0.2, "learning_rate": 4.612713481164948e-06, "loss": 0.8961, "step": 10822 }, { "epoch": 0.2, "learning_rate": 4.612631803977056e-06, "loss": 0.8566, "step": 10823 }, { "epoch": 0.2, "learning_rate": 4.612550118900663e-06, "loss": 0.9948, "step": 10824 }, { "epoch": 0.2, "learning_rate": 4.612468425936073e-06, "loss": 1.0307, "step": 10825 }, { "epoch": 0.2, "learning_rate": 4.6123867250835896e-06, "loss": 0.893, "step": 10826 }, { "epoch": 0.2, "learning_rate": 4.612305016343519e-06, "loss": 1.0326, "step": 10827 }, { "epoch": 0.2, "learning_rate": 4.612223299716167e-06, "loss": 1.0474, "step": 10828 }, { "epoch": 0.2, "learning_rate": 4.612141575201837e-06, "loss": 0.9147, "step": 10829 }, { "epoch": 0.2, "learning_rate": 4.612059842800836e-06, "loss": 0.9822, "step": 10830 }, { "epoch": 0.2, "learning_rate": 4.611978102513468e-06, "loss": 1.0956, "step": 10831 }, { "epoch": 0.2, "learning_rate": 4.611896354340038e-06, "loss": 0.8911, "step": 10832 }, { "epoch": 0.2, "learning_rate": 4.611814598280853e-06, "loss": 0.9473, "step": 10833 }, { "epoch": 0.2, "learning_rate": 4.611732834336216e-06, "loss": 0.8251, "step": 10834 }, { "epoch": 0.2, "learning_rate": 4.611651062506433e-06, "loss": 0.8727, "step": 10835 }, { "epoch": 0.2, "learning_rate": 4.611569282791811e-06, "loss": 0.9208, "step": 10836 }, { "epoch": 0.2, "learning_rate": 4.611487495192653e-06, "loss": 0.9822, "step": 10837 }, { "epoch": 0.2, "learning_rate": 4.611405699709266e-06, "loss": 0.9152, "step": 10838 }, { "epoch": 0.2, "learning_rate": 4.6113238963419545e-06, "loss": 0.8971, "step": 10839 }, { "epoch": 0.2, "learning_rate": 4.611242085091025e-06, "loss": 0.9844, "step": 10840 }, { "epoch": 0.2, "learning_rate": 4.6111602659567815e-06, "loss": 0.9842, "step": 10841 }, { "epoch": 0.2, "learning_rate": 4.61107843893953e-06, "loss": 0.8971, "step": 10842 }, { "epoch": 0.2, "learning_rate": 4.610996604039577e-06, "loss": 0.9995, "step": 10843 }, { "epoch": 0.2, "learning_rate": 4.610914761257227e-06, "loss": 0.7972, "step": 10844 }, { "epoch": 0.2, "learning_rate": 4.610832910592786e-06, "loss": 0.8864, "step": 10845 }, { "epoch": 0.2, "learning_rate": 4.61075105204656e-06, "loss": 1.0027, "step": 10846 }, { "epoch": 0.2, "learning_rate": 4.610669185618854e-06, "loss": 1.04, "step": 10847 }, { "epoch": 0.2, "learning_rate": 4.610587311309974e-06, "loss": 1.0515, "step": 10848 }, { "epoch": 0.2, "learning_rate": 4.6105054291202264e-06, "loss": 0.9394, "step": 10849 }, { "epoch": 0.2, "learning_rate": 4.6104235390499155e-06, "loss": 1.2031, "step": 10850 }, { "epoch": 0.2, "learning_rate": 4.610341641099349e-06, "loss": 1.1985, "step": 10851 }, { "epoch": 0.2, "learning_rate": 4.6102597352688295e-06, "loss": 0.9651, "step": 10852 }, { "epoch": 0.2, "learning_rate": 4.610177821558666e-06, "loss": 0.9315, "step": 10853 }, { "epoch": 0.2, "learning_rate": 4.610095899969163e-06, "loss": 0.7511, "step": 10854 }, { "epoch": 0.2, "learning_rate": 4.6100139705006265e-06, "loss": 0.9786, "step": 10855 }, { "epoch": 0.2, "learning_rate": 4.609932033153362e-06, "loss": 1.2141, "step": 10856 }, { "epoch": 0.2, "learning_rate": 4.609850087927678e-06, "loss": 1.0696, "step": 10857 }, { "epoch": 0.2, "learning_rate": 4.609768134823877e-06, "loss": 0.8971, "step": 10858 }, { "epoch": 0.2, "learning_rate": 4.609686173842266e-06, "loss": 0.8895, "step": 10859 }, { "epoch": 0.2, "learning_rate": 4.609604204983152e-06, "loss": 0.8685, "step": 10860 }, { "epoch": 0.2, "learning_rate": 4.609522228246841e-06, "loss": 0.8107, "step": 10861 }, { "epoch": 0.2, "learning_rate": 4.609440243633638e-06, "loss": 1.1958, "step": 10862 }, { "epoch": 0.2, "learning_rate": 4.6093582511438505e-06, "loss": 1.0561, "step": 10863 }, { "epoch": 0.2, "learning_rate": 4.609276250777784e-06, "loss": 0.8144, "step": 10864 }, { "epoch": 0.2, "learning_rate": 4.609194242535744e-06, "loss": 0.8493, "step": 10865 }, { "epoch": 0.21, "learning_rate": 4.609112226418038e-06, "loss": 0.8739, "step": 10866 }, { "epoch": 0.21, "learning_rate": 4.609030202424971e-06, "loss": 0.8832, "step": 10867 }, { "epoch": 0.21, "learning_rate": 4.6089481705568505e-06, "loss": 1.1873, "step": 10868 }, { "epoch": 0.21, "learning_rate": 4.6088661308139815e-06, "loss": 0.96, "step": 10869 }, { "epoch": 0.21, "learning_rate": 4.6087840831966715e-06, "loss": 0.8102, "step": 10870 }, { "epoch": 0.21, "learning_rate": 4.608702027705226e-06, "loss": 1.048, "step": 10871 }, { "epoch": 0.21, "learning_rate": 4.608619964339952e-06, "loss": 0.8666, "step": 10872 }, { "epoch": 0.21, "learning_rate": 4.608537893101156e-06, "loss": 0.835, "step": 10873 }, { "epoch": 0.21, "learning_rate": 4.6084558139891444e-06, "loss": 0.947, "step": 10874 }, { "epoch": 0.21, "learning_rate": 4.608373727004223e-06, "loss": 1.0044, "step": 10875 }, { "epoch": 0.21, "learning_rate": 4.608291632146698e-06, "loss": 0.9749, "step": 10876 }, { "epoch": 0.21, "learning_rate": 4.608209529416878e-06, "loss": 0.8761, "step": 10877 }, { "epoch": 0.21, "learning_rate": 4.608127418815067e-06, "loss": 0.9438, "step": 10878 }, { "epoch": 0.21, "learning_rate": 4.608045300341574e-06, "loss": 1.0115, "step": 10879 }, { "epoch": 0.21, "learning_rate": 4.607963173996704e-06, "loss": 0.857, "step": 10880 }, { "epoch": 0.21, "learning_rate": 4.6078810397807635e-06, "loss": 1.1425, "step": 10881 }, { "epoch": 0.21, "learning_rate": 4.607798897694061e-06, "loss": 0.8171, "step": 10882 }, { "epoch": 0.21, "learning_rate": 4.6077167477369015e-06, "loss": 0.8004, "step": 10883 }, { "epoch": 0.21, "learning_rate": 4.607634589909592e-06, "loss": 0.9586, "step": 10884 }, { "epoch": 0.21, "learning_rate": 4.60755242421244e-06, "loss": 0.9304, "step": 10885 }, { "epoch": 0.21, "learning_rate": 4.607470250645752e-06, "loss": 0.8522, "step": 10886 }, { "epoch": 0.21, "learning_rate": 4.607388069209834e-06, "loss": 1.164, "step": 10887 }, { "epoch": 0.21, "learning_rate": 4.607305879904994e-06, "loss": 1.1303, "step": 10888 }, { "epoch": 0.21, "learning_rate": 4.607223682731539e-06, "loss": 0.905, "step": 10889 }, { "epoch": 0.21, "learning_rate": 4.607141477689775e-06, "loss": 0.9445, "step": 10890 }, { "epoch": 0.21, "learning_rate": 4.607059264780008e-06, "loss": 0.9757, "step": 10891 }, { "epoch": 0.21, "learning_rate": 4.606977044002548e-06, "loss": 1.0038, "step": 10892 }, { "epoch": 0.21, "learning_rate": 4.6068948153577e-06, "loss": 1.0681, "step": 10893 }, { "epoch": 0.21, "learning_rate": 4.606812578845771e-06, "loss": 1.1031, "step": 10894 }, { "epoch": 0.21, "learning_rate": 4.606730334467069e-06, "loss": 0.9487, "step": 10895 }, { "epoch": 0.21, "learning_rate": 4.6066480822218996e-06, "loss": 0.9669, "step": 10896 }, { "epoch": 0.21, "learning_rate": 4.606565822110572e-06, "loss": 0.9777, "step": 10897 }, { "epoch": 0.21, "learning_rate": 4.606483554133391e-06, "loss": 0.7842, "step": 10898 }, { "epoch": 0.21, "learning_rate": 4.6064012782906655e-06, "loss": 1.0592, "step": 10899 }, { "epoch": 0.21, "learning_rate": 4.606318994582702e-06, "loss": 1.1834, "step": 10900 }, { "epoch": 0.21, "learning_rate": 4.6062367030098085e-06, "loss": 1.0863, "step": 10901 }, { "epoch": 0.21, "learning_rate": 4.606154403572292e-06, "loss": 1.0959, "step": 10902 }, { "epoch": 0.21, "learning_rate": 4.606072096270459e-06, "loss": 0.9459, "step": 10903 }, { "epoch": 0.21, "learning_rate": 4.605989781104617e-06, "loss": 0.8101, "step": 10904 }, { "epoch": 0.21, "learning_rate": 4.605907458075074e-06, "loss": 1.0322, "step": 10905 }, { "epoch": 0.21, "learning_rate": 4.605825127182137e-06, "loss": 1.1595, "step": 10906 }, { "epoch": 0.21, "learning_rate": 4.605742788426114e-06, "loss": 1.0703, "step": 10907 }, { "epoch": 0.21, "learning_rate": 4.605660441807311e-06, "loss": 0.8958, "step": 10908 }, { "epoch": 0.21, "learning_rate": 4.605578087326038e-06, "loss": 0.7325, "step": 10909 }, { "epoch": 0.21, "learning_rate": 4.6054957249826e-06, "loss": 0.8484, "step": 10910 }, { "epoch": 0.21, "learning_rate": 4.605413354777305e-06, "loss": 1.0892, "step": 10911 }, { "epoch": 0.21, "learning_rate": 4.605330976710462e-06, "loss": 1.0775, "step": 10912 }, { "epoch": 0.21, "learning_rate": 4.605248590782377e-06, "loss": 1.0904, "step": 10913 }, { "epoch": 0.21, "learning_rate": 4.605166196993359e-06, "loss": 0.9813, "step": 10914 }, { "epoch": 0.21, "learning_rate": 4.605083795343715e-06, "loss": 1.0391, "step": 10915 }, { "epoch": 0.21, "learning_rate": 4.6050013858337525e-06, "loss": 0.9394, "step": 10916 }, { "epoch": 0.21, "learning_rate": 4.604918968463779e-06, "loss": 0.8683, "step": 10917 }, { "epoch": 0.21, "learning_rate": 4.604836543234103e-06, "loss": 1.051, "step": 10918 }, { "epoch": 0.21, "learning_rate": 4.6047541101450325e-06, "loss": 1.0906, "step": 10919 }, { "epoch": 0.21, "learning_rate": 4.604671669196873e-06, "loss": 0.9598, "step": 10920 }, { "epoch": 0.21, "learning_rate": 4.604589220389935e-06, "loss": 0.9458, "step": 10921 }, { "epoch": 0.21, "learning_rate": 4.6045067637245255e-06, "loss": 0.926, "step": 10922 }, { "epoch": 0.21, "learning_rate": 4.604424299200952e-06, "loss": 0.9254, "step": 10923 }, { "epoch": 0.21, "learning_rate": 4.604341826819523e-06, "loss": 1.0588, "step": 10924 }, { "epoch": 0.21, "learning_rate": 4.604259346580546e-06, "loss": 1.1312, "step": 10925 }, { "epoch": 0.21, "learning_rate": 4.60417685848433e-06, "loss": 0.9287, "step": 10926 }, { "epoch": 0.21, "learning_rate": 4.6040943625311805e-06, "loss": 0.7451, "step": 10927 }, { "epoch": 0.21, "learning_rate": 4.604011858721408e-06, "loss": 0.864, "step": 10928 }, { "epoch": 0.21, "learning_rate": 4.60392934705532e-06, "loss": 0.8915, "step": 10929 }, { "epoch": 0.21, "learning_rate": 4.603846827533223e-06, "loss": 1.1236, "step": 10930 }, { "epoch": 0.21, "learning_rate": 4.6037643001554275e-06, "loss": 1.0225, "step": 10931 }, { "epoch": 0.21, "learning_rate": 4.60368176492224e-06, "loss": 1.1273, "step": 10932 }, { "epoch": 0.21, "learning_rate": 4.60359922183397e-06, "loss": 1.1068, "step": 10933 }, { "epoch": 0.21, "learning_rate": 4.603516670890924e-06, "loss": 0.928, "step": 10934 }, { "epoch": 0.21, "learning_rate": 4.603434112093412e-06, "loss": 1.0111, "step": 10935 }, { "epoch": 0.21, "learning_rate": 4.603351545441742e-06, "loss": 0.8286, "step": 10936 }, { "epoch": 0.21, "learning_rate": 4.603268970936222e-06, "loss": 1.0634, "step": 10937 }, { "epoch": 0.21, "learning_rate": 4.6031863885771585e-06, "loss": 1.0627, "step": 10938 }, { "epoch": 0.21, "learning_rate": 4.603103798364863e-06, "loss": 0.9794, "step": 10939 }, { "epoch": 0.21, "learning_rate": 4.603021200299642e-06, "loss": 0.8771, "step": 10940 }, { "epoch": 0.21, "learning_rate": 4.602938594381804e-06, "loss": 1.0669, "step": 10941 }, { "epoch": 0.21, "learning_rate": 4.602855980611658e-06, "loss": 0.8411, "step": 10942 }, { "epoch": 0.21, "learning_rate": 4.602773358989512e-06, "loss": 1.122, "step": 10943 }, { "epoch": 0.21, "learning_rate": 4.602690729515675e-06, "loss": 1.0333, "step": 10944 }, { "epoch": 0.21, "learning_rate": 4.602608092190455e-06, "loss": 0.7649, "step": 10945 }, { "epoch": 0.21, "learning_rate": 4.602525447014161e-06, "loss": 0.9224, "step": 10946 }, { "epoch": 0.21, "learning_rate": 4.602442793987102e-06, "loss": 0.9662, "step": 10947 }, { "epoch": 0.21, "learning_rate": 4.602360133109586e-06, "loss": 0.798, "step": 10948 }, { "epoch": 0.21, "learning_rate": 4.602277464381922e-06, "loss": 0.9663, "step": 10949 }, { "epoch": 0.21, "learning_rate": 4.6021947878044174e-06, "loss": 1.0817, "step": 10950 }, { "epoch": 0.21, "learning_rate": 4.602112103377382e-06, "loss": 0.7507, "step": 10951 }, { "epoch": 0.21, "learning_rate": 4.602029411101124e-06, "loss": 0.9067, "step": 10952 }, { "epoch": 0.21, "learning_rate": 4.601946710975953e-06, "loss": 0.9203, "step": 10953 }, { "epoch": 0.21, "learning_rate": 4.6018640030021785e-06, "loss": 0.7657, "step": 10954 }, { "epoch": 0.21, "learning_rate": 4.601781287180107e-06, "loss": 0.9445, "step": 10955 }, { "epoch": 0.21, "learning_rate": 4.60169856351005e-06, "loss": 1.2321, "step": 10956 }, { "epoch": 0.21, "learning_rate": 4.601615831992314e-06, "loss": 0.8694, "step": 10957 }, { "epoch": 0.21, "learning_rate": 4.601533092627209e-06, "loss": 1.0135, "step": 10958 }, { "epoch": 0.21, "learning_rate": 4.601450345415044e-06, "loss": 0.9678, "step": 10959 }, { "epoch": 0.21, "learning_rate": 4.6013675903561274e-06, "loss": 0.9, "step": 10960 }, { "epoch": 0.21, "learning_rate": 4.601284827450769e-06, "loss": 1.0289, "step": 10961 }, { "epoch": 0.21, "learning_rate": 4.601202056699277e-06, "loss": 1.1245, "step": 10962 }, { "epoch": 0.21, "learning_rate": 4.601119278101962e-06, "loss": 0.8768, "step": 10963 }, { "epoch": 0.21, "learning_rate": 4.601036491659131e-06, "loss": 0.7741, "step": 10964 }, { "epoch": 0.21, "learning_rate": 4.600953697371096e-06, "loss": 0.8802, "step": 10965 }, { "epoch": 0.21, "learning_rate": 4.600870895238162e-06, "loss": 0.795, "step": 10966 }, { "epoch": 0.21, "learning_rate": 4.600788085260641e-06, "loss": 0.6958, "step": 10967 }, { "epoch": 0.21, "learning_rate": 4.600705267438843e-06, "loss": 0.9415, "step": 10968 }, { "epoch": 0.21, "learning_rate": 4.600622441773075e-06, "loss": 0.8997, "step": 10969 }, { "epoch": 0.21, "learning_rate": 4.600539608263647e-06, "loss": 0.986, "step": 10970 }, { "epoch": 0.21, "learning_rate": 4.600456766910869e-06, "loss": 1.0024, "step": 10971 }, { "epoch": 0.21, "learning_rate": 4.600373917715049e-06, "loss": 0.9282, "step": 10972 }, { "epoch": 0.21, "learning_rate": 4.600291060676498e-06, "loss": 0.8132, "step": 10973 }, { "epoch": 0.21, "learning_rate": 4.600208195795525e-06, "loss": 0.961, "step": 10974 }, { "epoch": 0.21, "learning_rate": 4.600125323072438e-06, "loss": 1.095, "step": 10975 }, { "epoch": 0.21, "learning_rate": 4.6000424425075485e-06, "loss": 0.7809, "step": 10976 }, { "epoch": 0.21, "learning_rate": 4.599959554101164e-06, "loss": 0.9196, "step": 10977 }, { "epoch": 0.21, "learning_rate": 4.599876657853595e-06, "loss": 0.9904, "step": 10978 }, { "epoch": 0.21, "learning_rate": 4.599793753765151e-06, "loss": 0.8962, "step": 10979 }, { "epoch": 0.21, "learning_rate": 4.599710841836142e-06, "loss": 1.0078, "step": 10980 }, { "epoch": 0.21, "learning_rate": 4.599627922066876e-06, "loss": 1.1122, "step": 10981 }, { "epoch": 0.21, "learning_rate": 4.599544994457665e-06, "loss": 0.9073, "step": 10982 }, { "epoch": 0.21, "learning_rate": 4.599462059008817e-06, "loss": 1.0312, "step": 10983 }, { "epoch": 0.21, "learning_rate": 4.599379115720641e-06, "loss": 0.838, "step": 10984 }, { "epoch": 0.21, "learning_rate": 4.5992961645934484e-06, "loss": 1.0969, "step": 10985 }, { "epoch": 0.21, "learning_rate": 4.599213205627549e-06, "loss": 0.9117, "step": 10986 }, { "epoch": 0.21, "learning_rate": 4.599130238823251e-06, "loss": 1.0354, "step": 10987 }, { "epoch": 0.21, "learning_rate": 4.599047264180866e-06, "loss": 0.9523, "step": 10988 }, { "epoch": 0.21, "learning_rate": 4.598964281700702e-06, "loss": 0.903, "step": 10989 }, { "epoch": 0.21, "learning_rate": 4.59888129138307e-06, "loss": 0.9926, "step": 10990 }, { "epoch": 0.21, "learning_rate": 4.598798293228279e-06, "loss": 0.9334, "step": 10991 }, { "epoch": 0.21, "learning_rate": 4.5987152872366404e-06, "loss": 1.0103, "step": 10992 }, { "epoch": 0.21, "learning_rate": 4.598632273408463e-06, "loss": 1.1395, "step": 10993 }, { "epoch": 0.21, "learning_rate": 4.598549251744058e-06, "loss": 0.9814, "step": 10994 }, { "epoch": 0.21, "learning_rate": 4.598466222243733e-06, "loss": 0.7169, "step": 10995 }, { "epoch": 0.21, "learning_rate": 4.5983831849078e-06, "loss": 0.8397, "step": 10996 }, { "epoch": 0.21, "learning_rate": 4.598300139736568e-06, "loss": 0.9225, "step": 10997 }, { "epoch": 0.21, "learning_rate": 4.598217086730348e-06, "loss": 0.915, "step": 10998 }, { "epoch": 0.21, "learning_rate": 4.59813402588945e-06, "loss": 1.1671, "step": 10999 }, { "epoch": 0.21, "learning_rate": 4.598050957214183e-06, "loss": 1.0745, "step": 11000 }, { "epoch": 0.21, "learning_rate": 4.597967880704859e-06, "loss": 0.9476, "step": 11001 }, { "epoch": 0.21, "learning_rate": 4.597884796361786e-06, "loss": 0.9874, "step": 11002 }, { "epoch": 0.21, "learning_rate": 4.597801704185277e-06, "loss": 0.9989, "step": 11003 }, { "epoch": 0.21, "learning_rate": 4.597718604175641e-06, "loss": 0.9103, "step": 11004 }, { "epoch": 0.21, "learning_rate": 4.597635496333187e-06, "loss": 0.9782, "step": 11005 }, { "epoch": 0.21, "learning_rate": 4.597552380658227e-06, "loss": 1.1647, "step": 11006 }, { "epoch": 0.21, "learning_rate": 4.59746925715107e-06, "loss": 0.9647, "step": 11007 }, { "epoch": 0.21, "learning_rate": 4.597386125812027e-06, "loss": 0.7872, "step": 11008 }, { "epoch": 0.21, "learning_rate": 4.597302986641409e-06, "loss": 1.0056, "step": 11009 }, { "epoch": 0.21, "learning_rate": 4.597219839639526e-06, "loss": 0.9524, "step": 11010 }, { "epoch": 0.21, "learning_rate": 4.597136684806689e-06, "loss": 1.038, "step": 11011 }, { "epoch": 0.21, "learning_rate": 4.597053522143206e-06, "loss": 1.1131, "step": 11012 }, { "epoch": 0.21, "learning_rate": 4.596970351649391e-06, "loss": 1.0654, "step": 11013 }, { "epoch": 0.21, "learning_rate": 4.596887173325553e-06, "loss": 0.9191, "step": 11014 }, { "epoch": 0.21, "learning_rate": 4.596803987172003e-06, "loss": 0.916, "step": 11015 }, { "epoch": 0.21, "learning_rate": 4.59672079318905e-06, "loss": 0.8725, "step": 11016 }, { "epoch": 0.21, "learning_rate": 4.596637591377007e-06, "loss": 0.8389, "step": 11017 }, { "epoch": 0.21, "learning_rate": 4.596554381736182e-06, "loss": 1.0181, "step": 11018 }, { "epoch": 0.21, "learning_rate": 4.596471164266888e-06, "loss": 1.0346, "step": 11019 }, { "epoch": 0.21, "learning_rate": 4.596387938969436e-06, "loss": 0.9521, "step": 11020 }, { "epoch": 0.21, "learning_rate": 4.596304705844134e-06, "loss": 0.7269, "step": 11021 }, { "epoch": 0.21, "learning_rate": 4.596221464891295e-06, "loss": 0.6609, "step": 11022 }, { "epoch": 0.21, "learning_rate": 4.59613821611123e-06, "loss": 0.8308, "step": 11023 }, { "epoch": 0.21, "learning_rate": 4.5960549595042486e-06, "loss": 1.0236, "step": 11024 }, { "epoch": 0.21, "learning_rate": 4.595971695070662e-06, "loss": 0.9135, "step": 11025 }, { "epoch": 0.21, "learning_rate": 4.595888422810782e-06, "loss": 0.7452, "step": 11026 }, { "epoch": 0.21, "learning_rate": 4.595805142724918e-06, "loss": 0.8682, "step": 11027 }, { "epoch": 0.21, "learning_rate": 4.5957218548133835e-06, "loss": 0.9605, "step": 11028 }, { "epoch": 0.21, "learning_rate": 4.5956385590764865e-06, "loss": 0.8069, "step": 11029 }, { "epoch": 0.21, "learning_rate": 4.59555525551454e-06, "loss": 1.2278, "step": 11030 }, { "epoch": 0.21, "learning_rate": 4.595471944127854e-06, "loss": 1.1512, "step": 11031 }, { "epoch": 0.21, "learning_rate": 4.59538862491674e-06, "loss": 0.8128, "step": 11032 }, { "epoch": 0.21, "learning_rate": 4.59530529788151e-06, "loss": 0.8117, "step": 11033 }, { "epoch": 0.21, "learning_rate": 4.5952219630224724e-06, "loss": 1.0644, "step": 11034 }, { "epoch": 0.21, "learning_rate": 4.595138620339942e-06, "loss": 1.0266, "step": 11035 }, { "epoch": 0.21, "learning_rate": 4.595055269834228e-06, "loss": 0.9104, "step": 11036 }, { "epoch": 0.21, "learning_rate": 4.594971911505641e-06, "loss": 1.2516, "step": 11037 }, { "epoch": 0.21, "learning_rate": 4.5948885453544936e-06, "loss": 1.0418, "step": 11038 }, { "epoch": 0.21, "learning_rate": 4.594805171381097e-06, "loss": 0.8674, "step": 11039 }, { "epoch": 0.21, "learning_rate": 4.594721789585761e-06, "loss": 1.0428, "step": 11040 }, { "epoch": 0.21, "learning_rate": 4.594638399968799e-06, "loss": 0.8911, "step": 11041 }, { "epoch": 0.21, "learning_rate": 4.5945550025305205e-06, "loss": 0.8331, "step": 11042 }, { "epoch": 0.21, "learning_rate": 4.594471597271239e-06, "loss": 1.0212, "step": 11043 }, { "epoch": 0.21, "learning_rate": 4.594388184191264e-06, "loss": 1.1144, "step": 11044 }, { "epoch": 0.21, "learning_rate": 4.594304763290908e-06, "loss": 0.9691, "step": 11045 }, { "epoch": 0.21, "learning_rate": 4.594221334570482e-06, "loss": 0.694, "step": 11046 }, { "epoch": 0.21, "learning_rate": 4.594137898030299e-06, "loss": 0.9152, "step": 11047 }, { "epoch": 0.21, "learning_rate": 4.594054453670668e-06, "loss": 0.8294, "step": 11048 }, { "epoch": 0.21, "learning_rate": 4.593971001491902e-06, "loss": 0.9608, "step": 11049 }, { "epoch": 0.21, "learning_rate": 4.593887541494313e-06, "loss": 1.1902, "step": 11050 }, { "epoch": 0.21, "learning_rate": 4.593804073678212e-06, "loss": 1.0156, "step": 11051 }, { "epoch": 0.21, "learning_rate": 4.59372059804391e-06, "loss": 0.892, "step": 11052 }, { "epoch": 0.21, "learning_rate": 4.59363711459172e-06, "loss": 0.8143, "step": 11053 }, { "epoch": 0.21, "learning_rate": 4.593553623321953e-06, "loss": 0.9034, "step": 11054 }, { "epoch": 0.21, "learning_rate": 4.593470124234921e-06, "loss": 1.1064, "step": 11055 }, { "epoch": 0.21, "learning_rate": 4.593386617330937e-06, "loss": 1.2099, "step": 11056 }, { "epoch": 0.21, "learning_rate": 4.59330310261031e-06, "loss": 0.9654, "step": 11057 }, { "epoch": 0.21, "learning_rate": 4.593219580073354e-06, "loss": 1.0338, "step": 11058 }, { "epoch": 0.21, "learning_rate": 4.59313604972038e-06, "loss": 0.8363, "step": 11059 }, { "epoch": 0.21, "learning_rate": 4.593052511551701e-06, "loss": 0.884, "step": 11060 }, { "epoch": 0.21, "learning_rate": 4.592968965567627e-06, "loss": 0.8752, "step": 11061 }, { "epoch": 0.21, "learning_rate": 4.592885411768472e-06, "loss": 0.9719, "step": 11062 }, { "epoch": 0.21, "learning_rate": 4.5928018501545454e-06, "loss": 1.042, "step": 11063 }, { "epoch": 0.21, "learning_rate": 4.5927182807261625e-06, "loss": 0.8091, "step": 11064 }, { "epoch": 0.21, "learning_rate": 4.592634703483633e-06, "loss": 0.9043, "step": 11065 }, { "epoch": 0.21, "learning_rate": 4.59255111842727e-06, "loss": 0.7873, "step": 11066 }, { "epoch": 0.21, "learning_rate": 4.592467525557385e-06, "loss": 1.0677, "step": 11067 }, { "epoch": 0.21, "learning_rate": 4.5923839248742905e-06, "loss": 0.8051, "step": 11068 }, { "epoch": 0.21, "learning_rate": 4.592300316378299e-06, "loss": 1.344, "step": 11069 }, { "epoch": 0.21, "learning_rate": 4.592216700069722e-06, "loss": 0.8418, "step": 11070 }, { "epoch": 0.21, "learning_rate": 4.592133075948872e-06, "loss": 0.9648, "step": 11071 }, { "epoch": 0.21, "learning_rate": 4.592049444016061e-06, "loss": 1.0862, "step": 11072 }, { "epoch": 0.21, "learning_rate": 4.591965804271602e-06, "loss": 0.8398, "step": 11073 }, { "epoch": 0.21, "learning_rate": 4.5918821567158065e-06, "loss": 1.0255, "step": 11074 }, { "epoch": 0.21, "learning_rate": 4.591798501348987e-06, "loss": 0.8963, "step": 11075 }, { "epoch": 0.21, "learning_rate": 4.591714838171456e-06, "loss": 1.1246, "step": 11076 }, { "epoch": 0.21, "learning_rate": 4.591631167183526e-06, "loss": 0.7879, "step": 11077 }, { "epoch": 0.21, "learning_rate": 4.5915474883855096e-06, "loss": 0.959, "step": 11078 }, { "epoch": 0.21, "learning_rate": 4.591463801777719e-06, "loss": 0.8141, "step": 11079 }, { "epoch": 0.21, "learning_rate": 4.591380107360467e-06, "loss": 0.963, "step": 11080 }, { "epoch": 0.21, "learning_rate": 4.591296405134065e-06, "loss": 1.132, "step": 11081 }, { "epoch": 0.21, "learning_rate": 4.591212695098827e-06, "loss": 1.2194, "step": 11082 }, { "epoch": 0.21, "learning_rate": 4.591128977255064e-06, "loss": 0.7576, "step": 11083 }, { "epoch": 0.21, "learning_rate": 4.5910452516030905e-06, "loss": 0.9276, "step": 11084 }, { "epoch": 0.21, "learning_rate": 4.590961518143217e-06, "loss": 0.8771, "step": 11085 }, { "epoch": 0.21, "learning_rate": 4.590877776875759e-06, "loss": 0.8571, "step": 11086 }, { "epoch": 0.21, "learning_rate": 4.590794027801027e-06, "loss": 1.0952, "step": 11087 }, { "epoch": 0.21, "learning_rate": 4.590710270919333e-06, "loss": 0.8075, "step": 11088 }, { "epoch": 0.21, "learning_rate": 4.590626506230992e-06, "loss": 0.849, "step": 11089 }, { "epoch": 0.21, "learning_rate": 4.590542733736316e-06, "loss": 0.8073, "step": 11090 }, { "epoch": 0.21, "learning_rate": 4.590458953435617e-06, "loss": 1.0077, "step": 11091 }, { "epoch": 0.21, "learning_rate": 4.5903751653292075e-06, "loss": 1.0291, "step": 11092 }, { "epoch": 0.21, "learning_rate": 4.590291369417402e-06, "loss": 1.1949, "step": 11093 }, { "epoch": 0.21, "learning_rate": 4.590207565700513e-06, "loss": 1.0293, "step": 11094 }, { "epoch": 0.21, "learning_rate": 4.590123754178853e-06, "loss": 1.0997, "step": 11095 }, { "epoch": 0.21, "learning_rate": 4.590039934852735e-06, "loss": 1.0745, "step": 11096 }, { "epoch": 0.21, "learning_rate": 4.589956107722471e-06, "loss": 0.889, "step": 11097 }, { "epoch": 0.21, "learning_rate": 4.589872272788376e-06, "loss": 0.7436, "step": 11098 }, { "epoch": 0.21, "learning_rate": 4.589788430050762e-06, "loss": 1.1467, "step": 11099 }, { "epoch": 0.21, "learning_rate": 4.589704579509942e-06, "loss": 1.0214, "step": 11100 }, { "epoch": 0.21, "learning_rate": 4.589620721166228e-06, "loss": 1.0625, "step": 11101 }, { "epoch": 0.21, "learning_rate": 4.589536855019935e-06, "loss": 0.9155, "step": 11102 }, { "epoch": 0.21, "learning_rate": 4.589452981071376e-06, "loss": 0.9228, "step": 11103 }, { "epoch": 0.21, "learning_rate": 4.589369099320863e-06, "loss": 0.75, "step": 11104 }, { "epoch": 0.21, "learning_rate": 4.589285209768711e-06, "loss": 0.8401, "step": 11105 }, { "epoch": 0.21, "learning_rate": 4.589201312415231e-06, "loss": 1.2266, "step": 11106 }, { "epoch": 0.21, "learning_rate": 4.589117407260738e-06, "loss": 0.9619, "step": 11107 }, { "epoch": 0.21, "learning_rate": 4.589033494305544e-06, "loss": 0.8748, "step": 11108 }, { "epoch": 0.21, "learning_rate": 4.588949573549963e-06, "loss": 0.8565, "step": 11109 }, { "epoch": 0.21, "learning_rate": 4.588865644994308e-06, "loss": 0.8763, "step": 11110 }, { "epoch": 0.21, "learning_rate": 4.588781708638894e-06, "loss": 0.872, "step": 11111 }, { "epoch": 0.21, "learning_rate": 4.5886977644840325e-06, "loss": 1.3042, "step": 11112 }, { "epoch": 0.21, "learning_rate": 4.588613812530037e-06, "loss": 1.062, "step": 11113 }, { "epoch": 0.21, "learning_rate": 4.588529852777223e-06, "loss": 0.792, "step": 11114 }, { "epoch": 0.21, "learning_rate": 4.5884458852259014e-06, "loss": 0.655, "step": 11115 }, { "epoch": 0.21, "learning_rate": 4.588361909876387e-06, "loss": 0.7847, "step": 11116 }, { "epoch": 0.21, "learning_rate": 4.588277926728993e-06, "loss": 0.8804, "step": 11117 }, { "epoch": 0.21, "learning_rate": 4.588193935784034e-06, "loss": 1.0475, "step": 11118 }, { "epoch": 0.21, "learning_rate": 4.588109937041822e-06, "loss": 0.9839, "step": 11119 }, { "epoch": 0.21, "learning_rate": 4.588025930502672e-06, "loss": 0.9337, "step": 11120 }, { "epoch": 0.21, "learning_rate": 4.587941916166898e-06, "loss": 0.8314, "step": 11121 }, { "epoch": 0.21, "learning_rate": 4.587857894034812e-06, "loss": 0.9773, "step": 11122 }, { "epoch": 0.21, "learning_rate": 4.587773864106728e-06, "loss": 0.934, "step": 11123 }, { "epoch": 0.21, "learning_rate": 4.587689826382962e-06, "loss": 0.9789, "step": 11124 }, { "epoch": 0.21, "learning_rate": 4.5876057808638255e-06, "loss": 1.2657, "step": 11125 }, { "epoch": 0.21, "learning_rate": 4.587521727549633e-06, "loss": 0.6607, "step": 11126 }, { "epoch": 0.21, "learning_rate": 4.587437666440698e-06, "loss": 0.9415, "step": 11127 }, { "epoch": 0.21, "learning_rate": 4.587353597537335e-06, "loss": 0.9799, "step": 11128 }, { "epoch": 0.21, "learning_rate": 4.587269520839857e-06, "loss": 0.9628, "step": 11129 }, { "epoch": 0.21, "learning_rate": 4.58718543634858e-06, "loss": 0.9982, "step": 11130 }, { "epoch": 0.21, "learning_rate": 4.587101344063816e-06, "loss": 1.2072, "step": 11131 }, { "epoch": 0.21, "learning_rate": 4.58701724398588e-06, "loss": 0.8422, "step": 11132 }, { "epoch": 0.21, "learning_rate": 4.586933136115085e-06, "loss": 0.6512, "step": 11133 }, { "epoch": 0.21, "learning_rate": 4.586849020451745e-06, "loss": 1.0555, "step": 11134 }, { "epoch": 0.21, "learning_rate": 4.5867648969961755e-06, "loss": 0.7507, "step": 11135 }, { "epoch": 0.21, "learning_rate": 4.58668076574869e-06, "loss": 0.9426, "step": 11136 }, { "epoch": 0.21, "learning_rate": 4.5865966267096015e-06, "loss": 1.2587, "step": 11137 }, { "epoch": 0.21, "learning_rate": 4.586512479879226e-06, "loss": 1.0668, "step": 11138 }, { "epoch": 0.21, "learning_rate": 4.5864283252578775e-06, "loss": 0.8701, "step": 11139 }, { "epoch": 0.21, "learning_rate": 4.5863441628458695e-06, "loss": 0.8174, "step": 11140 }, { "epoch": 0.21, "learning_rate": 4.586259992643516e-06, "loss": 0.8961, "step": 11141 }, { "epoch": 0.21, "learning_rate": 4.586175814651131e-06, "loss": 0.9, "step": 11142 }, { "epoch": 0.21, "learning_rate": 4.586091628869029e-06, "loss": 1.2019, "step": 11143 }, { "epoch": 0.21, "learning_rate": 4.586007435297527e-06, "loss": 1.0446, "step": 11144 }, { "epoch": 0.21, "learning_rate": 4.585923233936936e-06, "loss": 0.9666, "step": 11145 }, { "epoch": 0.21, "learning_rate": 4.5858390247875715e-06, "loss": 0.9594, "step": 11146 }, { "epoch": 0.21, "learning_rate": 4.585754807849748e-06, "loss": 0.8239, "step": 11147 }, { "epoch": 0.21, "learning_rate": 4.58567058312378e-06, "loss": 0.9797, "step": 11148 }, { "epoch": 0.21, "learning_rate": 4.585586350609982e-06, "loss": 1.002, "step": 11149 }, { "epoch": 0.21, "learning_rate": 4.585502110308668e-06, "loss": 0.9359, "step": 11150 }, { "epoch": 0.21, "learning_rate": 4.585417862220154e-06, "loss": 0.9614, "step": 11151 }, { "epoch": 0.21, "learning_rate": 4.5853336063447535e-06, "loss": 1.0225, "step": 11152 }, { "epoch": 0.21, "learning_rate": 4.585249342682781e-06, "loss": 0.9411, "step": 11153 }, { "epoch": 0.21, "learning_rate": 4.585165071234552e-06, "loss": 0.9402, "step": 11154 }, { "epoch": 0.21, "learning_rate": 4.58508079200038e-06, "loss": 0.8957, "step": 11155 }, { "epoch": 0.21, "learning_rate": 4.58499650498058e-06, "loss": 1.2059, "step": 11156 }, { "epoch": 0.21, "learning_rate": 4.584912210175467e-06, "loss": 0.9095, "step": 11157 }, { "epoch": 0.21, "learning_rate": 4.584827907585356e-06, "loss": 0.8426, "step": 11158 }, { "epoch": 0.21, "learning_rate": 4.584743597210561e-06, "loss": 1.0104, "step": 11159 }, { "epoch": 0.21, "learning_rate": 4.5846592790513985e-06, "loss": 1.0263, "step": 11160 }, { "epoch": 0.21, "learning_rate": 4.5845749531081816e-06, "loss": 0.8103, "step": 11161 }, { "epoch": 0.21, "learning_rate": 4.584490619381226e-06, "loss": 1.22, "step": 11162 }, { "epoch": 0.21, "learning_rate": 4.584406277870845e-06, "loss": 0.8831, "step": 11163 }, { "epoch": 0.21, "learning_rate": 4.5843219285773565e-06, "loss": 0.7843, "step": 11164 }, { "epoch": 0.21, "learning_rate": 4.584237571501073e-06, "loss": 0.8751, "step": 11165 }, { "epoch": 0.21, "learning_rate": 4.58415320664231e-06, "loss": 1.0742, "step": 11166 }, { "epoch": 0.21, "learning_rate": 4.584068834001384e-06, "loss": 1.0984, "step": 11167 }, { "epoch": 0.21, "learning_rate": 4.583984453578607e-06, "loss": 0.9277, "step": 11168 }, { "epoch": 0.21, "learning_rate": 4.583900065374298e-06, "loss": 1.1135, "step": 11169 }, { "epoch": 0.21, "learning_rate": 4.5838156693887695e-06, "loss": 0.7187, "step": 11170 }, { "epoch": 0.21, "learning_rate": 4.583731265622336e-06, "loss": 0.8237, "step": 11171 }, { "epoch": 0.21, "learning_rate": 4.583646854075315e-06, "loss": 0.95, "step": 11172 }, { "epoch": 0.21, "learning_rate": 4.58356243474802e-06, "loss": 0.7997, "step": 11173 }, { "epoch": 0.21, "learning_rate": 4.583478007640767e-06, "loss": 0.8768, "step": 11174 }, { "epoch": 0.21, "learning_rate": 4.583393572753871e-06, "loss": 1.0393, "step": 11175 }, { "epoch": 0.21, "learning_rate": 4.583309130087647e-06, "loss": 0.9624, "step": 11176 }, { "epoch": 0.21, "learning_rate": 4.583224679642412e-06, "loss": 0.8143, "step": 11177 }, { "epoch": 0.21, "learning_rate": 4.583140221418479e-06, "loss": 0.7987, "step": 11178 }, { "epoch": 0.21, "learning_rate": 4.583055755416163e-06, "loss": 1.0727, "step": 11179 }, { "epoch": 0.21, "learning_rate": 4.5829712816357816e-06, "loss": 1.0663, "step": 11180 }, { "epoch": 0.21, "learning_rate": 4.582886800077649e-06, "loss": 1.1139, "step": 11181 }, { "epoch": 0.21, "learning_rate": 4.582802310742082e-06, "loss": 1.0074, "step": 11182 }, { "epoch": 0.21, "learning_rate": 4.582717813629394e-06, "loss": 0.8178, "step": 11183 }, { "epoch": 0.21, "learning_rate": 4.582633308739902e-06, "loss": 1.2211, "step": 11184 }, { "epoch": 0.21, "learning_rate": 4.5825487960739216e-06, "loss": 0.9506, "step": 11185 }, { "epoch": 0.21, "learning_rate": 4.582464275631767e-06, "loss": 0.7174, "step": 11186 }, { "epoch": 0.21, "learning_rate": 4.582379747413755e-06, "loss": 1.0362, "step": 11187 }, { "epoch": 0.21, "learning_rate": 4.582295211420201e-06, "loss": 0.9506, "step": 11188 }, { "epoch": 0.21, "learning_rate": 4.58221066765142e-06, "loss": 0.9709, "step": 11189 }, { "epoch": 0.21, "learning_rate": 4.582126116107728e-06, "loss": 1.0003, "step": 11190 }, { "epoch": 0.21, "learning_rate": 4.582041556789441e-06, "loss": 0.9247, "step": 11191 }, { "epoch": 0.21, "learning_rate": 4.581956989696876e-06, "loss": 0.8116, "step": 11192 }, { "epoch": 0.21, "learning_rate": 4.581872414830346e-06, "loss": 1.0355, "step": 11193 }, { "epoch": 0.21, "learning_rate": 4.58178783219017e-06, "loss": 1.1712, "step": 11194 }, { "epoch": 0.21, "learning_rate": 4.5817032417766605e-06, "loss": 1.0275, "step": 11195 }, { "epoch": 0.21, "learning_rate": 4.581618643590135e-06, "loss": 1.0676, "step": 11196 }, { "epoch": 0.21, "learning_rate": 4.581534037630909e-06, "loss": 0.9996, "step": 11197 }, { "epoch": 0.21, "learning_rate": 4.5814494238993e-06, "loss": 0.9024, "step": 11198 }, { "epoch": 0.21, "learning_rate": 4.581364802395622e-06, "loss": 0.8789, "step": 11199 }, { "epoch": 0.21, "learning_rate": 4.581280173120192e-06, "loss": 1.1286, "step": 11200 }, { "epoch": 0.21, "learning_rate": 4.5811955360733244e-06, "loss": 0.7809, "step": 11201 }, { "epoch": 0.21, "learning_rate": 4.581110891255338e-06, "loss": 1.006, "step": 11202 }, { "epoch": 0.21, "learning_rate": 4.581026238666546e-06, "loss": 1.0678, "step": 11203 }, { "epoch": 0.21, "learning_rate": 4.580941578307267e-06, "loss": 1.0073, "step": 11204 }, { "epoch": 0.21, "learning_rate": 4.580856910177815e-06, "loss": 0.8325, "step": 11205 }, { "epoch": 0.21, "learning_rate": 4.580772234278508e-06, "loss": 1.1196, "step": 11206 }, { "epoch": 0.21, "learning_rate": 4.58068755060966e-06, "loss": 1.056, "step": 11207 }, { "epoch": 0.21, "learning_rate": 4.58060285917159e-06, "loss": 1.097, "step": 11208 }, { "epoch": 0.21, "learning_rate": 4.580518159964612e-06, "loss": 1.1641, "step": 11209 }, { "epoch": 0.21, "learning_rate": 4.580433452989042e-06, "loss": 0.879, "step": 11210 }, { "epoch": 0.21, "learning_rate": 4.5803487382451995e-06, "loss": 1.0306, "step": 11211 }, { "epoch": 0.21, "learning_rate": 4.580264015733397e-06, "loss": 1.0752, "step": 11212 }, { "epoch": 0.21, "learning_rate": 4.580179285453953e-06, "loss": 0.9459, "step": 11213 }, { "epoch": 0.21, "learning_rate": 4.5800945474071825e-06, "loss": 0.8752, "step": 11214 }, { "epoch": 0.21, "learning_rate": 4.580009801593404e-06, "loss": 0.9366, "step": 11215 }, { "epoch": 0.21, "learning_rate": 4.579925048012932e-06, "loss": 0.7585, "step": 11216 }, { "epoch": 0.21, "learning_rate": 4.579840286666084e-06, "loss": 0.8358, "step": 11217 }, { "epoch": 0.21, "learning_rate": 4.579755517553175e-06, "loss": 0.9629, "step": 11218 }, { "epoch": 0.21, "learning_rate": 4.579670740674524e-06, "loss": 1.1306, "step": 11219 }, { "epoch": 0.21, "learning_rate": 4.579585956030445e-06, "loss": 1.0274, "step": 11220 }, { "epoch": 0.21, "learning_rate": 4.579501163621257e-06, "loss": 0.9207, "step": 11221 }, { "epoch": 0.21, "learning_rate": 4.579416363447276e-06, "loss": 0.9673, "step": 11222 }, { "epoch": 0.21, "learning_rate": 4.579331555508817e-06, "loss": 0.9888, "step": 11223 }, { "epoch": 0.21, "learning_rate": 4.579246739806197e-06, "loss": 0.9255, "step": 11224 }, { "epoch": 0.21, "learning_rate": 4.5791619163397335e-06, "loss": 1.1492, "step": 11225 }, { "epoch": 0.21, "learning_rate": 4.579077085109745e-06, "loss": 0.7728, "step": 11226 }, { "epoch": 0.21, "learning_rate": 4.578992246116545e-06, "loss": 0.9298, "step": 11227 }, { "epoch": 0.21, "learning_rate": 4.578907399360451e-06, "loss": 1.0294, "step": 11228 }, { "epoch": 0.21, "learning_rate": 4.578822544841782e-06, "loss": 0.8713, "step": 11229 }, { "epoch": 0.21, "learning_rate": 4.578737682560853e-06, "loss": 0.8287, "step": 11230 }, { "epoch": 0.21, "learning_rate": 4.57865281251798e-06, "loss": 1.1642, "step": 11231 }, { "epoch": 0.21, "learning_rate": 4.5785679347134826e-06, "loss": 0.8953, "step": 11232 }, { "epoch": 0.21, "learning_rate": 4.578483049147676e-06, "loss": 0.8774, "step": 11233 }, { "epoch": 0.21, "learning_rate": 4.578398155820878e-06, "loss": 0.8918, "step": 11234 }, { "epoch": 0.21, "learning_rate": 4.578313254733403e-06, "loss": 0.8246, "step": 11235 }, { "epoch": 0.21, "learning_rate": 4.5782283458855715e-06, "loss": 0.8609, "step": 11236 }, { "epoch": 0.21, "learning_rate": 4.578143429277699e-06, "loss": 1.0538, "step": 11237 }, { "epoch": 0.21, "learning_rate": 4.578058504910103e-06, "loss": 0.9408, "step": 11238 }, { "epoch": 0.21, "learning_rate": 4.577973572783099e-06, "loss": 1.0348, "step": 11239 }, { "epoch": 0.21, "learning_rate": 4.577888632897006e-06, "loss": 1.084, "step": 11240 }, { "epoch": 0.21, "learning_rate": 4.5778036852521415e-06, "loss": 0.9012, "step": 11241 }, { "epoch": 0.21, "learning_rate": 4.57771872984882e-06, "loss": 1.0698, "step": 11242 }, { "epoch": 0.21, "learning_rate": 4.577633766687361e-06, "loss": 1.1168, "step": 11243 }, { "epoch": 0.21, "learning_rate": 4.5775487957680826e-06, "loss": 1.0562, "step": 11244 }, { "epoch": 0.21, "learning_rate": 4.5774638170913e-06, "loss": 0.9971, "step": 11245 }, { "epoch": 0.21, "learning_rate": 4.577378830657331e-06, "loss": 1.014, "step": 11246 }, { "epoch": 0.21, "learning_rate": 4.577293836466493e-06, "loss": 0.9772, "step": 11247 }, { "epoch": 0.21, "learning_rate": 4.577208834519104e-06, "loss": 0.9448, "step": 11248 }, { "epoch": 0.21, "learning_rate": 4.57712382481548e-06, "loss": 1.2977, "step": 11249 }, { "epoch": 0.21, "learning_rate": 4.577038807355939e-06, "loss": 1.0485, "step": 11250 }, { "epoch": 0.21, "learning_rate": 4.5769537821408e-06, "loss": 0.9902, "step": 11251 }, { "epoch": 0.21, "learning_rate": 4.576868749170379e-06, "loss": 0.7298, "step": 11252 }, { "epoch": 0.21, "learning_rate": 4.5767837084449936e-06, "loss": 0.9284, "step": 11253 }, { "epoch": 0.21, "learning_rate": 4.576698659964961e-06, "loss": 1.0089, "step": 11254 }, { "epoch": 0.21, "learning_rate": 4.5766136037306e-06, "loss": 1.1038, "step": 11255 }, { "epoch": 0.21, "learning_rate": 4.5765285397422275e-06, "loss": 1.1821, "step": 11256 }, { "epoch": 0.21, "learning_rate": 4.5764434680001606e-06, "loss": 0.8826, "step": 11257 }, { "epoch": 0.21, "learning_rate": 4.576358388504718e-06, "loss": 0.7975, "step": 11258 }, { "epoch": 0.21, "learning_rate": 4.576273301256217e-06, "loss": 0.9456, "step": 11259 }, { "epoch": 0.21, "learning_rate": 4.576188206254974e-06, "loss": 0.7687, "step": 11260 }, { "epoch": 0.21, "learning_rate": 4.576103103501309e-06, "loss": 1.0047, "step": 11261 }, { "epoch": 0.21, "learning_rate": 4.576017992995538e-06, "loss": 1.0842, "step": 11262 }, { "epoch": 0.21, "learning_rate": 4.575932874737979e-06, "loss": 0.8643, "step": 11263 }, { "epoch": 0.21, "learning_rate": 4.575847748728952e-06, "loss": 0.9495, "step": 11264 }, { "epoch": 0.21, "learning_rate": 4.5757626149687715e-06, "loss": 1.0276, "step": 11265 }, { "epoch": 0.21, "learning_rate": 4.575677473457758e-06, "loss": 1.0174, "step": 11266 }, { "epoch": 0.21, "learning_rate": 4.575592324196228e-06, "loss": 1.0768, "step": 11267 }, { "epoch": 0.21, "learning_rate": 4.575507167184501e-06, "loss": 1.1018, "step": 11268 }, { "epoch": 0.21, "learning_rate": 4.5754220024228925e-06, "loss": 1.0694, "step": 11269 }, { "epoch": 0.21, "learning_rate": 4.575336829911721e-06, "loss": 1.0277, "step": 11270 }, { "epoch": 0.21, "learning_rate": 4.575251649651308e-06, "loss": 0.7854, "step": 11271 }, { "epoch": 0.21, "learning_rate": 4.575166461641968e-06, "loss": 0.812, "step": 11272 }, { "epoch": 0.21, "learning_rate": 4.575081265884019e-06, "loss": 0.9989, "step": 11273 }, { "epoch": 0.21, "learning_rate": 4.5749960623777815e-06, "loss": 0.8486, "step": 11274 }, { "epoch": 0.21, "learning_rate": 4.574910851123572e-06, "loss": 1.0668, "step": 11275 }, { "epoch": 0.21, "learning_rate": 4.574825632121708e-06, "loss": 1.0571, "step": 11276 }, { "epoch": 0.21, "learning_rate": 4.574740405372509e-06, "loss": 0.9178, "step": 11277 }, { "epoch": 0.21, "learning_rate": 4.574655170876294e-06, "loss": 1.1017, "step": 11278 }, { "epoch": 0.21, "learning_rate": 4.57456992863338e-06, "loss": 0.9479, "step": 11279 }, { "epoch": 0.21, "learning_rate": 4.574484678644084e-06, "loss": 0.9834, "step": 11280 }, { "epoch": 0.21, "learning_rate": 4.574399420908727e-06, "loss": 1.2357, "step": 11281 }, { "epoch": 0.21, "learning_rate": 4.574314155427627e-06, "loss": 0.9955, "step": 11282 }, { "epoch": 0.21, "learning_rate": 4.574228882201101e-06, "loss": 0.9059, "step": 11283 }, { "epoch": 0.21, "learning_rate": 4.574143601229467e-06, "loss": 0.9709, "step": 11284 }, { "epoch": 0.21, "learning_rate": 4.574058312513045e-06, "loss": 1.1063, "step": 11285 }, { "epoch": 0.21, "learning_rate": 4.573973016052153e-06, "loss": 1.0331, "step": 11286 }, { "epoch": 0.21, "learning_rate": 4.573887711847109e-06, "loss": 1.1757, "step": 11287 }, { "epoch": 0.21, "learning_rate": 4.573802399898232e-06, "loss": 0.9118, "step": 11288 }, { "epoch": 0.21, "learning_rate": 4.573717080205841e-06, "loss": 0.8213, "step": 11289 }, { "epoch": 0.21, "learning_rate": 4.5736317527702525e-06, "loss": 0.9799, "step": 11290 }, { "epoch": 0.21, "learning_rate": 4.573546417591788e-06, "loss": 0.808, "step": 11291 }, { "epoch": 0.21, "learning_rate": 4.573461074670764e-06, "loss": 0.7732, "step": 11292 }, { "epoch": 0.21, "learning_rate": 4.5733757240075e-06, "loss": 1.0834, "step": 11293 }, { "epoch": 0.21, "learning_rate": 4.573290365602315e-06, "loss": 0.9949, "step": 11294 }, { "epoch": 0.21, "learning_rate": 4.573204999455527e-06, "loss": 0.944, "step": 11295 }, { "epoch": 0.21, "learning_rate": 4.573119625567456e-06, "loss": 0.6725, "step": 11296 }, { "epoch": 0.21, "learning_rate": 4.573034243938419e-06, "loss": 0.8335, "step": 11297 }, { "epoch": 0.21, "learning_rate": 4.572948854568736e-06, "loss": 1.0623, "step": 11298 }, { "epoch": 0.21, "learning_rate": 4.572863457458725e-06, "loss": 1.0365, "step": 11299 }, { "epoch": 0.21, "learning_rate": 4.572778052608706e-06, "loss": 1.1334, "step": 11300 }, { "epoch": 0.21, "learning_rate": 4.572692640018997e-06, "loss": 1.0739, "step": 11301 }, { "epoch": 0.21, "learning_rate": 4.572607219689918e-06, "loss": 0.9725, "step": 11302 }, { "epoch": 0.21, "learning_rate": 4.572521791621786e-06, "loss": 1.0006, "step": 11303 }, { "epoch": 0.21, "learning_rate": 4.572436355814922e-06, "loss": 0.9542, "step": 11304 }, { "epoch": 0.21, "learning_rate": 4.572350912269644e-06, "loss": 1.0765, "step": 11305 }, { "epoch": 0.21, "learning_rate": 4.572265460986271e-06, "loss": 1.1164, "step": 11306 }, { "epoch": 0.21, "learning_rate": 4.572180001965123e-06, "loss": 1.0289, "step": 11307 }, { "epoch": 0.21, "learning_rate": 4.572094535206517e-06, "loss": 0.9597, "step": 11308 }, { "epoch": 0.21, "learning_rate": 4.572009060710775e-06, "loss": 0.9857, "step": 11309 }, { "epoch": 0.21, "learning_rate": 4.571923578478214e-06, "loss": 1.0056, "step": 11310 }, { "epoch": 0.21, "learning_rate": 4.571838088509154e-06, "loss": 0.9825, "step": 11311 }, { "epoch": 0.21, "learning_rate": 4.571752590803914e-06, "loss": 1.1562, "step": 11312 }, { "epoch": 0.21, "learning_rate": 4.571667085362813e-06, "loss": 0.8024, "step": 11313 }, { "epoch": 0.21, "learning_rate": 4.571581572186171e-06, "loss": 1.0958, "step": 11314 }, { "epoch": 0.21, "learning_rate": 4.571496051274307e-06, "loss": 0.8744, "step": 11315 }, { "epoch": 0.21, "learning_rate": 4.571410522627541e-06, "loss": 0.913, "step": 11316 }, { "epoch": 0.21, "learning_rate": 4.5713249862461905e-06, "loss": 0.8334, "step": 11317 }, { "epoch": 0.21, "learning_rate": 4.571239442130576e-06, "loss": 1.1351, "step": 11318 }, { "epoch": 0.21, "learning_rate": 4.571153890281017e-06, "loss": 0.9432, "step": 11319 }, { "epoch": 0.21, "learning_rate": 4.5710683306978334e-06, "loss": 0.9412, "step": 11320 }, { "epoch": 0.21, "learning_rate": 4.570982763381344e-06, "loss": 0.9984, "step": 11321 }, { "epoch": 0.21, "learning_rate": 4.5708971883318685e-06, "loss": 0.9706, "step": 11322 }, { "epoch": 0.21, "learning_rate": 4.570811605549726e-06, "loss": 0.9114, "step": 11323 }, { "epoch": 0.21, "learning_rate": 4.570726015035238e-06, "loss": 1.2194, "step": 11324 }, { "epoch": 0.21, "learning_rate": 4.570640416788721e-06, "loss": 1.2216, "step": 11325 }, { "epoch": 0.21, "learning_rate": 4.5705548108104954e-06, "loss": 0.9537, "step": 11326 }, { "epoch": 0.21, "learning_rate": 4.570469197100883e-06, "loss": 0.8873, "step": 11327 }, { "epoch": 0.21, "learning_rate": 4.570383575660203e-06, "loss": 0.9673, "step": 11328 }, { "epoch": 0.21, "learning_rate": 4.570297946488772e-06, "loss": 0.7922, "step": 11329 }, { "epoch": 0.21, "learning_rate": 4.570212309586913e-06, "loss": 0.9739, "step": 11330 }, { "epoch": 0.21, "learning_rate": 4.570126664954945e-06, "loss": 0.7874, "step": 11331 }, { "epoch": 0.21, "learning_rate": 4.570041012593187e-06, "loss": 0.9059, "step": 11332 }, { "epoch": 0.21, "learning_rate": 4.5699553525019595e-06, "loss": 0.8585, "step": 11333 }, { "epoch": 0.21, "learning_rate": 4.569869684681582e-06, "loss": 0.9801, "step": 11334 }, { "epoch": 0.21, "learning_rate": 4.569784009132374e-06, "loss": 1.1434, "step": 11335 }, { "epoch": 0.21, "learning_rate": 4.5696983258546565e-06, "loss": 0.9656, "step": 11336 }, { "epoch": 0.21, "learning_rate": 4.56961263484875e-06, "loss": 1.0816, "step": 11337 }, { "epoch": 0.21, "learning_rate": 4.5695269361149715e-06, "loss": 1.0716, "step": 11338 }, { "epoch": 0.21, "learning_rate": 4.569441229653644e-06, "loss": 0.8444, "step": 11339 }, { "epoch": 0.21, "learning_rate": 4.569355515465087e-06, "loss": 1.0349, "step": 11340 }, { "epoch": 0.21, "learning_rate": 4.569269793549619e-06, "loss": 0.9636, "step": 11341 }, { "epoch": 0.21, "learning_rate": 4.569184063907562e-06, "loss": 0.9433, "step": 11342 }, { "epoch": 0.21, "learning_rate": 4.569098326539233e-06, "loss": 1.3171, "step": 11343 }, { "epoch": 0.21, "learning_rate": 4.569012581444956e-06, "loss": 1.1054, "step": 11344 }, { "epoch": 0.21, "learning_rate": 4.568926828625048e-06, "loss": 0.8889, "step": 11345 }, { "epoch": 0.21, "learning_rate": 4.5688410680798325e-06, "loss": 0.9373, "step": 11346 }, { "epoch": 0.21, "learning_rate": 4.568755299809627e-06, "loss": 0.8421, "step": 11347 }, { "epoch": 0.21, "learning_rate": 4.568669523814753e-06, "loss": 0.8505, "step": 11348 }, { "epoch": 0.21, "learning_rate": 4.5685837400955306e-06, "loss": 0.8931, "step": 11349 }, { "epoch": 0.21, "learning_rate": 4.56849794865228e-06, "loss": 1.1017, "step": 11350 }, { "epoch": 0.21, "learning_rate": 4.56841214948532e-06, "loss": 1.0003, "step": 11351 }, { "epoch": 0.21, "learning_rate": 4.568326342594975e-06, "loss": 1.0233, "step": 11352 }, { "epoch": 0.21, "learning_rate": 4.56824052798156e-06, "loss": 0.7785, "step": 11353 }, { "epoch": 0.21, "learning_rate": 4.5681547056454e-06, "loss": 0.8885, "step": 11354 }, { "epoch": 0.21, "learning_rate": 4.568068875586814e-06, "loss": 1.0077, "step": 11355 }, { "epoch": 0.21, "learning_rate": 4.567983037806121e-06, "loss": 1.0157, "step": 11356 }, { "epoch": 0.21, "learning_rate": 4.5678971923036434e-06, "loss": 0.9887, "step": 11357 }, { "epoch": 0.21, "learning_rate": 4.567811339079701e-06, "loss": 1.0713, "step": 11358 }, { "epoch": 0.21, "learning_rate": 4.5677254781346145e-06, "loss": 0.8603, "step": 11359 }, { "epoch": 0.21, "learning_rate": 4.567639609468705e-06, "loss": 0.804, "step": 11360 }, { "epoch": 0.21, "learning_rate": 4.567553733082292e-06, "loss": 0.8558, "step": 11361 }, { "epoch": 0.21, "learning_rate": 4.5674678489756966e-06, "loss": 1.0892, "step": 11362 }, { "epoch": 0.21, "learning_rate": 4.56738195714924e-06, "loss": 1.1705, "step": 11363 }, { "epoch": 0.21, "learning_rate": 4.567296057603242e-06, "loss": 0.9773, "step": 11364 }, { "epoch": 0.21, "learning_rate": 4.567210150338024e-06, "loss": 1.0998, "step": 11365 }, { "epoch": 0.21, "learning_rate": 4.567124235353907e-06, "loss": 0.8615, "step": 11366 }, { "epoch": 0.21, "learning_rate": 4.567038312651212e-06, "loss": 0.8394, "step": 11367 }, { "epoch": 0.21, "learning_rate": 4.566952382230258e-06, "loss": 0.9934, "step": 11368 }, { "epoch": 0.21, "learning_rate": 4.566866444091369e-06, "loss": 1.1481, "step": 11369 }, { "epoch": 0.21, "learning_rate": 4.566780498234863e-06, "loss": 0.8901, "step": 11370 }, { "epoch": 0.21, "learning_rate": 4.566694544661061e-06, "loss": 0.9045, "step": 11371 }, { "epoch": 0.21, "learning_rate": 4.566608583370286e-06, "loss": 0.8852, "step": 11372 }, { "epoch": 0.21, "learning_rate": 4.566522614362858e-06, "loss": 0.8909, "step": 11373 }, { "epoch": 0.21, "learning_rate": 4.566436637639098e-06, "loss": 1.1398, "step": 11374 }, { "epoch": 0.21, "learning_rate": 4.566350653199327e-06, "loss": 0.9816, "step": 11375 }, { "epoch": 0.21, "learning_rate": 4.5662646610438655e-06, "loss": 1.072, "step": 11376 }, { "epoch": 0.21, "learning_rate": 4.566178661173035e-06, "loss": 0.7078, "step": 11377 }, { "epoch": 0.21, "learning_rate": 4.566092653587158e-06, "loss": 0.7284, "step": 11378 }, { "epoch": 0.21, "learning_rate": 4.5660066382865535e-06, "loss": 0.8467, "step": 11379 }, { "epoch": 0.21, "learning_rate": 4.565920615271543e-06, "loss": 1.1113, "step": 11380 }, { "epoch": 0.21, "learning_rate": 4.565834584542449e-06, "loss": 1.1963, "step": 11381 }, { "epoch": 0.21, "learning_rate": 4.565748546099592e-06, "loss": 0.9438, "step": 11382 }, { "epoch": 0.21, "learning_rate": 4.565662499943293e-06, "loss": 0.9759, "step": 11383 }, { "epoch": 0.21, "learning_rate": 4.565576446073874e-06, "loss": 0.9536, "step": 11384 }, { "epoch": 0.21, "learning_rate": 4.565490384491656e-06, "loss": 0.8894, "step": 11385 }, { "epoch": 0.21, "learning_rate": 4.565404315196958e-06, "loss": 1.007, "step": 11386 }, { "epoch": 0.21, "learning_rate": 4.565318238190106e-06, "loss": 1.1268, "step": 11387 }, { "epoch": 0.21, "learning_rate": 4.565232153471419e-06, "loss": 1.1805, "step": 11388 }, { "epoch": 0.21, "learning_rate": 4.565146061041217e-06, "loss": 0.9422, "step": 11389 }, { "epoch": 0.21, "learning_rate": 4.5650599608998244e-06, "loss": 0.9199, "step": 11390 }, { "epoch": 0.21, "learning_rate": 4.56497385304756e-06, "loss": 0.9588, "step": 11391 }, { "epoch": 0.21, "learning_rate": 4.564887737484748e-06, "loss": 0.8156, "step": 11392 }, { "epoch": 0.21, "learning_rate": 4.564801614211707e-06, "loss": 1.0018, "step": 11393 }, { "epoch": 0.21, "learning_rate": 4.564715483228761e-06, "loss": 1.1155, "step": 11394 }, { "epoch": 0.21, "learning_rate": 4.56462934453623e-06, "loss": 0.8907, "step": 11395 }, { "epoch": 0.22, "learning_rate": 4.564543198134437e-06, "loss": 0.8936, "step": 11396 }, { "epoch": 0.22, "learning_rate": 4.564457044023702e-06, "loss": 0.9385, "step": 11397 }, { "epoch": 0.22, "learning_rate": 4.564370882204349e-06, "loss": 0.8223, "step": 11398 }, { "epoch": 0.22, "learning_rate": 4.564284712676698e-06, "loss": 1.0094, "step": 11399 }, { "epoch": 0.22, "learning_rate": 4.564198535441071e-06, "loss": 0.998, "step": 11400 }, { "epoch": 0.22, "learning_rate": 4.5641123504977904e-06, "loss": 1.0753, "step": 11401 }, { "epoch": 0.22, "learning_rate": 4.564026157847177e-06, "loss": 0.7781, "step": 11402 }, { "epoch": 0.22, "learning_rate": 4.563939957489553e-06, "loss": 0.8563, "step": 11403 }, { "epoch": 0.22, "learning_rate": 4.563853749425241e-06, "loss": 1.1046, "step": 11404 }, { "epoch": 0.22, "learning_rate": 4.563767533654563e-06, "loss": 0.9865, "step": 11405 }, { "epoch": 0.22, "learning_rate": 4.563681310177839e-06, "loss": 1.2646, "step": 11406 }, { "epoch": 0.22, "learning_rate": 4.563595078995392e-06, "loss": 1.0418, "step": 11407 }, { "epoch": 0.22, "learning_rate": 4.5635088401075455e-06, "loss": 1.0527, "step": 11408 }, { "epoch": 0.22, "learning_rate": 4.5634225935146194e-06, "loss": 0.8752, "step": 11409 }, { "epoch": 0.22, "learning_rate": 4.563336339216937e-06, "loss": 1.0107, "step": 11410 }, { "epoch": 0.22, "learning_rate": 4.56325007721482e-06, "loss": 0.8222, "step": 11411 }, { "epoch": 0.22, "learning_rate": 4.56316380750859e-06, "loss": 1.0087, "step": 11412 }, { "epoch": 0.22, "learning_rate": 4.563077530098571e-06, "loss": 1.128, "step": 11413 }, { "epoch": 0.22, "learning_rate": 4.5629912449850826e-06, "loss": 0.8546, "step": 11414 }, { "epoch": 0.22, "learning_rate": 4.562904952168449e-06, "loss": 0.8348, "step": 11415 }, { "epoch": 0.22, "learning_rate": 4.5628186516489905e-06, "loss": 0.8415, "step": 11416 }, { "epoch": 0.22, "learning_rate": 4.562732343427031e-06, "loss": 0.8827, "step": 11417 }, { "epoch": 0.22, "learning_rate": 4.5626460275028914e-06, "loss": 0.8625, "step": 11418 }, { "epoch": 0.22, "learning_rate": 4.562559703876895e-06, "loss": 1.1439, "step": 11419 }, { "epoch": 0.22, "learning_rate": 4.5624733725493656e-06, "loss": 0.8578, "step": 11420 }, { "epoch": 0.22, "learning_rate": 4.5623870335206225e-06, "loss": 0.8365, "step": 11421 }, { "epoch": 0.22, "learning_rate": 4.5623006867909895e-06, "loss": 0.9632, "step": 11422 }, { "epoch": 0.22, "learning_rate": 4.562214332360788e-06, "loss": 0.8474, "step": 11423 }, { "epoch": 0.22, "learning_rate": 4.5621279702303425e-06, "loss": 1.0447, "step": 11424 }, { "epoch": 0.22, "learning_rate": 4.562041600399975e-06, "loss": 1.01, "step": 11425 }, { "epoch": 0.22, "learning_rate": 4.561955222870006e-06, "loss": 1.0031, "step": 11426 }, { "epoch": 0.22, "learning_rate": 4.56186883764076e-06, "loss": 1.0401, "step": 11427 }, { "epoch": 0.22, "learning_rate": 4.561782444712559e-06, "loss": 1.0915, "step": 11428 }, { "epoch": 0.22, "learning_rate": 4.561696044085726e-06, "loss": 0.8707, "step": 11429 }, { "epoch": 0.22, "learning_rate": 4.561609635760582e-06, "loss": 1.0349, "step": 11430 }, { "epoch": 0.22, "learning_rate": 4.561523219737452e-06, "loss": 1.121, "step": 11431 }, { "epoch": 0.22, "learning_rate": 4.561436796016657e-06, "loss": 0.9498, "step": 11432 }, { "epoch": 0.22, "learning_rate": 4.56135036459852e-06, "loss": 0.9224, "step": 11433 }, { "epoch": 0.22, "learning_rate": 4.561263925483365e-06, "loss": 0.8121, "step": 11434 }, { "epoch": 0.22, "learning_rate": 4.561177478671513e-06, "loss": 0.8722, "step": 11435 }, { "epoch": 0.22, "learning_rate": 4.5610910241632875e-06, "loss": 0.8719, "step": 11436 }, { "epoch": 0.22, "learning_rate": 4.561004561959011e-06, "loss": 0.9658, "step": 11437 }, { "epoch": 0.22, "learning_rate": 4.560918092059007e-06, "loss": 0.9241, "step": 11438 }, { "epoch": 0.22, "learning_rate": 4.560831614463597e-06, "loss": 0.928, "step": 11439 }, { "epoch": 0.22, "learning_rate": 4.560745129173106e-06, "loss": 0.9786, "step": 11440 }, { "epoch": 0.22, "learning_rate": 4.560658636187857e-06, "loss": 0.9204, "step": 11441 }, { "epoch": 0.22, "learning_rate": 4.56057213550817e-06, "loss": 1.0915, "step": 11442 }, { "epoch": 0.22, "learning_rate": 4.56048562713437e-06, "loss": 1.0912, "step": 11443 }, { "epoch": 0.22, "learning_rate": 4.560399111066781e-06, "loss": 1.0783, "step": 11444 }, { "epoch": 0.22, "learning_rate": 4.560312587305724e-06, "loss": 0.9832, "step": 11445 }, { "epoch": 0.22, "learning_rate": 4.560226055851523e-06, "loss": 0.9564, "step": 11446 }, { "epoch": 0.22, "learning_rate": 4.560139516704501e-06, "loss": 1.0278, "step": 11447 }, { "epoch": 0.22, "learning_rate": 4.560052969864982e-06, "loss": 0.9348, "step": 11448 }, { "epoch": 0.22, "learning_rate": 4.559966415333288e-06, "loss": 0.9917, "step": 11449 }, { "epoch": 0.22, "learning_rate": 4.559879853109742e-06, "loss": 1.1711, "step": 11450 }, { "epoch": 0.22, "learning_rate": 4.559793283194668e-06, "loss": 1.15, "step": 11451 }, { "epoch": 0.22, "learning_rate": 4.5597067055883895e-06, "loss": 0.9521, "step": 11452 }, { "epoch": 0.22, "learning_rate": 4.559620120291229e-06, "loss": 0.8834, "step": 11453 }, { "epoch": 0.22, "learning_rate": 4.55953352730351e-06, "loss": 0.9293, "step": 11454 }, { "epoch": 0.22, "learning_rate": 4.559446926625556e-06, "loss": 1.0478, "step": 11455 }, { "epoch": 0.22, "learning_rate": 4.5593603182576905e-06, "loss": 1.184, "step": 11456 }, { "epoch": 0.22, "learning_rate": 4.559273702200236e-06, "loss": 1.0327, "step": 11457 }, { "epoch": 0.22, "learning_rate": 4.559187078453518e-06, "loss": 0.9561, "step": 11458 }, { "epoch": 0.22, "learning_rate": 4.559100447017858e-06, "loss": 0.8416, "step": 11459 }, { "epoch": 0.22, "learning_rate": 4.55901380789358e-06, "loss": 0.9178, "step": 11460 }, { "epoch": 0.22, "learning_rate": 4.558927161081007e-06, "loss": 1.0211, "step": 11461 }, { "epoch": 0.22, "learning_rate": 4.558840506580464e-06, "loss": 1.0397, "step": 11462 }, { "epoch": 0.22, "learning_rate": 4.558753844392273e-06, "loss": 1.0107, "step": 11463 }, { "epoch": 0.22, "learning_rate": 4.5586671745167585e-06, "loss": 0.8574, "step": 11464 }, { "epoch": 0.22, "learning_rate": 4.558580496954244e-06, "loss": 0.798, "step": 11465 }, { "epoch": 0.22, "learning_rate": 4.558493811705053e-06, "loss": 0.8566, "step": 11466 }, { "epoch": 0.22, "learning_rate": 4.558407118769509e-06, "loss": 0.9469, "step": 11467 }, { "epoch": 0.22, "learning_rate": 4.558320418147935e-06, "loss": 0.9765, "step": 11468 }, { "epoch": 0.22, "learning_rate": 4.558233709840657e-06, "loss": 1.0517, "step": 11469 }, { "epoch": 0.22, "learning_rate": 4.558146993847998e-06, "loss": 0.9178, "step": 11470 }, { "epoch": 0.22, "learning_rate": 4.55806027017028e-06, "loss": 0.7473, "step": 11471 }, { "epoch": 0.22, "learning_rate": 4.557973538807829e-06, "loss": 1.1473, "step": 11472 }, { "epoch": 0.22, "learning_rate": 4.557886799760967e-06, "loss": 0.795, "step": 11473 }, { "epoch": 0.22, "learning_rate": 4.55780005303002e-06, "loss": 0.9792, "step": 11474 }, { "epoch": 0.22, "learning_rate": 4.5577132986153095e-06, "loss": 1.2543, "step": 11475 }, { "epoch": 0.22, "learning_rate": 4.557626536517161e-06, "loss": 0.7434, "step": 11476 }, { "epoch": 0.22, "learning_rate": 4.557539766735898e-06, "loss": 0.7624, "step": 11477 }, { "epoch": 0.22, "learning_rate": 4.557452989271845e-06, "loss": 0.844, "step": 11478 }, { "epoch": 0.22, "learning_rate": 4.557366204125325e-06, "loss": 0.9006, "step": 11479 }, { "epoch": 0.22, "learning_rate": 4.557279411296663e-06, "loss": 1.0992, "step": 11480 }, { "epoch": 0.22, "learning_rate": 4.557192610786182e-06, "loss": 0.9879, "step": 11481 }, { "epoch": 0.22, "learning_rate": 4.5571058025942085e-06, "loss": 1.1309, "step": 11482 }, { "epoch": 0.22, "learning_rate": 4.557018986721064e-06, "loss": 0.864, "step": 11483 }, { "epoch": 0.22, "learning_rate": 4.556932163167074e-06, "loss": 0.8687, "step": 11484 }, { "epoch": 0.22, "learning_rate": 4.556845331932562e-06, "loss": 0.973, "step": 11485 }, { "epoch": 0.22, "learning_rate": 4.556758493017852e-06, "loss": 0.955, "step": 11486 }, { "epoch": 0.22, "learning_rate": 4.556671646423271e-06, "loss": 1.0195, "step": 11487 }, { "epoch": 0.22, "learning_rate": 4.556584792149139e-06, "loss": 1.0211, "step": 11488 }, { "epoch": 0.22, "learning_rate": 4.556497930195783e-06, "loss": 0.9186, "step": 11489 }, { "epoch": 0.22, "learning_rate": 4.556411060563527e-06, "loss": 0.8569, "step": 11490 }, { "epoch": 0.22, "learning_rate": 4.556324183252695e-06, "loss": 0.8327, "step": 11491 }, { "epoch": 0.22, "learning_rate": 4.556237298263612e-06, "loss": 0.6861, "step": 11492 }, { "epoch": 0.22, "learning_rate": 4.556150405596601e-06, "loss": 0.8228, "step": 11493 }, { "epoch": 0.22, "learning_rate": 4.5560635052519884e-06, "loss": 1.0284, "step": 11494 }, { "epoch": 0.22, "learning_rate": 4.555976597230097e-06, "loss": 1.0624, "step": 11495 }, { "epoch": 0.22, "learning_rate": 4.555889681531252e-06, "loss": 0.8589, "step": 11496 }, { "epoch": 0.22, "learning_rate": 4.555802758155779e-06, "loss": 0.8472, "step": 11497 }, { "epoch": 0.22, "learning_rate": 4.5557158271040014e-06, "loss": 1.0587, "step": 11498 }, { "epoch": 0.22, "learning_rate": 4.5556288883762425e-06, "loss": 1.0515, "step": 11499 }, { "epoch": 0.22, "learning_rate": 4.5555419419728295e-06, "loss": 0.9291, "step": 11500 }, { "epoch": 0.22, "learning_rate": 4.555454987894086e-06, "loss": 0.9932, "step": 11501 }, { "epoch": 0.22, "learning_rate": 4.555368026140337e-06, "loss": 0.9023, "step": 11502 }, { "epoch": 0.22, "learning_rate": 4.555281056711905e-06, "loss": 1.0832, "step": 11503 }, { "epoch": 0.22, "learning_rate": 4.555194079609118e-06, "loss": 1.0562, "step": 11504 }, { "epoch": 0.22, "learning_rate": 4.555107094832299e-06, "loss": 0.9688, "step": 11505 }, { "epoch": 0.22, "learning_rate": 4.555020102381773e-06, "loss": 1.2516, "step": 11506 }, { "epoch": 0.22, "learning_rate": 4.554933102257865e-06, "loss": 1.136, "step": 11507 }, { "epoch": 0.22, "learning_rate": 4.5548460944609e-06, "loss": 0.9082, "step": 11508 }, { "epoch": 0.22, "learning_rate": 4.554759078991202e-06, "loss": 0.8372, "step": 11509 }, { "epoch": 0.22, "learning_rate": 4.554672055849098e-06, "loss": 0.9784, "step": 11510 }, { "epoch": 0.22, "learning_rate": 4.55458502503491e-06, "loss": 0.817, "step": 11511 }, { "epoch": 0.22, "learning_rate": 4.554497986548966e-06, "loss": 1.2504, "step": 11512 }, { "epoch": 0.22, "learning_rate": 4.554410940391588e-06, "loss": 1.2085, "step": 11513 }, { "epoch": 0.22, "learning_rate": 4.5543238865631035e-06, "loss": 0.9373, "step": 11514 }, { "epoch": 0.22, "learning_rate": 4.554236825063836e-06, "loss": 1.0616, "step": 11515 }, { "epoch": 0.22, "learning_rate": 4.554149755894111e-06, "loss": 1.0076, "step": 11516 }, { "epoch": 0.22, "learning_rate": 4.554062679054255e-06, "loss": 0.8387, "step": 11517 }, { "epoch": 0.22, "learning_rate": 4.5539755945445915e-06, "loss": 1.0686, "step": 11518 }, { "epoch": 0.22, "learning_rate": 4.553888502365445e-06, "loss": 1.0291, "step": 11519 }, { "epoch": 0.22, "learning_rate": 4.5538014025171425e-06, "loss": 1.0262, "step": 11520 }, { "epoch": 0.22, "learning_rate": 4.553714295000009e-06, "loss": 0.9579, "step": 11521 }, { "epoch": 0.22, "learning_rate": 4.553627179814369e-06, "loss": 0.7912, "step": 11522 }, { "epoch": 0.22, "learning_rate": 4.553540056960548e-06, "loss": 0.8301, "step": 11523 }, { "epoch": 0.22, "learning_rate": 4.553452926438872e-06, "loss": 1.0026, "step": 11524 }, { "epoch": 0.22, "learning_rate": 4.553365788249665e-06, "loss": 1.3665, "step": 11525 }, { "epoch": 0.22, "learning_rate": 4.553278642393253e-06, "loss": 0.9688, "step": 11526 }, { "epoch": 0.22, "learning_rate": 4.553191488869962e-06, "loss": 0.9796, "step": 11527 }, { "epoch": 0.22, "learning_rate": 4.553104327680116e-06, "loss": 0.688, "step": 11528 }, { "epoch": 0.22, "learning_rate": 4.553017158824043e-06, "loss": 0.8405, "step": 11529 }, { "epoch": 0.22, "learning_rate": 4.552929982302065e-06, "loss": 0.9346, "step": 11530 }, { "epoch": 0.22, "learning_rate": 4.552842798114511e-06, "loss": 0.9791, "step": 11531 }, { "epoch": 0.22, "learning_rate": 4.552755606261704e-06, "loss": 1.0632, "step": 11532 }, { "epoch": 0.22, "learning_rate": 4.5526684067439715e-06, "loss": 1.0042, "step": 11533 }, { "epoch": 0.22, "learning_rate": 4.552581199561637e-06, "loss": 0.7203, "step": 11534 }, { "epoch": 0.22, "learning_rate": 4.552493984715027e-06, "loss": 0.7827, "step": 11535 }, { "epoch": 0.22, "learning_rate": 4.552406762204469e-06, "loss": 1.0104, "step": 11536 }, { "epoch": 0.22, "learning_rate": 4.552319532030286e-06, "loss": 1.1628, "step": 11537 }, { "epoch": 0.22, "learning_rate": 4.552232294192805e-06, "loss": 0.8778, "step": 11538 }, { "epoch": 0.22, "learning_rate": 4.552145048692351e-06, "loss": 0.9644, "step": 11539 }, { "epoch": 0.22, "learning_rate": 4.552057795529251e-06, "loss": 0.9346, "step": 11540 }, { "epoch": 0.22, "learning_rate": 4.55197053470383e-06, "loss": 0.8724, "step": 11541 }, { "epoch": 0.22, "learning_rate": 4.551883266216414e-06, "loss": 0.8359, "step": 11542 }, { "epoch": 0.22, "learning_rate": 4.551795990067328e-06, "loss": 1.1657, "step": 11543 }, { "epoch": 0.22, "learning_rate": 4.551708706256899e-06, "loss": 1.1746, "step": 11544 }, { "epoch": 0.22, "learning_rate": 4.551621414785453e-06, "loss": 1.0129, "step": 11545 }, { "epoch": 0.22, "learning_rate": 4.551534115653315e-06, "loss": 1.0063, "step": 11546 }, { "epoch": 0.22, "learning_rate": 4.551446808860813e-06, "loss": 0.9017, "step": 11547 }, { "epoch": 0.22, "learning_rate": 4.55135949440827e-06, "loss": 0.8516, "step": 11548 }, { "epoch": 0.22, "learning_rate": 4.551272172296014e-06, "loss": 1.0878, "step": 11549 }, { "epoch": 0.22, "learning_rate": 4.551184842524371e-06, "loss": 1.231, "step": 11550 }, { "epoch": 0.22, "learning_rate": 4.551097505093666e-06, "loss": 0.9411, "step": 11551 }, { "epoch": 0.22, "learning_rate": 4.5510101600042256e-06, "loss": 0.9077, "step": 11552 }, { "epoch": 0.22, "learning_rate": 4.5509228072563776e-06, "loss": 0.9785, "step": 11553 }, { "epoch": 0.22, "learning_rate": 4.550835446850445e-06, "loss": 0.9132, "step": 11554 }, { "epoch": 0.22, "learning_rate": 4.550748078786756e-06, "loss": 1.0828, "step": 11555 }, { "epoch": 0.22, "learning_rate": 4.550660703065638e-06, "loss": 1.1524, "step": 11556 }, { "epoch": 0.22, "learning_rate": 4.550573319687415e-06, "loss": 0.9655, "step": 11557 }, { "epoch": 0.22, "learning_rate": 4.550485928652414e-06, "loss": 1.0019, "step": 11558 }, { "epoch": 0.22, "learning_rate": 4.550398529960961e-06, "loss": 0.9495, "step": 11559 }, { "epoch": 0.22, "learning_rate": 4.550311123613383e-06, "loss": 0.9352, "step": 11560 }, { "epoch": 0.22, "learning_rate": 4.5502237096100064e-06, "loss": 0.8673, "step": 11561 }, { "epoch": 0.22, "learning_rate": 4.550136287951157e-06, "loss": 1.0776, "step": 11562 }, { "epoch": 0.22, "learning_rate": 4.5500488586371615e-06, "loss": 1.1212, "step": 11563 }, { "epoch": 0.22, "learning_rate": 4.5499614216683465e-06, "loss": 0.9211, "step": 11564 }, { "epoch": 0.22, "learning_rate": 4.549873977045039e-06, "loss": 0.8196, "step": 11565 }, { "epoch": 0.22, "learning_rate": 4.549786524767564e-06, "loss": 0.9502, "step": 11566 }, { "epoch": 0.22, "learning_rate": 4.549699064836249e-06, "loss": 1.0387, "step": 11567 }, { "epoch": 0.22, "learning_rate": 4.5496115972514215e-06, "loss": 1.1818, "step": 11568 }, { "epoch": 0.22, "learning_rate": 4.549524122013407e-06, "loss": 1.1241, "step": 11569 }, { "epoch": 0.22, "learning_rate": 4.549436639122532e-06, "loss": 0.9183, "step": 11570 }, { "epoch": 0.22, "learning_rate": 4.549349148579123e-06, "loss": 0.9168, "step": 11571 }, { "epoch": 0.22, "learning_rate": 4.549261650383507e-06, "loss": 0.9111, "step": 11572 }, { "epoch": 0.22, "learning_rate": 4.5491741445360116e-06, "loss": 1.1042, "step": 11573 }, { "epoch": 0.22, "learning_rate": 4.549086631036962e-06, "loss": 1.1215, "step": 11574 }, { "epoch": 0.22, "learning_rate": 4.548999109886687e-06, "loss": 1.068, "step": 11575 }, { "epoch": 0.22, "learning_rate": 4.5489115810855115e-06, "loss": 0.929, "step": 11576 }, { "epoch": 0.22, "learning_rate": 4.548824044633762e-06, "loss": 0.9628, "step": 11577 }, { "epoch": 0.22, "learning_rate": 4.548736500531767e-06, "loss": 0.9532, "step": 11578 }, { "epoch": 0.22, "learning_rate": 4.548648948779853e-06, "loss": 0.9951, "step": 11579 }, { "epoch": 0.22, "learning_rate": 4.548561389378346e-06, "loss": 1.017, "step": 11580 }, { "epoch": 0.22, "learning_rate": 4.548473822327575e-06, "loss": 1.1321, "step": 11581 }, { "epoch": 0.22, "learning_rate": 4.548386247627864e-06, "loss": 0.881, "step": 11582 }, { "epoch": 0.22, "learning_rate": 4.548298665279543e-06, "loss": 0.8253, "step": 11583 }, { "epoch": 0.22, "learning_rate": 4.548211075282936e-06, "loss": 0.8092, "step": 11584 }, { "epoch": 0.22, "learning_rate": 4.548123477638372e-06, "loss": 0.8486, "step": 11585 }, { "epoch": 0.22, "learning_rate": 4.548035872346178e-06, "loss": 0.8506, "step": 11586 }, { "epoch": 0.22, "learning_rate": 4.547948259406682e-06, "loss": 1.1577, "step": 11587 }, { "epoch": 0.22, "learning_rate": 4.547860638820208e-06, "loss": 0.9972, "step": 11588 }, { "epoch": 0.22, "learning_rate": 4.547773010587086e-06, "loss": 1.024, "step": 11589 }, { "epoch": 0.22, "learning_rate": 4.547685374707643e-06, "loss": 0.7729, "step": 11590 }, { "epoch": 0.22, "learning_rate": 4.547597731182205e-06, "loss": 1.0576, "step": 11591 }, { "epoch": 0.22, "learning_rate": 4.5475100800111e-06, "loss": 0.9919, "step": 11592 }, { "epoch": 0.22, "learning_rate": 4.547422421194655e-06, "loss": 0.8699, "step": 11593 }, { "epoch": 0.22, "learning_rate": 4.547334754733198e-06, "loss": 1.0409, "step": 11594 }, { "epoch": 0.22, "learning_rate": 4.547247080627055e-06, "loss": 0.9845, "step": 11595 }, { "epoch": 0.22, "learning_rate": 4.547159398876554e-06, "loss": 1.0115, "step": 11596 }, { "epoch": 0.22, "learning_rate": 4.547071709482023e-06, "loss": 1.0745, "step": 11597 }, { "epoch": 0.22, "learning_rate": 4.546984012443789e-06, "loss": 0.7584, "step": 11598 }, { "epoch": 0.22, "learning_rate": 4.5468963077621805e-06, "loss": 0.9719, "step": 11599 }, { "epoch": 0.22, "learning_rate": 4.546808595437523e-06, "loss": 0.9951, "step": 11600 }, { "epoch": 0.22, "learning_rate": 4.546720875470144e-06, "loss": 0.9954, "step": 11601 }, { "epoch": 0.22, "learning_rate": 4.546633147860373e-06, "loss": 0.9272, "step": 11602 }, { "epoch": 0.22, "learning_rate": 4.546545412608538e-06, "loss": 0.9969, "step": 11603 }, { "epoch": 0.22, "learning_rate": 4.546457669714963e-06, "loss": 0.7716, "step": 11604 }, { "epoch": 0.22, "learning_rate": 4.5463699191799785e-06, "loss": 0.9355, "step": 11605 }, { "epoch": 0.22, "learning_rate": 4.546282161003911e-06, "loss": 1.0714, "step": 11606 }, { "epoch": 0.22, "learning_rate": 4.546194395187089e-06, "loss": 0.9183, "step": 11607 }, { "epoch": 0.22, "learning_rate": 4.54610662172984e-06, "loss": 0.9076, "step": 11608 }, { "epoch": 0.22, "learning_rate": 4.546018840632492e-06, "loss": 0.7271, "step": 11609 }, { "epoch": 0.22, "learning_rate": 4.545931051895372e-06, "loss": 0.9232, "step": 11610 }, { "epoch": 0.22, "learning_rate": 4.545843255518808e-06, "loss": 0.8861, "step": 11611 }, { "epoch": 0.22, "learning_rate": 4.545755451503128e-06, "loss": 1.0055, "step": 11612 }, { "epoch": 0.22, "learning_rate": 4.5456676398486605e-06, "loss": 0.9366, "step": 11613 }, { "epoch": 0.22, "learning_rate": 4.545579820555733e-06, "loss": 0.9671, "step": 11614 }, { "epoch": 0.22, "learning_rate": 4.5454919936246716e-06, "loss": 0.9672, "step": 11615 }, { "epoch": 0.22, "learning_rate": 4.545404159055807e-06, "loss": 0.9126, "step": 11616 }, { "epoch": 0.22, "learning_rate": 4.5453163168494654e-06, "loss": 0.8747, "step": 11617 }, { "epoch": 0.22, "learning_rate": 4.545228467005975e-06, "loss": 1.2264, "step": 11618 }, { "epoch": 0.22, "learning_rate": 4.545140609525665e-06, "loss": 1.2068, "step": 11619 }, { "epoch": 0.22, "learning_rate": 4.545052744408863e-06, "loss": 0.9349, "step": 11620 }, { "epoch": 0.22, "learning_rate": 4.5449648716558956e-06, "loss": 0.9942, "step": 11621 }, { "epoch": 0.22, "learning_rate": 4.544876991267093e-06, "loss": 1.1651, "step": 11622 }, { "epoch": 0.22, "learning_rate": 4.5447891032427826e-06, "loss": 0.8262, "step": 11623 }, { "epoch": 0.22, "learning_rate": 4.544701207583292e-06, "loss": 0.9846, "step": 11624 }, { "epoch": 0.22, "learning_rate": 4.54461330428895e-06, "loss": 1.3611, "step": 11625 }, { "epoch": 0.22, "learning_rate": 4.544525393360084e-06, "loss": 0.8672, "step": 11626 }, { "epoch": 0.22, "learning_rate": 4.5444374747970235e-06, "loss": 0.887, "step": 11627 }, { "epoch": 0.22, "learning_rate": 4.544349548600095e-06, "loss": 0.7009, "step": 11628 }, { "epoch": 0.22, "learning_rate": 4.544261614769629e-06, "loss": 0.8189, "step": 11629 }, { "epoch": 0.22, "learning_rate": 4.544173673305953e-06, "loss": 0.9688, "step": 11630 }, { "epoch": 0.22, "learning_rate": 4.544085724209395e-06, "loss": 1.0131, "step": 11631 }, { "epoch": 0.22, "learning_rate": 4.543997767480283e-06, "loss": 0.9489, "step": 11632 }, { "epoch": 0.22, "learning_rate": 4.543909803118946e-06, "loss": 0.8334, "step": 11633 }, { "epoch": 0.22, "learning_rate": 4.543821831125713e-06, "loss": 0.8778, "step": 11634 }, { "epoch": 0.22, "learning_rate": 4.543733851500912e-06, "loss": 1.1053, "step": 11635 }, { "epoch": 0.22, "learning_rate": 4.543645864244871e-06, "loss": 0.9611, "step": 11636 }, { "epoch": 0.22, "learning_rate": 4.543557869357919e-06, "loss": 1.3577, "step": 11637 }, { "epoch": 0.22, "learning_rate": 4.543469866840385e-06, "loss": 0.8977, "step": 11638 }, { "epoch": 0.22, "learning_rate": 4.5433818566925975e-06, "loss": 0.8596, "step": 11639 }, { "epoch": 0.22, "learning_rate": 4.543293838914885e-06, "loss": 0.889, "step": 11640 }, { "epoch": 0.22, "learning_rate": 4.543205813507575e-06, "loss": 0.9453, "step": 11641 }, { "epoch": 0.22, "learning_rate": 4.543117780470997e-06, "loss": 0.9949, "step": 11642 }, { "epoch": 0.22, "learning_rate": 4.54302973980548e-06, "loss": 1.1077, "step": 11643 }, { "epoch": 0.22, "learning_rate": 4.542941691511354e-06, "loss": 1.1335, "step": 11644 }, { "epoch": 0.22, "learning_rate": 4.542853635588944e-06, "loss": 0.5797, "step": 11645 }, { "epoch": 0.22, "learning_rate": 4.542765572038582e-06, "loss": 0.8039, "step": 11646 }, { "epoch": 0.22, "learning_rate": 4.542677500860597e-06, "loss": 0.8737, "step": 11647 }, { "epoch": 0.22, "learning_rate": 4.542589422055317e-06, "loss": 1.058, "step": 11648 }, { "epoch": 0.22, "learning_rate": 4.542501335623069e-06, "loss": 1.0154, "step": 11649 }, { "epoch": 0.22, "learning_rate": 4.542413241564185e-06, "loss": 1.0038, "step": 11650 }, { "epoch": 0.22, "learning_rate": 4.542325139878992e-06, "loss": 0.814, "step": 11651 }, { "epoch": 0.22, "learning_rate": 4.54223703056782e-06, "loss": 0.9037, "step": 11652 }, { "epoch": 0.22, "learning_rate": 4.542148913630997e-06, "loss": 0.8866, "step": 11653 }, { "epoch": 0.22, "learning_rate": 4.542060789068853e-06, "loss": 1.032, "step": 11654 }, { "epoch": 0.22, "learning_rate": 4.541972656881716e-06, "loss": 1.191, "step": 11655 }, { "epoch": 0.22, "learning_rate": 4.541884517069916e-06, "loss": 1.1692, "step": 11656 }, { "epoch": 0.22, "learning_rate": 4.5417963696337815e-06, "loss": 0.9489, "step": 11657 }, { "epoch": 0.22, "learning_rate": 4.541708214573643e-06, "loss": 0.8698, "step": 11658 }, { "epoch": 0.22, "learning_rate": 4.541620051889828e-06, "loss": 0.8732, "step": 11659 }, { "epoch": 0.22, "learning_rate": 4.541531881582667e-06, "loss": 1.0892, "step": 11660 }, { "epoch": 0.22, "learning_rate": 4.541443703652487e-06, "loss": 0.9476, "step": 11661 }, { "epoch": 0.22, "learning_rate": 4.5413555180996204e-06, "loss": 1.3732, "step": 11662 }, { "epoch": 0.22, "learning_rate": 4.541267324924394e-06, "loss": 1.0037, "step": 11663 }, { "epoch": 0.22, "learning_rate": 4.541179124127139e-06, "loss": 0.8168, "step": 11664 }, { "epoch": 0.22, "learning_rate": 4.541090915708182e-06, "loss": 1.121, "step": 11665 }, { "epoch": 0.22, "learning_rate": 4.541002699667855e-06, "loss": 0.7339, "step": 11666 }, { "epoch": 0.22, "learning_rate": 4.540914476006487e-06, "loss": 1.0023, "step": 11667 }, { "epoch": 0.22, "learning_rate": 4.540826244724406e-06, "loss": 1.0343, "step": 11668 }, { "epoch": 0.22, "learning_rate": 4.540738005821943e-06, "loss": 1.0769, "step": 11669 }, { "epoch": 0.22, "learning_rate": 4.540649759299427e-06, "loss": 1.0104, "step": 11670 }, { "epoch": 0.22, "learning_rate": 4.540561505157186e-06, "loss": 0.7371, "step": 11671 }, { "epoch": 0.22, "learning_rate": 4.540473243395552e-06, "loss": 0.9151, "step": 11672 }, { "epoch": 0.22, "learning_rate": 4.540384974014854e-06, "loss": 0.7437, "step": 11673 }, { "epoch": 0.22, "learning_rate": 4.540296697015421e-06, "loss": 1.0383, "step": 11674 }, { "epoch": 0.22, "learning_rate": 4.540208412397582e-06, "loss": 1.1179, "step": 11675 }, { "epoch": 0.22, "learning_rate": 4.540120120161667e-06, "loss": 0.9199, "step": 11676 }, { "epoch": 0.22, "learning_rate": 4.540031820308007e-06, "loss": 0.9249, "step": 11677 }, { "epoch": 0.22, "learning_rate": 4.53994351283693e-06, "loss": 0.8452, "step": 11678 }, { "epoch": 0.22, "learning_rate": 4.539855197748767e-06, "loss": 1.14, "step": 11679 }, { "epoch": 0.22, "learning_rate": 4.539766875043847e-06, "loss": 1.0385, "step": 11680 }, { "epoch": 0.22, "learning_rate": 4.5396785447225e-06, "loss": 1.2604, "step": 11681 }, { "epoch": 0.22, "learning_rate": 4.5395902067850555e-06, "loss": 0.8755, "step": 11682 }, { "epoch": 0.22, "learning_rate": 4.539501861231844e-06, "loss": 1.0178, "step": 11683 }, { "epoch": 0.22, "learning_rate": 4.539413508063195e-06, "loss": 1.0982, "step": 11684 }, { "epoch": 0.22, "learning_rate": 4.5393251472794384e-06, "loss": 0.8229, "step": 11685 }, { "epoch": 0.22, "learning_rate": 4.539236778880906e-06, "loss": 1.078, "step": 11686 }, { "epoch": 0.22, "learning_rate": 4.539148402867924e-06, "loss": 1.0876, "step": 11687 }, { "epoch": 0.22, "learning_rate": 4.539060019240824e-06, "loss": 0.8757, "step": 11688 }, { "epoch": 0.22, "learning_rate": 4.538971627999937e-06, "loss": 0.7608, "step": 11689 }, { "epoch": 0.22, "learning_rate": 4.538883229145593e-06, "loss": 0.8372, "step": 11690 }, { "epoch": 0.22, "learning_rate": 4.5387948226781216e-06, "loss": 1.009, "step": 11691 }, { "epoch": 0.22, "learning_rate": 4.538706408597853e-06, "loss": 0.7494, "step": 11692 }, { "epoch": 0.22, "learning_rate": 4.538617986905116e-06, "loss": 1.087, "step": 11693 }, { "epoch": 0.22, "learning_rate": 4.538529557600243e-06, "loss": 1.1664, "step": 11694 }, { "epoch": 0.22, "learning_rate": 4.538441120683562e-06, "loss": 0.9071, "step": 11695 }, { "epoch": 0.22, "learning_rate": 4.5383526761554054e-06, "loss": 0.8773, "step": 11696 }, { "epoch": 0.22, "learning_rate": 4.538264224016102e-06, "loss": 0.9752, "step": 11697 }, { "epoch": 0.22, "learning_rate": 4.538175764265983e-06, "loss": 0.7825, "step": 11698 }, { "epoch": 0.22, "learning_rate": 4.538087296905378e-06, "loss": 0.857, "step": 11699 }, { "epoch": 0.22, "learning_rate": 4.537998821934617e-06, "loss": 1.3299, "step": 11700 }, { "epoch": 0.22, "learning_rate": 4.5379103393540315e-06, "loss": 0.9302, "step": 11701 }, { "epoch": 0.22, "learning_rate": 4.53782184916395e-06, "loss": 1.0008, "step": 11702 }, { "epoch": 0.22, "learning_rate": 4.537733351364706e-06, "loss": 0.9891, "step": 11703 }, { "epoch": 0.22, "learning_rate": 4.537644845956627e-06, "loss": 0.9155, "step": 11704 }, { "epoch": 0.22, "learning_rate": 4.537556332940045e-06, "loss": 0.9979, "step": 11705 }, { "epoch": 0.22, "learning_rate": 4.53746781231529e-06, "loss": 1.2787, "step": 11706 }, { "epoch": 0.22, "learning_rate": 4.537379284082692e-06, "loss": 1.0504, "step": 11707 }, { "epoch": 0.22, "learning_rate": 4.537290748242583e-06, "loss": 0.9734, "step": 11708 }, { "epoch": 0.22, "learning_rate": 4.537202204795293e-06, "loss": 0.9858, "step": 11709 }, { "epoch": 0.22, "learning_rate": 4.5371136537411526e-06, "loss": 0.9636, "step": 11710 }, { "epoch": 0.22, "learning_rate": 4.537025095080492e-06, "loss": 0.8087, "step": 11711 }, { "epoch": 0.22, "learning_rate": 4.536936528813641e-06, "loss": 1.061, "step": 11712 }, { "epoch": 0.22, "learning_rate": 4.536847954940933e-06, "loss": 1.1925, "step": 11713 }, { "epoch": 0.22, "learning_rate": 4.536759373462697e-06, "loss": 0.8843, "step": 11714 }, { "epoch": 0.22, "learning_rate": 4.536670784379263e-06, "loss": 0.9024, "step": 11715 }, { "epoch": 0.22, "learning_rate": 4.5365821876909635e-06, "loss": 0.9019, "step": 11716 }, { "epoch": 0.22, "learning_rate": 4.536493583398128e-06, "loss": 0.9276, "step": 11717 }, { "epoch": 0.22, "learning_rate": 4.536404971501088e-06, "loss": 1.1515, "step": 11718 }, { "epoch": 0.22, "learning_rate": 4.5363163520001754e-06, "loss": 1.2262, "step": 11719 }, { "epoch": 0.22, "learning_rate": 4.536227724895719e-06, "loss": 0.8695, "step": 11720 }, { "epoch": 0.22, "learning_rate": 4.536139090188051e-06, "loss": 1.1036, "step": 11721 }, { "epoch": 0.22, "learning_rate": 4.5360504478775016e-06, "loss": 1.2123, "step": 11722 }, { "epoch": 0.22, "learning_rate": 4.5359617979644026e-06, "loss": 0.8002, "step": 11723 }, { "epoch": 0.22, "learning_rate": 4.5358731404490855e-06, "loss": 0.941, "step": 11724 }, { "epoch": 0.22, "learning_rate": 4.535784475331879e-06, "loss": 1.1098, "step": 11725 }, { "epoch": 0.22, "learning_rate": 4.535695802613116e-06, "loss": 0.954, "step": 11726 }, { "epoch": 0.22, "learning_rate": 4.535607122293128e-06, "loss": 0.8118, "step": 11727 }, { "epoch": 0.22, "learning_rate": 4.5355184343722445e-06, "loss": 0.928, "step": 11728 }, { "epoch": 0.22, "learning_rate": 4.535429738850799e-06, "loss": 0.8636, "step": 11729 }, { "epoch": 0.22, "learning_rate": 4.53534103572912e-06, "loss": 0.9392, "step": 11730 }, { "epoch": 0.22, "learning_rate": 4.5352523250075405e-06, "loss": 1.2565, "step": 11731 }, { "epoch": 0.22, "learning_rate": 4.535163606686391e-06, "loss": 0.9246, "step": 11732 }, { "epoch": 0.22, "learning_rate": 4.535074880766003e-06, "loss": 0.8192, "step": 11733 }, { "epoch": 0.22, "learning_rate": 4.534986147246708e-06, "loss": 0.9246, "step": 11734 }, { "epoch": 0.22, "learning_rate": 4.534897406128837e-06, "loss": 0.8474, "step": 11735 }, { "epoch": 0.22, "learning_rate": 4.534808657412722e-06, "loss": 0.8995, "step": 11736 }, { "epoch": 0.22, "learning_rate": 4.534719901098693e-06, "loss": 1.137, "step": 11737 }, { "epoch": 0.22, "learning_rate": 4.534631137187082e-06, "loss": 0.9197, "step": 11738 }, { "epoch": 0.22, "learning_rate": 4.534542365678221e-06, "loss": 1.0638, "step": 11739 }, { "epoch": 0.22, "learning_rate": 4.534453586572441e-06, "loss": 0.8817, "step": 11740 }, { "epoch": 0.22, "learning_rate": 4.534364799870075e-06, "loss": 0.9504, "step": 11741 }, { "epoch": 0.22, "learning_rate": 4.5342760055714525e-06, "loss": 0.8203, "step": 11742 }, { "epoch": 0.22, "learning_rate": 4.5341872036769055e-06, "loss": 1.0381, "step": 11743 }, { "epoch": 0.22, "learning_rate": 4.534098394186766e-06, "loss": 0.831, "step": 11744 }, { "epoch": 0.22, "learning_rate": 4.534009577101366e-06, "loss": 1.0804, "step": 11745 }, { "epoch": 0.22, "learning_rate": 4.533920752421035e-06, "loss": 0.8631, "step": 11746 }, { "epoch": 0.22, "learning_rate": 4.5338319201461075e-06, "loss": 0.9387, "step": 11747 }, { "epoch": 0.22, "learning_rate": 4.5337430802769144e-06, "loss": 0.8758, "step": 11748 }, { "epoch": 0.22, "learning_rate": 4.533654232813786e-06, "loss": 1.0889, "step": 11749 }, { "epoch": 0.22, "learning_rate": 4.533565377757055e-06, "loss": 1.1052, "step": 11750 }, { "epoch": 0.22, "learning_rate": 4.533476515107055e-06, "loss": 0.6101, "step": 11751 }, { "epoch": 0.22, "learning_rate": 4.533387644864114e-06, "loss": 0.787, "step": 11752 }, { "epoch": 0.22, "learning_rate": 4.533298767028567e-06, "loss": 1.0182, "step": 11753 }, { "epoch": 0.22, "learning_rate": 4.533209881600744e-06, "loss": 1.0913, "step": 11754 }, { "epoch": 0.22, "learning_rate": 4.5331209885809775e-06, "loss": 0.9533, "step": 11755 }, { "epoch": 0.22, "learning_rate": 4.533032087969601e-06, "loss": 1.007, "step": 11756 }, { "epoch": 0.22, "learning_rate": 4.532943179766944e-06, "loss": 0.9776, "step": 11757 }, { "epoch": 0.22, "learning_rate": 4.53285426397334e-06, "loss": 0.9077, "step": 11758 }, { "epoch": 0.22, "learning_rate": 4.532765340589119e-06, "loss": 0.871, "step": 11759 }, { "epoch": 0.22, "learning_rate": 4.532676409614616e-06, "loss": 0.9061, "step": 11760 }, { "epoch": 0.22, "learning_rate": 4.532587471050162e-06, "loss": 0.9623, "step": 11761 }, { "epoch": 0.22, "learning_rate": 4.5324985248960875e-06, "loss": 1.0746, "step": 11762 }, { "epoch": 0.22, "learning_rate": 4.532409571152726e-06, "loss": 0.9037, "step": 11763 }, { "epoch": 0.22, "learning_rate": 4.53232060982041e-06, "loss": 0.9828, "step": 11764 }, { "epoch": 0.22, "learning_rate": 4.53223164089947e-06, "loss": 0.7847, "step": 11765 }, { "epoch": 0.22, "learning_rate": 4.532142664390241e-06, "loss": 1.0894, "step": 11766 }, { "epoch": 0.22, "learning_rate": 4.532053680293053e-06, "loss": 1.1118, "step": 11767 }, { "epoch": 0.22, "learning_rate": 4.531964688608239e-06, "loss": 1.1674, "step": 11768 }, { "epoch": 0.22, "learning_rate": 4.531875689336131e-06, "loss": 1.0956, "step": 11769 }, { "epoch": 0.22, "learning_rate": 4.531786682477061e-06, "loss": 0.9849, "step": 11770 }, { "epoch": 0.22, "learning_rate": 4.531697668031362e-06, "loss": 0.7945, "step": 11771 }, { "epoch": 0.22, "learning_rate": 4.531608645999366e-06, "loss": 0.8097, "step": 11772 }, { "epoch": 0.22, "learning_rate": 4.531519616381406e-06, "loss": 0.782, "step": 11773 }, { "epoch": 0.22, "learning_rate": 4.531430579177815e-06, "loss": 0.9881, "step": 11774 }, { "epoch": 0.22, "learning_rate": 4.531341534388923e-06, "loss": 1.1918, "step": 11775 }, { "epoch": 0.22, "learning_rate": 4.531252482015064e-06, "loss": 1.0275, "step": 11776 }, { "epoch": 0.22, "learning_rate": 4.531163422056571e-06, "loss": 1.0201, "step": 11777 }, { "epoch": 0.22, "learning_rate": 4.531074354513776e-06, "loss": 0.7755, "step": 11778 }, { "epoch": 0.22, "learning_rate": 4.530985279387013e-06, "loss": 0.9703, "step": 11779 }, { "epoch": 0.22, "learning_rate": 4.530896196676611e-06, "loss": 1.1844, "step": 11780 }, { "epoch": 0.22, "learning_rate": 4.5308071063829055e-06, "loss": 1.1206, "step": 11781 }, { "epoch": 0.22, "learning_rate": 4.530718008506229e-06, "loss": 0.9439, "step": 11782 }, { "epoch": 0.22, "learning_rate": 4.530628903046914e-06, "loss": 0.9717, "step": 11783 }, { "epoch": 0.22, "learning_rate": 4.530539790005292e-06, "loss": 0.878, "step": 11784 }, { "epoch": 0.22, "learning_rate": 4.530450669381697e-06, "loss": 1.0816, "step": 11785 }, { "epoch": 0.22, "learning_rate": 4.530361541176462e-06, "loss": 0.8721, "step": 11786 }, { "epoch": 0.22, "learning_rate": 4.530272405389919e-06, "loss": 1.231, "step": 11787 }, { "epoch": 0.22, "learning_rate": 4.5301832620224005e-06, "loss": 1.0536, "step": 11788 }, { "epoch": 0.22, "learning_rate": 4.530094111074241e-06, "loss": 0.9503, "step": 11789 }, { "epoch": 0.22, "learning_rate": 4.530004952545772e-06, "loss": 0.8507, "step": 11790 }, { "epoch": 0.22, "learning_rate": 4.529915786437326e-06, "loss": 0.9779, "step": 11791 }, { "epoch": 0.22, "learning_rate": 4.529826612749238e-06, "loss": 0.8765, "step": 11792 }, { "epoch": 0.22, "learning_rate": 4.529737431481839e-06, "loss": 0.977, "step": 11793 }, { "epoch": 0.22, "learning_rate": 4.529648242635461e-06, "loss": 1.1115, "step": 11794 }, { "epoch": 0.22, "learning_rate": 4.529559046210441e-06, "loss": 0.9048, "step": 11795 }, { "epoch": 0.22, "learning_rate": 4.529469842207109e-06, "loss": 1.0223, "step": 11796 }, { "epoch": 0.22, "learning_rate": 4.529380630625799e-06, "loss": 0.911, "step": 11797 }, { "epoch": 0.22, "learning_rate": 4.529291411466844e-06, "loss": 1.0843, "step": 11798 }, { "epoch": 0.22, "learning_rate": 4.529202184730577e-06, "loss": 1.1151, "step": 11799 }, { "epoch": 0.22, "learning_rate": 4.529112950417331e-06, "loss": 1.024, "step": 11800 }, { "epoch": 0.22, "learning_rate": 4.529023708527439e-06, "loss": 0.9482, "step": 11801 }, { "epoch": 0.22, "learning_rate": 4.528934459061235e-06, "loss": 0.8619, "step": 11802 }, { "epoch": 0.22, "learning_rate": 4.528845202019052e-06, "loss": 0.7858, "step": 11803 }, { "epoch": 0.22, "learning_rate": 4.528755937401224e-06, "loss": 0.9556, "step": 11804 }, { "epoch": 0.22, "learning_rate": 4.528666665208083e-06, "loss": 1.0707, "step": 11805 }, { "epoch": 0.22, "learning_rate": 4.528577385439963e-06, "loss": 0.8468, "step": 11806 }, { "epoch": 0.22, "learning_rate": 4.528488098097197e-06, "loss": 0.9709, "step": 11807 }, { "epoch": 0.22, "learning_rate": 4.528398803180119e-06, "loss": 1.0181, "step": 11808 }, { "epoch": 0.22, "learning_rate": 4.528309500689061e-06, "loss": 0.8828, "step": 11809 }, { "epoch": 0.22, "learning_rate": 4.528220190624358e-06, "loss": 0.8749, "step": 11810 }, { "epoch": 0.22, "learning_rate": 4.528130872986344e-06, "loss": 0.6983, "step": 11811 }, { "epoch": 0.22, "learning_rate": 4.528041547775351e-06, "loss": 1.2835, "step": 11812 }, { "epoch": 0.22, "learning_rate": 4.527952214991712e-06, "loss": 1.14, "step": 11813 }, { "epoch": 0.22, "learning_rate": 4.5278628746357635e-06, "loss": 0.8942, "step": 11814 }, { "epoch": 0.22, "learning_rate": 4.527773526707836e-06, "loss": 0.9539, "step": 11815 }, { "epoch": 0.22, "learning_rate": 4.527684171208264e-06, "loss": 0.7762, "step": 11816 }, { "epoch": 0.22, "learning_rate": 4.527594808137382e-06, "loss": 0.9727, "step": 11817 }, { "epoch": 0.22, "learning_rate": 4.527505437495523e-06, "loss": 1.2239, "step": 11818 }, { "epoch": 0.22, "learning_rate": 4.527416059283021e-06, "loss": 1.0575, "step": 11819 }, { "epoch": 0.22, "learning_rate": 4.52732667350021e-06, "loss": 0.8838, "step": 11820 }, { "epoch": 0.22, "learning_rate": 4.527237280147422e-06, "loss": 0.8852, "step": 11821 }, { "epoch": 0.22, "learning_rate": 4.527147879224993e-06, "loss": 0.8253, "step": 11822 }, { "epoch": 0.22, "learning_rate": 4.527058470733257e-06, "loss": 0.8271, "step": 11823 }, { "epoch": 0.22, "learning_rate": 4.526969054672546e-06, "loss": 0.988, "step": 11824 }, { "epoch": 0.22, "learning_rate": 4.526879631043194e-06, "loss": 0.9587, "step": 11825 }, { "epoch": 0.22, "learning_rate": 4.526790199845536e-06, "loss": 0.6608, "step": 11826 }, { "epoch": 0.22, "learning_rate": 4.526700761079906e-06, "loss": 0.9734, "step": 11827 }, { "epoch": 0.22, "learning_rate": 4.526611314746637e-06, "loss": 0.9635, "step": 11828 }, { "epoch": 0.22, "learning_rate": 4.526521860846064e-06, "loss": 0.8607, "step": 11829 }, { "epoch": 0.22, "learning_rate": 4.526432399378519e-06, "loss": 0.8379, "step": 11830 }, { "epoch": 0.22, "learning_rate": 4.52634293034434e-06, "loss": 1.1893, "step": 11831 }, { "epoch": 0.22, "learning_rate": 4.5262534537438565e-06, "loss": 0.9084, "step": 11832 }, { "epoch": 0.22, "learning_rate": 4.5261639695774054e-06, "loss": 0.9239, "step": 11833 }, { "epoch": 0.22, "learning_rate": 4.5260744778453205e-06, "loss": 0.9341, "step": 11834 }, { "epoch": 0.22, "learning_rate": 4.525984978547936e-06, "loss": 0.8543, "step": 11835 }, { "epoch": 0.22, "learning_rate": 4.5258954716855854e-06, "loss": 0.9187, "step": 11836 }, { "epoch": 0.22, "learning_rate": 4.525805957258602e-06, "loss": 1.2349, "step": 11837 }, { "epoch": 0.22, "learning_rate": 4.525716435267323e-06, "loss": 0.9736, "step": 11838 }, { "epoch": 0.22, "learning_rate": 4.52562690571208e-06, "loss": 0.942, "step": 11839 }, { "epoch": 0.22, "learning_rate": 4.525537368593208e-06, "loss": 1.0106, "step": 11840 }, { "epoch": 0.22, "learning_rate": 4.525447823911042e-06, "loss": 0.7951, "step": 11841 }, { "epoch": 0.22, "learning_rate": 4.525358271665916e-06, "loss": 0.8508, "step": 11842 }, { "epoch": 0.22, "learning_rate": 4.525268711858165e-06, "loss": 1.0887, "step": 11843 }, { "epoch": 0.22, "learning_rate": 4.525179144488121e-06, "loss": 0.975, "step": 11844 }, { "epoch": 0.22, "learning_rate": 4.525089569556122e-06, "loss": 1.0437, "step": 11845 }, { "epoch": 0.22, "learning_rate": 4.524999987062499e-06, "loss": 0.9496, "step": 11846 }, { "epoch": 0.22, "learning_rate": 4.524910397007589e-06, "loss": 0.9792, "step": 11847 }, { "epoch": 0.22, "learning_rate": 4.524820799391726e-06, "loss": 0.95, "step": 11848 }, { "epoch": 0.22, "learning_rate": 4.524731194215244e-06, "loss": 0.9811, "step": 11849 }, { "epoch": 0.22, "learning_rate": 4.524641581478477e-06, "loss": 1.1899, "step": 11850 }, { "epoch": 0.22, "learning_rate": 4.524551961181761e-06, "loss": 1.0082, "step": 11851 }, { "epoch": 0.22, "learning_rate": 4.52446233332543e-06, "loss": 1.0186, "step": 11852 }, { "epoch": 0.22, "learning_rate": 4.524372697909819e-06, "loss": 0.941, "step": 11853 }, { "epoch": 0.22, "learning_rate": 4.524283054935262e-06, "loss": 0.8124, "step": 11854 }, { "epoch": 0.22, "learning_rate": 4.524193404402095e-06, "loss": 0.8503, "step": 11855 }, { "epoch": 0.22, "learning_rate": 4.5241037463106504e-06, "loss": 1.164, "step": 11856 }, { "epoch": 0.22, "learning_rate": 4.5240140806612655e-06, "loss": 0.8677, "step": 11857 }, { "epoch": 0.22, "learning_rate": 4.523924407454274e-06, "loss": 1.0029, "step": 11858 }, { "epoch": 0.22, "learning_rate": 4.523834726690011e-06, "loss": 0.8373, "step": 11859 }, { "epoch": 0.22, "learning_rate": 4.5237450383688105e-06, "loss": 0.8951, "step": 11860 }, { "epoch": 0.22, "learning_rate": 4.523655342491009e-06, "loss": 0.9711, "step": 11861 }, { "epoch": 0.22, "learning_rate": 4.523565639056939e-06, "loss": 0.8443, "step": 11862 }, { "epoch": 0.22, "learning_rate": 4.523475928066939e-06, "loss": 0.8759, "step": 11863 }, { "epoch": 0.22, "learning_rate": 4.52338620952134e-06, "loss": 0.8955, "step": 11864 }, { "epoch": 0.22, "learning_rate": 4.52329648342048e-06, "loss": 0.9414, "step": 11865 }, { "epoch": 0.22, "learning_rate": 4.523206749764693e-06, "loss": 0.8312, "step": 11866 }, { "epoch": 0.22, "learning_rate": 4.523117008554313e-06, "loss": 0.8154, "step": 11867 }, { "epoch": 0.22, "learning_rate": 4.523027259789677e-06, "loss": 1.1072, "step": 11868 }, { "epoch": 0.22, "learning_rate": 4.5229375034711194e-06, "loss": 1.0045, "step": 11869 }, { "epoch": 0.22, "learning_rate": 4.522847739598975e-06, "loss": 0.9854, "step": 11870 }, { "epoch": 0.22, "learning_rate": 4.522757968173579e-06, "loss": 0.9308, "step": 11871 }, { "epoch": 0.22, "learning_rate": 4.522668189195267e-06, "loss": 0.8848, "step": 11872 }, { "epoch": 0.22, "learning_rate": 4.522578402664374e-06, "loss": 0.9807, "step": 11873 }, { "epoch": 0.22, "learning_rate": 4.5224886085812345e-06, "loss": 1.0659, "step": 11874 }, { "epoch": 0.22, "learning_rate": 4.522398806946185e-06, "loss": 0.9512, "step": 11875 }, { "epoch": 0.22, "learning_rate": 4.522308997759561e-06, "loss": 0.9315, "step": 11876 }, { "epoch": 0.22, "learning_rate": 4.5222191810216964e-06, "loss": 1.1389, "step": 11877 }, { "epoch": 0.22, "learning_rate": 4.522129356732928e-06, "loss": 0.886, "step": 11878 }, { "epoch": 0.22, "learning_rate": 4.52203952489359e-06, "loss": 0.8675, "step": 11879 }, { "epoch": 0.22, "learning_rate": 4.521949685504019e-06, "loss": 0.8668, "step": 11880 }, { "epoch": 0.22, "learning_rate": 4.521859838564549e-06, "loss": 1.0096, "step": 11881 }, { "epoch": 0.22, "learning_rate": 4.521769984075517e-06, "loss": 1.183, "step": 11882 }, { "epoch": 0.22, "learning_rate": 4.521680122037258e-06, "loss": 0.8688, "step": 11883 }, { "epoch": 0.22, "learning_rate": 4.521590252450107e-06, "loss": 0.8833, "step": 11884 }, { "epoch": 0.22, "learning_rate": 4.521500375314401e-06, "loss": 0.973, "step": 11885 }, { "epoch": 0.22, "learning_rate": 4.521410490630473e-06, "loss": 0.9643, "step": 11886 }, { "epoch": 0.22, "learning_rate": 4.521320598398661e-06, "loss": 1.0219, "step": 11887 }, { "epoch": 0.22, "learning_rate": 4.5212306986193e-06, "loss": 0.8036, "step": 11888 }, { "epoch": 0.22, "learning_rate": 4.521140791292725e-06, "loss": 0.9357, "step": 11889 }, { "epoch": 0.22, "learning_rate": 4.521050876419273e-06, "loss": 1.1, "step": 11890 }, { "epoch": 0.22, "learning_rate": 4.520960953999278e-06, "loss": 1.1725, "step": 11891 }, { "epoch": 0.22, "learning_rate": 4.520871024033078e-06, "loss": 1.1118, "step": 11892 }, { "epoch": 0.22, "learning_rate": 4.520781086521007e-06, "loss": 1.0496, "step": 11893 }, { "epoch": 0.22, "learning_rate": 4.520691141463401e-06, "loss": 1.0392, "step": 11894 }, { "epoch": 0.22, "learning_rate": 4.5206011888605965e-06, "loss": 0.8262, "step": 11895 }, { "epoch": 0.22, "learning_rate": 4.52051122871293e-06, "loss": 0.912, "step": 11896 }, { "epoch": 0.22, "learning_rate": 4.520421261020735e-06, "loss": 0.8696, "step": 11897 }, { "epoch": 0.22, "learning_rate": 4.52033128578435e-06, "loss": 0.9843, "step": 11898 }, { "epoch": 0.22, "learning_rate": 4.520241303004109e-06, "loss": 1.1971, "step": 11899 }, { "epoch": 0.22, "learning_rate": 4.5201513126803495e-06, "loss": 0.9824, "step": 11900 }, { "epoch": 0.22, "learning_rate": 4.520061314813407e-06, "loss": 0.8028, "step": 11901 }, { "epoch": 0.22, "learning_rate": 4.519971309403617e-06, "loss": 0.804, "step": 11902 }, { "epoch": 0.22, "learning_rate": 4.5198812964513166e-06, "loss": 1.0125, "step": 11903 }, { "epoch": 0.22, "learning_rate": 4.519791275956842e-06, "loss": 0.9273, "step": 11904 }, { "epoch": 0.22, "learning_rate": 4.519701247920527e-06, "loss": 1.1989, "step": 11905 }, { "epoch": 0.22, "learning_rate": 4.519611212342711e-06, "loss": 1.1382, "step": 11906 }, { "epoch": 0.22, "learning_rate": 4.519521169223727e-06, "loss": 1.0452, "step": 11907 }, { "epoch": 0.22, "learning_rate": 4.519431118563915e-06, "loss": 0.8502, "step": 11908 }, { "epoch": 0.22, "learning_rate": 4.519341060363608e-06, "loss": 1.027, "step": 11909 }, { "epoch": 0.22, "learning_rate": 4.5192509946231435e-06, "loss": 0.9477, "step": 11910 }, { "epoch": 0.22, "learning_rate": 4.519160921342858e-06, "loss": 1.0505, "step": 11911 }, { "epoch": 0.22, "learning_rate": 4.519070840523087e-06, "loss": 1.2639, "step": 11912 }, { "epoch": 0.22, "learning_rate": 4.518980752164167e-06, "loss": 1.1214, "step": 11913 }, { "epoch": 0.22, "learning_rate": 4.518890656266435e-06, "loss": 1.0592, "step": 11914 }, { "epoch": 0.22, "learning_rate": 4.518800552830228e-06, "loss": 0.9573, "step": 11915 }, { "epoch": 0.22, "learning_rate": 4.518710441855882e-06, "loss": 0.8759, "step": 11916 }, { "epoch": 0.22, "learning_rate": 4.518620323343731e-06, "loss": 0.8975, "step": 11917 }, { "epoch": 0.22, "learning_rate": 4.5185301972941154e-06, "loss": 0.9515, "step": 11918 }, { "epoch": 0.22, "learning_rate": 4.518440063707369e-06, "loss": 0.8156, "step": 11919 }, { "epoch": 0.22, "learning_rate": 4.51834992258383e-06, "loss": 0.8489, "step": 11920 }, { "epoch": 0.22, "learning_rate": 4.5182597739238335e-06, "loss": 0.9062, "step": 11921 }, { "epoch": 0.22, "learning_rate": 4.518169617727718e-06, "loss": 0.8941, "step": 11922 }, { "epoch": 0.22, "learning_rate": 4.518079453995818e-06, "loss": 0.8601, "step": 11923 }, { "epoch": 0.22, "learning_rate": 4.517989282728472e-06, "loss": 1.0197, "step": 11924 }, { "epoch": 0.22, "learning_rate": 4.517899103926015e-06, "loss": 1.0295, "step": 11925 }, { "epoch": 0.23, "learning_rate": 4.5178089175887855e-06, "loss": 0.8738, "step": 11926 }, { "epoch": 0.23, "learning_rate": 4.517718723717119e-06, "loss": 1.0119, "step": 11927 }, { "epoch": 0.23, "learning_rate": 4.517628522311352e-06, "loss": 0.9521, "step": 11928 }, { "epoch": 0.23, "learning_rate": 4.517538313371823e-06, "loss": 1.0288, "step": 11929 }, { "epoch": 0.23, "learning_rate": 4.517448096898866e-06, "loss": 1.0754, "step": 11930 }, { "epoch": 0.23, "learning_rate": 4.517357872892822e-06, "loss": 1.1838, "step": 11931 }, { "epoch": 0.23, "learning_rate": 4.517267641354025e-06, "loss": 1.0725, "step": 11932 }, { "epoch": 0.23, "learning_rate": 4.517177402282812e-06, "loss": 0.7852, "step": 11933 }, { "epoch": 0.23, "learning_rate": 4.51708715567952e-06, "loss": 1.0908, "step": 11934 }, { "epoch": 0.23, "learning_rate": 4.516996901544487e-06, "loss": 0.9472, "step": 11935 }, { "epoch": 0.23, "learning_rate": 4.5169066398780495e-06, "loss": 0.9391, "step": 11936 }, { "epoch": 0.23, "learning_rate": 4.516816370680543e-06, "loss": 1.1792, "step": 11937 }, { "epoch": 0.23, "learning_rate": 4.516726093952308e-06, "loss": 0.9162, "step": 11938 }, { "epoch": 0.23, "learning_rate": 4.516635809693679e-06, "loss": 0.847, "step": 11939 }, { "epoch": 0.23, "learning_rate": 4.5165455179049934e-06, "loss": 0.8307, "step": 11940 }, { "epoch": 0.23, "learning_rate": 4.516455218586589e-06, "loss": 0.9514, "step": 11941 }, { "epoch": 0.23, "learning_rate": 4.5163649117388016e-06, "loss": 1.0317, "step": 11942 }, { "epoch": 0.23, "learning_rate": 4.5162745973619706e-06, "loss": 1.1143, "step": 11943 }, { "epoch": 0.23, "learning_rate": 4.516184275456432e-06, "loss": 1.1503, "step": 11944 }, { "epoch": 0.23, "learning_rate": 4.516093946022523e-06, "loss": 0.6931, "step": 11945 }, { "epoch": 0.23, "learning_rate": 4.516003609060581e-06, "loss": 0.8941, "step": 11946 }, { "epoch": 0.23, "learning_rate": 4.5159132645709435e-06, "loss": 1.0203, "step": 11947 }, { "epoch": 0.23, "learning_rate": 4.515822912553947e-06, "loss": 0.7992, "step": 11948 }, { "epoch": 0.23, "learning_rate": 4.51573255300993e-06, "loss": 1.0438, "step": 11949 }, { "epoch": 0.23, "learning_rate": 4.5156421859392296e-06, "loss": 1.1973, "step": 11950 }, { "epoch": 0.23, "learning_rate": 4.515551811342183e-06, "loss": 0.9729, "step": 11951 }, { "epoch": 0.23, "learning_rate": 4.515461429219128e-06, "loss": 0.9029, "step": 11952 }, { "epoch": 0.23, "learning_rate": 4.515371039570401e-06, "loss": 0.9174, "step": 11953 }, { "epoch": 0.23, "learning_rate": 4.515280642396342e-06, "loss": 0.8062, "step": 11954 }, { "epoch": 0.23, "learning_rate": 4.515190237697285e-06, "loss": 0.9925, "step": 11955 }, { "epoch": 0.23, "learning_rate": 4.51509982547357e-06, "loss": 1.0519, "step": 11956 }, { "epoch": 0.23, "learning_rate": 4.515009405725534e-06, "loss": 1.0141, "step": 11957 }, { "epoch": 0.23, "learning_rate": 4.514918978453515e-06, "loss": 0.9781, "step": 11958 }, { "epoch": 0.23, "learning_rate": 4.51482854365785e-06, "loss": 1.0539, "step": 11959 }, { "epoch": 0.23, "learning_rate": 4.514738101338877e-06, "loss": 0.8856, "step": 11960 }, { "epoch": 0.23, "learning_rate": 4.514647651496934e-06, "loss": 0.9713, "step": 11961 }, { "epoch": 0.23, "learning_rate": 4.514557194132358e-06, "loss": 1.1052, "step": 11962 }, { "epoch": 0.23, "learning_rate": 4.514466729245488e-06, "loss": 1.1722, "step": 11963 }, { "epoch": 0.23, "learning_rate": 4.51437625683666e-06, "loss": 1.1371, "step": 11964 }, { "epoch": 0.23, "learning_rate": 4.514285776906213e-06, "loss": 0.9226, "step": 11965 }, { "epoch": 0.23, "learning_rate": 4.514195289454485e-06, "loss": 0.9572, "step": 11966 }, { "epoch": 0.23, "learning_rate": 4.514104794481814e-06, "loss": 0.8492, "step": 11967 }, { "epoch": 0.23, "learning_rate": 4.514014291988536e-06, "loss": 1.0238, "step": 11968 }, { "epoch": 0.23, "learning_rate": 4.513923781974992e-06, "loss": 1.1431, "step": 11969 }, { "epoch": 0.23, "learning_rate": 4.513833264441518e-06, "loss": 0.7573, "step": 11970 }, { "epoch": 0.23, "learning_rate": 4.513742739388452e-06, "loss": 0.9215, "step": 11971 }, { "epoch": 0.23, "learning_rate": 4.513652206816132e-06, "loss": 0.7934, "step": 11972 }, { "epoch": 0.23, "learning_rate": 4.5135616667248975e-06, "loss": 0.7645, "step": 11973 }, { "epoch": 0.23, "learning_rate": 4.513471119115085e-06, "loss": 1.1259, "step": 11974 }, { "epoch": 0.23, "learning_rate": 4.513380563987032e-06, "loss": 1.0543, "step": 11975 }, { "epoch": 0.23, "learning_rate": 4.513290001341078e-06, "loss": 1.0603, "step": 11976 }, { "epoch": 0.23, "learning_rate": 4.513199431177561e-06, "loss": 0.9018, "step": 11977 }, { "epoch": 0.23, "learning_rate": 4.51310885349682e-06, "loss": 0.7787, "step": 11978 }, { "epoch": 0.23, "learning_rate": 4.513018268299192e-06, "loss": 0.8714, "step": 11979 }, { "epoch": 0.23, "learning_rate": 4.5129276755850145e-06, "loss": 1.2175, "step": 11980 }, { "epoch": 0.23, "learning_rate": 4.512837075354628e-06, "loss": 1.134, "step": 11981 }, { "epoch": 0.23, "learning_rate": 4.51274646760837e-06, "loss": 0.9001, "step": 11982 }, { "epoch": 0.23, "learning_rate": 4.512655852346577e-06, "loss": 0.994, "step": 11983 }, { "epoch": 0.23, "learning_rate": 4.512565229569589e-06, "loss": 0.8093, "step": 11984 }, { "epoch": 0.23, "learning_rate": 4.512474599277744e-06, "loss": 0.8338, "step": 11985 }, { "epoch": 0.23, "learning_rate": 4.512383961471381e-06, "loss": 0.8018, "step": 11986 }, { "epoch": 0.23, "learning_rate": 4.512293316150838e-06, "loss": 1.0408, "step": 11987 }, { "epoch": 0.23, "learning_rate": 4.512202663316454e-06, "loss": 1.0417, "step": 11988 }, { "epoch": 0.23, "learning_rate": 4.512112002968566e-06, "loss": 0.8388, "step": 11989 }, { "epoch": 0.23, "learning_rate": 4.512021335107514e-06, "loss": 0.9796, "step": 11990 }, { "epoch": 0.23, "learning_rate": 4.511930659733635e-06, "loss": 0.8868, "step": 11991 }, { "epoch": 0.23, "learning_rate": 4.51183997684727e-06, "loss": 0.9581, "step": 11992 }, { "epoch": 0.23, "learning_rate": 4.511749286448755e-06, "loss": 0.9425, "step": 11993 }, { "epoch": 0.23, "learning_rate": 4.511658588538431e-06, "loss": 1.0255, "step": 11994 }, { "epoch": 0.23, "learning_rate": 4.5115678831166345e-06, "loss": 1.0234, "step": 11995 }, { "epoch": 0.23, "learning_rate": 4.511477170183706e-06, "loss": 0.856, "step": 11996 }, { "epoch": 0.23, "learning_rate": 4.511386449739983e-06, "loss": 1.1019, "step": 11997 }, { "epoch": 0.23, "learning_rate": 4.511295721785805e-06, "loss": 1.0527, "step": 11998 }, { "epoch": 0.23, "learning_rate": 4.51120498632151e-06, "loss": 0.9438, "step": 11999 }, { "epoch": 0.23, "learning_rate": 4.511114243347438e-06, "loss": 1.0264, "step": 12000 }, { "epoch": 0.23, "learning_rate": 4.511023492863926e-06, "loss": 1.0297, "step": 12001 }, { "epoch": 0.23, "learning_rate": 4.510932734871315e-06, "loss": 1.0457, "step": 12002 }, { "epoch": 0.23, "learning_rate": 4.510841969369943e-06, "loss": 0.8507, "step": 12003 }, { "epoch": 0.23, "learning_rate": 4.510751196360147e-06, "loss": 1.2794, "step": 12004 }, { "epoch": 0.23, "learning_rate": 4.510660415842268e-06, "loss": 0.9219, "step": 12005 }, { "epoch": 0.23, "learning_rate": 4.510569627816646e-06, "loss": 1.0119, "step": 12006 }, { "epoch": 0.23, "learning_rate": 4.510478832283618e-06, "loss": 0.9408, "step": 12007 }, { "epoch": 0.23, "learning_rate": 4.510388029243523e-06, "loss": 0.8259, "step": 12008 }, { "epoch": 0.23, "learning_rate": 4.510297218696702e-06, "loss": 0.9337, "step": 12009 }, { "epoch": 0.23, "learning_rate": 4.510206400643493e-06, "loss": 0.8264, "step": 12010 }, { "epoch": 0.23, "learning_rate": 4.510115575084234e-06, "loss": 0.9426, "step": 12011 }, { "epoch": 0.23, "learning_rate": 4.510024742019265e-06, "loss": 1.2018, "step": 12012 }, { "epoch": 0.23, "learning_rate": 4.509933901448925e-06, "loss": 1.0935, "step": 12013 }, { "epoch": 0.23, "learning_rate": 4.509843053373554e-06, "loss": 0.9359, "step": 12014 }, { "epoch": 0.23, "learning_rate": 4.509752197793491e-06, "loss": 0.9412, "step": 12015 }, { "epoch": 0.23, "learning_rate": 4.509661334709075e-06, "loss": 1.0746, "step": 12016 }, { "epoch": 0.23, "learning_rate": 4.509570464120644e-06, "loss": 0.9592, "step": 12017 }, { "epoch": 0.23, "learning_rate": 4.509479586028539e-06, "loss": 1.0078, "step": 12018 }, { "epoch": 0.23, "learning_rate": 4.5093887004330994e-06, "loss": 1.012, "step": 12019 }, { "epoch": 0.23, "learning_rate": 4.509297807334664e-06, "loss": 0.9423, "step": 12020 }, { "epoch": 0.23, "learning_rate": 4.509206906733572e-06, "loss": 0.9739, "step": 12021 }, { "epoch": 0.23, "learning_rate": 4.509115998630162e-06, "loss": 0.9732, "step": 12022 }, { "epoch": 0.23, "learning_rate": 4.5090250830247765e-06, "loss": 0.8947, "step": 12023 }, { "epoch": 0.23, "learning_rate": 4.508934159917752e-06, "loss": 0.9512, "step": 12024 }, { "epoch": 0.23, "learning_rate": 4.508843229309428e-06, "loss": 1.0793, "step": 12025 }, { "epoch": 0.23, "learning_rate": 4.508752291200146e-06, "loss": 1.1898, "step": 12026 }, { "epoch": 0.23, "learning_rate": 4.508661345590244e-06, "loss": 0.9239, "step": 12027 }, { "epoch": 0.23, "learning_rate": 4.508570392480062e-06, "loss": 0.8967, "step": 12028 }, { "epoch": 0.23, "learning_rate": 4.508479431869941e-06, "loss": 0.7243, "step": 12029 }, { "epoch": 0.23, "learning_rate": 4.508388463760218e-06, "loss": 0.8816, "step": 12030 }, { "epoch": 0.23, "learning_rate": 4.508297488151234e-06, "loss": 1.1342, "step": 12031 }, { "epoch": 0.23, "learning_rate": 4.50820650504333e-06, "loss": 0.9674, "step": 12032 }, { "epoch": 0.23, "learning_rate": 4.508115514436844e-06, "loss": 0.7008, "step": 12033 }, { "epoch": 0.23, "learning_rate": 4.508024516332116e-06, "loss": 0.9858, "step": 12034 }, { "epoch": 0.23, "learning_rate": 4.507933510729485e-06, "loss": 0.8357, "step": 12035 }, { "epoch": 0.23, "learning_rate": 4.5078424976292936e-06, "loss": 0.84, "step": 12036 }, { "epoch": 0.23, "learning_rate": 4.507751477031878e-06, "loss": 1.1154, "step": 12037 }, { "epoch": 0.23, "learning_rate": 4.507660448937582e-06, "loss": 1.0697, "step": 12038 }, { "epoch": 0.23, "learning_rate": 4.507569413346742e-06, "loss": 0.9449, "step": 12039 }, { "epoch": 0.23, "learning_rate": 4.5074783702597e-06, "loss": 1.0693, "step": 12040 }, { "epoch": 0.23, "learning_rate": 4.507387319676796e-06, "loss": 0.8174, "step": 12041 }, { "epoch": 0.23, "learning_rate": 4.5072962615983685e-06, "loss": 1.0478, "step": 12042 }, { "epoch": 0.23, "learning_rate": 4.5072051960247575e-06, "loss": 1.0701, "step": 12043 }, { "epoch": 0.23, "learning_rate": 4.507114122956305e-06, "loss": 1.1782, "step": 12044 }, { "epoch": 0.23, "learning_rate": 4.507023042393349e-06, "loss": 0.9933, "step": 12045 }, { "epoch": 0.23, "learning_rate": 4.506931954336232e-06, "loss": 1.0929, "step": 12046 }, { "epoch": 0.23, "learning_rate": 4.506840858785291e-06, "loss": 0.9549, "step": 12047 }, { "epoch": 0.23, "learning_rate": 4.506749755740869e-06, "loss": 0.9354, "step": 12048 }, { "epoch": 0.23, "learning_rate": 4.506658645203304e-06, "loss": 1.2542, "step": 12049 }, { "epoch": 0.23, "learning_rate": 4.506567527172938e-06, "loss": 1.4309, "step": 12050 }, { "epoch": 0.23, "learning_rate": 4.50647640165011e-06, "loss": 1.0129, "step": 12051 }, { "epoch": 0.23, "learning_rate": 4.50638526863516e-06, "loss": 0.884, "step": 12052 }, { "epoch": 0.23, "learning_rate": 4.506294128128429e-06, "loss": 1.068, "step": 12053 }, { "epoch": 0.23, "learning_rate": 4.506202980130258e-06, "loss": 1.0951, "step": 12054 }, { "epoch": 0.23, "learning_rate": 4.506111824640986e-06, "loss": 1.1124, "step": 12055 }, { "epoch": 0.23, "learning_rate": 4.506020661660955e-06, "loss": 1.2136, "step": 12056 }, { "epoch": 0.23, "learning_rate": 4.5059294911905035e-06, "loss": 0.9579, "step": 12057 }, { "epoch": 0.23, "learning_rate": 4.5058383132299725e-06, "loss": 1.0326, "step": 12058 }, { "epoch": 0.23, "learning_rate": 4.5057471277797034e-06, "loss": 0.9496, "step": 12059 }, { "epoch": 0.23, "learning_rate": 4.505655934840035e-06, "loss": 0.897, "step": 12060 }, { "epoch": 0.23, "learning_rate": 4.50556473441131e-06, "loss": 0.9947, "step": 12061 }, { "epoch": 0.23, "learning_rate": 4.505473526493868e-06, "loss": 0.9082, "step": 12062 }, { "epoch": 0.23, "learning_rate": 4.505382311088048e-06, "loss": 0.9841, "step": 12063 }, { "epoch": 0.23, "learning_rate": 4.505291088194192e-06, "loss": 0.7769, "step": 12064 }, { "epoch": 0.23, "learning_rate": 4.505199857812642e-06, "loss": 0.9569, "step": 12065 }, { "epoch": 0.23, "learning_rate": 4.505108619943736e-06, "loss": 1.033, "step": 12066 }, { "epoch": 0.23, "learning_rate": 4.505017374587817e-06, "loss": 0.8914, "step": 12067 }, { "epoch": 0.23, "learning_rate": 4.504926121745223e-06, "loss": 0.9427, "step": 12068 }, { "epoch": 0.23, "learning_rate": 4.504834861416297e-06, "loss": 1.0837, "step": 12069 }, { "epoch": 0.23, "learning_rate": 4.504743593601379e-06, "loss": 0.9639, "step": 12070 }, { "epoch": 0.23, "learning_rate": 4.5046523183008105e-06, "loss": 0.7429, "step": 12071 }, { "epoch": 0.23, "learning_rate": 4.504561035514932e-06, "loss": 1.0351, "step": 12072 }, { "epoch": 0.23, "learning_rate": 4.504469745244083e-06, "loss": 0.8768, "step": 12073 }, { "epoch": 0.23, "learning_rate": 4.504378447488607e-06, "loss": 1.0691, "step": 12074 }, { "epoch": 0.23, "learning_rate": 4.504287142248842e-06, "loss": 1.0746, "step": 12075 }, { "epoch": 0.23, "learning_rate": 4.50419582952513e-06, "loss": 1.0441, "step": 12076 }, { "epoch": 0.23, "learning_rate": 4.504104509317813e-06, "loss": 0.7944, "step": 12077 }, { "epoch": 0.23, "learning_rate": 4.50401318162723e-06, "loss": 1.0856, "step": 12078 }, { "epoch": 0.23, "learning_rate": 4.503921846453725e-06, "loss": 0.849, "step": 12079 }, { "epoch": 0.23, "learning_rate": 4.503830503797636e-06, "loss": 0.9382, "step": 12080 }, { "epoch": 0.23, "learning_rate": 4.503739153659306e-06, "loss": 1.0765, "step": 12081 }, { "epoch": 0.23, "learning_rate": 4.503647796039075e-06, "loss": 0.9478, "step": 12082 }, { "epoch": 0.23, "learning_rate": 4.503556430937284e-06, "loss": 0.9464, "step": 12083 }, { "epoch": 0.23, "learning_rate": 4.503465058354276e-06, "loss": 0.9622, "step": 12084 }, { "epoch": 0.23, "learning_rate": 4.50337367829039e-06, "loss": 0.8712, "step": 12085 }, { "epoch": 0.23, "learning_rate": 4.50328229074597e-06, "loss": 0.7205, "step": 12086 }, { "epoch": 0.23, "learning_rate": 4.503190895721353e-06, "loss": 0.983, "step": 12087 }, { "epoch": 0.23, "learning_rate": 4.5030994932168835e-06, "loss": 0.9573, "step": 12088 }, { "epoch": 0.23, "learning_rate": 4.5030080832329016e-06, "loss": 0.8005, "step": 12089 }, { "epoch": 0.23, "learning_rate": 4.502916665769749e-06, "loss": 0.8999, "step": 12090 }, { "epoch": 0.23, "learning_rate": 4.502825240827768e-06, "loss": 0.8556, "step": 12091 }, { "epoch": 0.23, "learning_rate": 4.502733808407297e-06, "loss": 0.7615, "step": 12092 }, { "epoch": 0.23, "learning_rate": 4.502642368508681e-06, "loss": 0.9424, "step": 12093 }, { "epoch": 0.23, "learning_rate": 4.502550921132259e-06, "loss": 1.0414, "step": 12094 }, { "epoch": 0.23, "learning_rate": 4.502459466278374e-06, "loss": 0.8491, "step": 12095 }, { "epoch": 0.23, "learning_rate": 4.502368003947366e-06, "loss": 0.8505, "step": 12096 }, { "epoch": 0.23, "learning_rate": 4.502276534139578e-06, "loss": 0.7645, "step": 12097 }, { "epoch": 0.23, "learning_rate": 4.50218505685535e-06, "loss": 0.8642, "step": 12098 }, { "epoch": 0.23, "learning_rate": 4.502093572095024e-06, "loss": 1.0193, "step": 12099 }, { "epoch": 0.23, "learning_rate": 4.502002079858944e-06, "loss": 1.283, "step": 12100 }, { "epoch": 0.23, "learning_rate": 4.501910580147448e-06, "loss": 0.9686, "step": 12101 }, { "epoch": 0.23, "learning_rate": 4.501819072960879e-06, "loss": 1.0203, "step": 12102 }, { "epoch": 0.23, "learning_rate": 4.50172755829958e-06, "loss": 0.9713, "step": 12103 }, { "epoch": 0.23, "learning_rate": 4.501636036163891e-06, "loss": 0.8183, "step": 12104 }, { "epoch": 0.23, "learning_rate": 4.5015445065541555e-06, "loss": 1.1075, "step": 12105 }, { "epoch": 0.23, "learning_rate": 4.501452969470712e-06, "loss": 1.0679, "step": 12106 }, { "epoch": 0.23, "learning_rate": 4.501361424913907e-06, "loss": 0.9747, "step": 12107 }, { "epoch": 0.23, "learning_rate": 4.501269872884078e-06, "loss": 0.8407, "step": 12108 }, { "epoch": 0.23, "learning_rate": 4.5011783133815695e-06, "loss": 0.7515, "step": 12109 }, { "epoch": 0.23, "learning_rate": 4.501086746406722e-06, "loss": 1.1833, "step": 12110 }, { "epoch": 0.23, "learning_rate": 4.500995171959879e-06, "loss": 0.9603, "step": 12111 }, { "epoch": 0.23, "learning_rate": 4.50090359004138e-06, "loss": 1.0147, "step": 12112 }, { "epoch": 0.23, "learning_rate": 4.50081200065157e-06, "loss": 0.9445, "step": 12113 }, { "epoch": 0.23, "learning_rate": 4.500720403790788e-06, "loss": 0.7451, "step": 12114 }, { "epoch": 0.23, "learning_rate": 4.500628799459377e-06, "loss": 1.0053, "step": 12115 }, { "epoch": 0.23, "learning_rate": 4.50053718765768e-06, "loss": 0.8791, "step": 12116 }, { "epoch": 0.23, "learning_rate": 4.500445568386039e-06, "loss": 1.0743, "step": 12117 }, { "epoch": 0.23, "learning_rate": 4.500353941644795e-06, "loss": 1.2404, "step": 12118 }, { "epoch": 0.23, "learning_rate": 4.500262307434291e-06, "loss": 1.1926, "step": 12119 }, { "epoch": 0.23, "learning_rate": 4.5001706657548685e-06, "loss": 1.154, "step": 12120 }, { "epoch": 0.23, "learning_rate": 4.50007901660687e-06, "loss": 0.874, "step": 12121 }, { "epoch": 0.23, "learning_rate": 4.499987359990639e-06, "loss": 0.8949, "step": 12122 }, { "epoch": 0.23, "learning_rate": 4.499895695906515e-06, "loss": 0.9758, "step": 12123 }, { "epoch": 0.23, "learning_rate": 4.499804024354842e-06, "loss": 0.7751, "step": 12124 }, { "epoch": 0.23, "learning_rate": 4.4997123453359626e-06, "loss": 1.1202, "step": 12125 }, { "epoch": 0.23, "learning_rate": 4.499620658850219e-06, "loss": 0.7595, "step": 12126 }, { "epoch": 0.23, "learning_rate": 4.499528964897953e-06, "loss": 0.8015, "step": 12127 }, { "epoch": 0.23, "learning_rate": 4.499437263479506e-06, "loss": 0.9644, "step": 12128 }, { "epoch": 0.23, "learning_rate": 4.499345554595223e-06, "loss": 0.9751, "step": 12129 }, { "epoch": 0.23, "learning_rate": 4.499253838245444e-06, "loss": 0.9858, "step": 12130 }, { "epoch": 0.23, "learning_rate": 4.4991621144305134e-06, "loss": 1.0203, "step": 12131 }, { "epoch": 0.23, "learning_rate": 4.4990703831507715e-06, "loss": 0.8952, "step": 12132 }, { "epoch": 0.23, "learning_rate": 4.498978644406563e-06, "loss": 0.9796, "step": 12133 }, { "epoch": 0.23, "learning_rate": 4.498886898198229e-06, "loss": 0.8571, "step": 12134 }, { "epoch": 0.23, "learning_rate": 4.498795144526113e-06, "loss": 0.9924, "step": 12135 }, { "epoch": 0.23, "learning_rate": 4.498703383390557e-06, "loss": 1.0897, "step": 12136 }, { "epoch": 0.23, "learning_rate": 4.498611614791904e-06, "loss": 1.0228, "step": 12137 }, { "epoch": 0.23, "learning_rate": 4.498519838730496e-06, "loss": 1.174, "step": 12138 }, { "epoch": 0.23, "learning_rate": 4.4984280552066775e-06, "loss": 1.027, "step": 12139 }, { "epoch": 0.23, "learning_rate": 4.4983362642207885e-06, "loss": 0.8966, "step": 12140 }, { "epoch": 0.23, "learning_rate": 4.498244465773174e-06, "loss": 1.0087, "step": 12141 }, { "epoch": 0.23, "learning_rate": 4.498152659864176e-06, "loss": 0.9181, "step": 12142 }, { "epoch": 0.23, "learning_rate": 4.498060846494137e-06, "loss": 1.0077, "step": 12143 }, { "epoch": 0.23, "learning_rate": 4.4979690256634e-06, "loss": 1.1035, "step": 12144 }, { "epoch": 0.23, "learning_rate": 4.497877197372308e-06, "loss": 0.9408, "step": 12145 }, { "epoch": 0.23, "learning_rate": 4.497785361621203e-06, "loss": 0.8843, "step": 12146 }, { "epoch": 0.23, "learning_rate": 4.4976935184104295e-06, "loss": 1.0834, "step": 12147 }, { "epoch": 0.23, "learning_rate": 4.49760166774033e-06, "loss": 0.9615, "step": 12148 }, { "epoch": 0.23, "learning_rate": 4.497509809611247e-06, "loss": 0.9841, "step": 12149 }, { "epoch": 0.23, "learning_rate": 4.497417944023522e-06, "loss": 1.2554, "step": 12150 }, { "epoch": 0.23, "learning_rate": 4.4973260709775015e-06, "loss": 0.9258, "step": 12151 }, { "epoch": 0.23, "learning_rate": 4.497234190473526e-06, "loss": 0.8812, "step": 12152 }, { "epoch": 0.23, "learning_rate": 4.49714230251194e-06, "loss": 0.7974, "step": 12153 }, { "epoch": 0.23, "learning_rate": 4.4970504070930846e-06, "loss": 0.9871, "step": 12154 }, { "epoch": 0.23, "learning_rate": 4.496958504217305e-06, "loss": 0.9604, "step": 12155 }, { "epoch": 0.23, "learning_rate": 4.496866593884944e-06, "loss": 1.0269, "step": 12156 }, { "epoch": 0.23, "learning_rate": 4.496774676096344e-06, "loss": 1.095, "step": 12157 }, { "epoch": 0.23, "learning_rate": 4.496682750851848e-06, "loss": 1.0825, "step": 12158 }, { "epoch": 0.23, "learning_rate": 4.4965908181518e-06, "loss": 1.053, "step": 12159 }, { "epoch": 0.23, "learning_rate": 4.496498877996544e-06, "loss": 0.8718, "step": 12160 }, { "epoch": 0.23, "learning_rate": 4.496406930386421e-06, "loss": 1.0287, "step": 12161 }, { "epoch": 0.23, "learning_rate": 4.496314975321777e-06, "loss": 0.9667, "step": 12162 }, { "epoch": 0.23, "learning_rate": 4.496223012802954e-06, "loss": 1.0402, "step": 12163 }, { "epoch": 0.23, "learning_rate": 4.496131042830294e-06, "loss": 0.7584, "step": 12164 }, { "epoch": 0.23, "learning_rate": 4.496039065404143e-06, "loss": 0.8808, "step": 12165 }, { "epoch": 0.23, "learning_rate": 4.495947080524844e-06, "loss": 0.8038, "step": 12166 }, { "epoch": 0.23, "learning_rate": 4.495855088192739e-06, "loss": 0.8051, "step": 12167 }, { "epoch": 0.23, "learning_rate": 4.495763088408172e-06, "loss": 1.173, "step": 12168 }, { "epoch": 0.23, "learning_rate": 4.495671081171487e-06, "loss": 0.9671, "step": 12169 }, { "epoch": 0.23, "learning_rate": 4.495579066483028e-06, "loss": 0.9884, "step": 12170 }, { "epoch": 0.23, "learning_rate": 4.495487044343138e-06, "loss": 0.9515, "step": 12171 }, { "epoch": 0.23, "learning_rate": 4.4953950147521594e-06, "loss": 1.0741, "step": 12172 }, { "epoch": 0.23, "learning_rate": 4.495302977710437e-06, "loss": 0.7457, "step": 12173 }, { "epoch": 0.23, "learning_rate": 4.4952109332183155e-06, "loss": 1.2816, "step": 12174 }, { "epoch": 0.23, "learning_rate": 4.495118881276137e-06, "loss": 1.2158, "step": 12175 }, { "epoch": 0.23, "learning_rate": 4.4950268218842464e-06, "loss": 0.9111, "step": 12176 }, { "epoch": 0.23, "learning_rate": 4.494934755042986e-06, "loss": 0.8154, "step": 12177 }, { "epoch": 0.23, "learning_rate": 4.494842680752701e-06, "loss": 0.9695, "step": 12178 }, { "epoch": 0.23, "learning_rate": 4.494750599013734e-06, "loss": 0.8049, "step": 12179 }, { "epoch": 0.23, "learning_rate": 4.49465850982643e-06, "loss": 0.9131, "step": 12180 }, { "epoch": 0.23, "learning_rate": 4.4945664131911315e-06, "loss": 1.094, "step": 12181 }, { "epoch": 0.23, "learning_rate": 4.4944743091081845e-06, "loss": 1.072, "step": 12182 }, { "epoch": 0.23, "learning_rate": 4.494382197577931e-06, "loss": 1.0119, "step": 12183 }, { "epoch": 0.23, "learning_rate": 4.494290078600715e-06, "loss": 1.1366, "step": 12184 }, { "epoch": 0.23, "learning_rate": 4.494197952176881e-06, "loss": 0.8354, "step": 12185 }, { "epoch": 0.23, "learning_rate": 4.494105818306773e-06, "loss": 0.8566, "step": 12186 }, { "epoch": 0.23, "learning_rate": 4.494013676990735e-06, "loss": 1.0182, "step": 12187 }, { "epoch": 0.23, "learning_rate": 4.493921528229112e-06, "loss": 0.9888, "step": 12188 }, { "epoch": 0.23, "learning_rate": 4.493829372022247e-06, "loss": 0.9885, "step": 12189 }, { "epoch": 0.23, "learning_rate": 4.493737208370483e-06, "loss": 0.8421, "step": 12190 }, { "epoch": 0.23, "learning_rate": 4.493645037274166e-06, "loss": 0.9397, "step": 12191 }, { "epoch": 0.23, "learning_rate": 4.49355285873364e-06, "loss": 0.7764, "step": 12192 }, { "epoch": 0.23, "learning_rate": 4.493460672749249e-06, "loss": 1.0812, "step": 12193 }, { "epoch": 0.23, "learning_rate": 4.493368479321336e-06, "loss": 1.0145, "step": 12194 }, { "epoch": 0.23, "learning_rate": 4.493276278450247e-06, "loss": 0.899, "step": 12195 }, { "epoch": 0.23, "learning_rate": 4.493184070136325e-06, "loss": 0.9116, "step": 12196 }, { "epoch": 0.23, "learning_rate": 4.493091854379915e-06, "loss": 0.9285, "step": 12197 }, { "epoch": 0.23, "learning_rate": 4.492999631181361e-06, "loss": 0.9332, "step": 12198 }, { "epoch": 0.23, "learning_rate": 4.492907400541008e-06, "loss": 1.0349, "step": 12199 }, { "epoch": 0.23, "learning_rate": 4.492815162459199e-06, "loss": 1.0822, "step": 12200 }, { "epoch": 0.23, "learning_rate": 4.49272291693628e-06, "loss": 0.8781, "step": 12201 }, { "epoch": 0.23, "learning_rate": 4.4926306639725945e-06, "loss": 0.9855, "step": 12202 }, { "epoch": 0.23, "learning_rate": 4.4925384035684864e-06, "loss": 1.1344, "step": 12203 }, { "epoch": 0.23, "learning_rate": 4.492446135724302e-06, "loss": 0.9202, "step": 12204 }, { "epoch": 0.23, "learning_rate": 4.492353860440385e-06, "loss": 1.0429, "step": 12205 }, { "epoch": 0.23, "learning_rate": 4.492261577717079e-06, "loss": 1.269, "step": 12206 }, { "epoch": 0.23, "learning_rate": 4.4921692875547295e-06, "loss": 0.685, "step": 12207 }, { "epoch": 0.23, "learning_rate": 4.492076989953681e-06, "loss": 0.8888, "step": 12208 }, { "epoch": 0.23, "learning_rate": 4.4919846849142775e-06, "loss": 0.7207, "step": 12209 }, { "epoch": 0.23, "learning_rate": 4.491892372436866e-06, "loss": 0.7863, "step": 12210 }, { "epoch": 0.23, "learning_rate": 4.491800052521789e-06, "loss": 1.0071, "step": 12211 }, { "epoch": 0.23, "learning_rate": 4.491707725169391e-06, "loss": 1.1301, "step": 12212 }, { "epoch": 0.23, "learning_rate": 4.491615390380017e-06, "loss": 1.0927, "step": 12213 }, { "epoch": 0.23, "learning_rate": 4.4915230481540125e-06, "loss": 0.8292, "step": 12214 }, { "epoch": 0.23, "learning_rate": 4.491430698491722e-06, "loss": 0.8528, "step": 12215 }, { "epoch": 0.23, "learning_rate": 4.491338341393491e-06, "loss": 0.9908, "step": 12216 }, { "epoch": 0.23, "learning_rate": 4.491245976859663e-06, "loss": 0.7846, "step": 12217 }, { "epoch": 0.23, "learning_rate": 4.491153604890584e-06, "loss": 1.066, "step": 12218 }, { "epoch": 0.23, "learning_rate": 4.491061225486598e-06, "loss": 0.9372, "step": 12219 }, { "epoch": 0.23, "learning_rate": 4.490968838648051e-06, "loss": 1.0435, "step": 12220 }, { "epoch": 0.23, "learning_rate": 4.4908764443752874e-06, "loss": 0.8945, "step": 12221 }, { "epoch": 0.23, "learning_rate": 4.490784042668652e-06, "loss": 0.8793, "step": 12222 }, { "epoch": 0.23, "learning_rate": 4.49069163352849e-06, "loss": 0.991, "step": 12223 }, { "epoch": 0.23, "learning_rate": 4.490599216955146e-06, "loss": 1.0756, "step": 12224 }, { "epoch": 0.23, "learning_rate": 4.490506792948966e-06, "loss": 1.0163, "step": 12225 }, { "epoch": 0.23, "learning_rate": 4.490414361510294e-06, "loss": 0.8717, "step": 12226 }, { "epoch": 0.23, "learning_rate": 4.490321922639477e-06, "loss": 0.9323, "step": 12227 }, { "epoch": 0.23, "learning_rate": 4.4902294763368595e-06, "loss": 0.762, "step": 12228 }, { "epoch": 0.23, "learning_rate": 4.4901370226027845e-06, "loss": 0.8236, "step": 12229 }, { "epoch": 0.23, "learning_rate": 4.4900445614376e-06, "loss": 0.8842, "step": 12230 }, { "epoch": 0.23, "learning_rate": 4.489952092841649e-06, "loss": 0.9167, "step": 12231 }, { "epoch": 0.23, "learning_rate": 4.4898596168152786e-06, "loss": 0.9539, "step": 12232 }, { "epoch": 0.23, "learning_rate": 4.4897671333588335e-06, "loss": 0.9367, "step": 12233 }, { "epoch": 0.23, "learning_rate": 4.4896746424726585e-06, "loss": 0.9732, "step": 12234 }, { "epoch": 0.23, "learning_rate": 4.4895821441571e-06, "loss": 1.0505, "step": 12235 }, { "epoch": 0.23, "learning_rate": 4.489489638412502e-06, "loss": 0.9498, "step": 12236 }, { "epoch": 0.23, "learning_rate": 4.489397125239211e-06, "loss": 1.2971, "step": 12237 }, { "epoch": 0.23, "learning_rate": 4.489304604637572e-06, "loss": 1.165, "step": 12238 }, { "epoch": 0.23, "learning_rate": 4.489212076607931e-06, "loss": 0.9543, "step": 12239 }, { "epoch": 0.23, "learning_rate": 4.4891195411506325e-06, "loss": 0.9431, "step": 12240 }, { "epoch": 0.23, "learning_rate": 4.489026998266024e-06, "loss": 0.7876, "step": 12241 }, { "epoch": 0.23, "learning_rate": 4.488934447954448e-06, "loss": 0.8329, "step": 12242 }, { "epoch": 0.23, "learning_rate": 4.488841890216253e-06, "loss": 1.1639, "step": 12243 }, { "epoch": 0.23, "learning_rate": 4.4887493250517825e-06, "loss": 0.9688, "step": 12244 }, { "epoch": 0.23, "learning_rate": 4.488656752461384e-06, "loss": 1.0653, "step": 12245 }, { "epoch": 0.23, "learning_rate": 4.488564172445401e-06, "loss": 0.9762, "step": 12246 }, { "epoch": 0.23, "learning_rate": 4.48847158500418e-06, "loss": 1.0486, "step": 12247 }, { "epoch": 0.23, "learning_rate": 4.488378990138068e-06, "loss": 0.8063, "step": 12248 }, { "epoch": 0.23, "learning_rate": 4.4882863878474104e-06, "loss": 0.9148, "step": 12249 }, { "epoch": 0.23, "learning_rate": 4.488193778132551e-06, "loss": 1.1442, "step": 12250 }, { "epoch": 0.23, "learning_rate": 4.488101160993838e-06, "loss": 0.9799, "step": 12251 }, { "epoch": 0.23, "learning_rate": 4.488008536431616e-06, "loss": 0.911, "step": 12252 }, { "epoch": 0.23, "learning_rate": 4.487915904446231e-06, "loss": 0.9055, "step": 12253 }, { "epoch": 0.23, "learning_rate": 4.48782326503803e-06, "loss": 0.9267, "step": 12254 }, { "epoch": 0.23, "learning_rate": 4.487730618207356e-06, "loss": 1.0107, "step": 12255 }, { "epoch": 0.23, "learning_rate": 4.487637963954558e-06, "loss": 1.0413, "step": 12256 }, { "epoch": 0.23, "learning_rate": 4.48754530227998e-06, "loss": 0.9061, "step": 12257 }, { "epoch": 0.23, "learning_rate": 4.487452633183969e-06, "loss": 0.9946, "step": 12258 }, { "epoch": 0.23, "learning_rate": 4.487359956666871e-06, "loss": 0.8105, "step": 12259 }, { "epoch": 0.23, "learning_rate": 4.487267272729032e-06, "loss": 0.8696, "step": 12260 }, { "epoch": 0.23, "learning_rate": 4.487174581370798e-06, "loss": 0.9, "step": 12261 }, { "epoch": 0.23, "learning_rate": 4.487081882592515e-06, "loss": 1.1732, "step": 12262 }, { "epoch": 0.23, "learning_rate": 4.4869891763945286e-06, "loss": 1.1463, "step": 12263 }, { "epoch": 0.23, "learning_rate": 4.486896462777186e-06, "loss": 0.8734, "step": 12264 }, { "epoch": 0.23, "learning_rate": 4.486803741740833e-06, "loss": 0.7589, "step": 12265 }, { "epoch": 0.23, "learning_rate": 4.486711013285816e-06, "loss": 1.0921, "step": 12266 }, { "epoch": 0.23, "learning_rate": 4.48661827741248e-06, "loss": 0.84, "step": 12267 }, { "epoch": 0.23, "learning_rate": 4.486525534121173e-06, "loss": 0.9756, "step": 12268 }, { "epoch": 0.23, "learning_rate": 4.486432783412241e-06, "loss": 0.8682, "step": 12269 }, { "epoch": 0.23, "learning_rate": 4.486340025286029e-06, "loss": 0.9783, "step": 12270 }, { "epoch": 0.23, "learning_rate": 4.486247259742884e-06, "loss": 0.991, "step": 12271 }, { "epoch": 0.23, "learning_rate": 4.486154486783154e-06, "loss": 1.0696, "step": 12272 }, { "epoch": 0.23, "learning_rate": 4.486061706407183e-06, "loss": 1.0638, "step": 12273 }, { "epoch": 0.23, "learning_rate": 4.485968918615319e-06, "loss": 1.0972, "step": 12274 }, { "epoch": 0.23, "learning_rate": 4.485876123407907e-06, "loss": 0.9949, "step": 12275 }, { "epoch": 0.23, "learning_rate": 4.485783320785296e-06, "loss": 1.0541, "step": 12276 }, { "epoch": 0.23, "learning_rate": 4.48569051074783e-06, "loss": 0.7059, "step": 12277 }, { "epoch": 0.23, "learning_rate": 4.485597693295857e-06, "loss": 0.9028, "step": 12278 }, { "epoch": 0.23, "learning_rate": 4.485504868429722e-06, "loss": 0.7934, "step": 12279 }, { "epoch": 0.23, "learning_rate": 4.4854120361497735e-06, "loss": 1.0072, "step": 12280 }, { "epoch": 0.23, "learning_rate": 4.4853191964563575e-06, "loss": 1.2651, "step": 12281 }, { "epoch": 0.23, "learning_rate": 4.48522634934982e-06, "loss": 1.1133, "step": 12282 }, { "epoch": 0.23, "learning_rate": 4.485133494830508e-06, "loss": 1.0105, "step": 12283 }, { "epoch": 0.23, "learning_rate": 4.485040632898769e-06, "loss": 0.8907, "step": 12284 }, { "epoch": 0.23, "learning_rate": 4.4849477635549495e-06, "loss": 0.9788, "step": 12285 }, { "epoch": 0.23, "learning_rate": 4.484854886799395e-06, "loss": 0.9379, "step": 12286 }, { "epoch": 0.23, "learning_rate": 4.484762002632453e-06, "loss": 1.1802, "step": 12287 }, { "epoch": 0.23, "learning_rate": 4.484669111054472e-06, "loss": 1.0023, "step": 12288 }, { "epoch": 0.23, "learning_rate": 4.484576212065797e-06, "loss": 0.8863, "step": 12289 }, { "epoch": 0.23, "learning_rate": 4.484483305666774e-06, "loss": 0.9098, "step": 12290 }, { "epoch": 0.23, "learning_rate": 4.484390391857752e-06, "loss": 0.9252, "step": 12291 }, { "epoch": 0.23, "learning_rate": 4.484297470639078e-06, "loss": 0.6793, "step": 12292 }, { "epoch": 0.23, "learning_rate": 4.484204542011096e-06, "loss": 1.0851, "step": 12293 }, { "epoch": 0.23, "learning_rate": 4.484111605974156e-06, "loss": 1.0066, "step": 12294 }, { "epoch": 0.23, "learning_rate": 4.484018662528605e-06, "loss": 1.009, "step": 12295 }, { "epoch": 0.23, "learning_rate": 4.483925711674788e-06, "loss": 0.9504, "step": 12296 }, { "epoch": 0.23, "learning_rate": 4.483832753413055e-06, "loss": 0.8734, "step": 12297 }, { "epoch": 0.23, "learning_rate": 4.4837397877437495e-06, "loss": 0.9415, "step": 12298 }, { "epoch": 0.23, "learning_rate": 4.483646814667221e-06, "loss": 1.1974, "step": 12299 }, { "epoch": 0.23, "learning_rate": 4.483553834183816e-06, "loss": 1.3073, "step": 12300 }, { "epoch": 0.23, "learning_rate": 4.4834608462938815e-06, "loss": 1.0909, "step": 12301 }, { "epoch": 0.23, "learning_rate": 4.483367850997766e-06, "loss": 0.8627, "step": 12302 }, { "epoch": 0.23, "learning_rate": 4.4832748482958146e-06, "loss": 0.8932, "step": 12303 }, { "epoch": 0.23, "learning_rate": 4.483181838188376e-06, "loss": 0.8135, "step": 12304 }, { "epoch": 0.23, "learning_rate": 4.4830888206757985e-06, "loss": 0.9895, "step": 12305 }, { "epoch": 0.23, "learning_rate": 4.482995795758427e-06, "loss": 1.1671, "step": 12306 }, { "epoch": 0.23, "learning_rate": 4.48290276343661e-06, "loss": 1.0339, "step": 12307 }, { "epoch": 0.23, "learning_rate": 4.482809723710695e-06, "loss": 0.7853, "step": 12308 }, { "epoch": 0.23, "learning_rate": 4.482716676581029e-06, "loss": 1.0208, "step": 12309 }, { "epoch": 0.23, "learning_rate": 4.48262362204796e-06, "loss": 0.7776, "step": 12310 }, { "epoch": 0.23, "learning_rate": 4.482530560111835e-06, "loss": 0.8998, "step": 12311 }, { "epoch": 0.23, "learning_rate": 4.482437490773002e-06, "loss": 1.1902, "step": 12312 }, { "epoch": 0.23, "learning_rate": 4.4823444140318084e-06, "loss": 0.967, "step": 12313 }, { "epoch": 0.23, "learning_rate": 4.482251329888601e-06, "loss": 1.0115, "step": 12314 }, { "epoch": 0.23, "learning_rate": 4.482158238343728e-06, "loss": 1.0618, "step": 12315 }, { "epoch": 0.23, "learning_rate": 4.482065139397538e-06, "loss": 0.8986, "step": 12316 }, { "epoch": 0.23, "learning_rate": 4.481972033050376e-06, "loss": 0.8205, "step": 12317 }, { "epoch": 0.23, "learning_rate": 4.481878919302592e-06, "loss": 1.239, "step": 12318 }, { "epoch": 0.23, "learning_rate": 4.481785798154532e-06, "loss": 1.0256, "step": 12319 }, { "epoch": 0.23, "learning_rate": 4.481692669606545e-06, "loss": 0.899, "step": 12320 }, { "epoch": 0.23, "learning_rate": 4.481599533658979e-06, "loss": 1.0278, "step": 12321 }, { "epoch": 0.23, "learning_rate": 4.4815063903121815e-06, "loss": 0.915, "step": 12322 }, { "epoch": 0.23, "learning_rate": 4.481413239566499e-06, "loss": 1.1147, "step": 12323 }, { "epoch": 0.23, "learning_rate": 4.48132008142228e-06, "loss": 0.8928, "step": 12324 }, { "epoch": 0.23, "learning_rate": 4.481226915879872e-06, "loss": 1.0408, "step": 12325 }, { "epoch": 0.23, "learning_rate": 4.4811337429396255e-06, "loss": 0.8222, "step": 12326 }, { "epoch": 0.23, "learning_rate": 4.481040562601885e-06, "loss": 0.9211, "step": 12327 }, { "epoch": 0.23, "learning_rate": 4.480947374867e-06, "loss": 0.8341, "step": 12328 }, { "epoch": 0.23, "learning_rate": 4.480854179735317e-06, "loss": 0.8625, "step": 12329 }, { "epoch": 0.23, "learning_rate": 4.4807609772071865e-06, "loss": 0.97, "step": 12330 }, { "epoch": 0.23, "learning_rate": 4.480667767282955e-06, "loss": 1.1227, "step": 12331 }, { "epoch": 0.23, "learning_rate": 4.480574549962971e-06, "loss": 0.9868, "step": 12332 }, { "epoch": 0.23, "learning_rate": 4.480481325247583e-06, "loss": 0.878, "step": 12333 }, { "epoch": 0.23, "learning_rate": 4.480388093137138e-06, "loss": 1.1202, "step": 12334 }, { "epoch": 0.23, "learning_rate": 4.480294853631984e-06, "loss": 0.8277, "step": 12335 }, { "epoch": 0.23, "learning_rate": 4.480201606732471e-06, "loss": 0.8359, "step": 12336 }, { "epoch": 0.23, "learning_rate": 4.480108352438945e-06, "loss": 0.9324, "step": 12337 }, { "epoch": 0.23, "learning_rate": 4.480015090751754e-06, "loss": 0.9896, "step": 12338 }, { "epoch": 0.23, "learning_rate": 4.479921821671249e-06, "loss": 0.7426, "step": 12339 }, { "epoch": 0.23, "learning_rate": 4.479828545197776e-06, "loss": 1.1329, "step": 12340 }, { "epoch": 0.23, "learning_rate": 4.479735261331683e-06, "loss": 0.8595, "step": 12341 }, { "epoch": 0.23, "learning_rate": 4.479641970073321e-06, "loss": 1.0289, "step": 12342 }, { "epoch": 0.23, "learning_rate": 4.4795486714230355e-06, "loss": 0.9413, "step": 12343 }, { "epoch": 0.23, "learning_rate": 4.4794553653811765e-06, "loss": 1.0448, "step": 12344 }, { "epoch": 0.23, "learning_rate": 4.479362051948092e-06, "loss": 0.8157, "step": 12345 }, { "epoch": 0.23, "learning_rate": 4.47926873112413e-06, "loss": 1.0291, "step": 12346 }, { "epoch": 0.23, "learning_rate": 4.4791754029096394e-06, "loss": 0.9353, "step": 12347 }, { "epoch": 0.23, "learning_rate": 4.479082067304967e-06, "loss": 1.027, "step": 12348 }, { "epoch": 0.23, "learning_rate": 4.478988724310465e-06, "loss": 0.9139, "step": 12349 }, { "epoch": 0.23, "learning_rate": 4.478895373926478e-06, "loss": 0.8985, "step": 12350 }, { "epoch": 0.23, "learning_rate": 4.478802016153358e-06, "loss": 1.1091, "step": 12351 }, { "epoch": 0.23, "learning_rate": 4.478708650991451e-06, "loss": 1.1554, "step": 12352 }, { "epoch": 0.23, "learning_rate": 4.478615278441107e-06, "loss": 1.0361, "step": 12353 }, { "epoch": 0.23, "learning_rate": 4.478521898502674e-06, "loss": 0.8787, "step": 12354 }, { "epoch": 0.23, "learning_rate": 4.4784285111765004e-06, "loss": 0.8118, "step": 12355 }, { "epoch": 0.23, "learning_rate": 4.478335116462936e-06, "loss": 1.1823, "step": 12356 }, { "epoch": 0.23, "learning_rate": 4.4782417143623294e-06, "loss": 1.0966, "step": 12357 }, { "epoch": 0.23, "learning_rate": 4.478148304875028e-06, "loss": 1.111, "step": 12358 }, { "epoch": 0.23, "learning_rate": 4.478054888001382e-06, "loss": 0.6586, "step": 12359 }, { "epoch": 0.23, "learning_rate": 4.477961463741739e-06, "loss": 1.0163, "step": 12360 }, { "epoch": 0.23, "learning_rate": 4.477868032096449e-06, "loss": 1.0673, "step": 12361 }, { "epoch": 0.23, "learning_rate": 4.47777459306586e-06, "loss": 1.3163, "step": 12362 }, { "epoch": 0.23, "learning_rate": 4.477681146650323e-06, "loss": 1.1531, "step": 12363 }, { "epoch": 0.23, "learning_rate": 4.477587692850183e-06, "loss": 0.8418, "step": 12364 }, { "epoch": 0.23, "learning_rate": 4.477494231665792e-06, "loss": 0.9978, "step": 12365 }, { "epoch": 0.23, "learning_rate": 4.477400763097499e-06, "loss": 1.2, "step": 12366 }, { "epoch": 0.23, "learning_rate": 4.477307287145652e-06, "loss": 0.9377, "step": 12367 }, { "epoch": 0.23, "learning_rate": 4.477213803810599e-06, "loss": 1.4125, "step": 12368 }, { "epoch": 0.23, "learning_rate": 4.477120313092691e-06, "loss": 1.0389, "step": 12369 }, { "epoch": 0.23, "learning_rate": 4.477026814992276e-06, "loss": 0.892, "step": 12370 }, { "epoch": 0.23, "learning_rate": 4.4769333095097045e-06, "loss": 1.0325, "step": 12371 }, { "epoch": 0.23, "learning_rate": 4.476839796645324e-06, "loss": 1.0429, "step": 12372 }, { "epoch": 0.23, "learning_rate": 4.476746276399484e-06, "loss": 0.7052, "step": 12373 }, { "epoch": 0.23, "learning_rate": 4.476652748772534e-06, "loss": 1.1234, "step": 12374 }, { "epoch": 0.23, "learning_rate": 4.476559213764824e-06, "loss": 1.1215, "step": 12375 }, { "epoch": 0.23, "learning_rate": 4.476465671376702e-06, "loss": 1.1141, "step": 12376 }, { "epoch": 0.23, "learning_rate": 4.476372121608518e-06, "loss": 1.0317, "step": 12377 }, { "epoch": 0.23, "learning_rate": 4.476278564460621e-06, "loss": 0.9136, "step": 12378 }, { "epoch": 0.23, "learning_rate": 4.47618499993336e-06, "loss": 0.8486, "step": 12379 }, { "epoch": 0.23, "learning_rate": 4.476091428027085e-06, "loss": 0.9568, "step": 12380 }, { "epoch": 0.23, "learning_rate": 4.4759978487421455e-06, "loss": 1.1396, "step": 12381 }, { "epoch": 0.23, "learning_rate": 4.47590426207889e-06, "loss": 0.962, "step": 12382 }, { "epoch": 0.23, "learning_rate": 4.47581066803767e-06, "loss": 0.8774, "step": 12383 }, { "epoch": 0.23, "learning_rate": 4.475717066618832e-06, "loss": 0.7845, "step": 12384 }, { "epoch": 0.23, "learning_rate": 4.475623457822728e-06, "loss": 0.8063, "step": 12385 }, { "epoch": 0.23, "learning_rate": 4.475529841649706e-06, "loss": 1.0184, "step": 12386 }, { "epoch": 0.23, "learning_rate": 4.475436218100116e-06, "loss": 1.0405, "step": 12387 }, { "epoch": 0.23, "learning_rate": 4.475342587174308e-06, "loss": 0.8509, "step": 12388 }, { "epoch": 0.23, "learning_rate": 4.475248948872632e-06, "loss": 0.9757, "step": 12389 }, { "epoch": 0.23, "learning_rate": 4.475155303195436e-06, "loss": 0.9178, "step": 12390 }, { "epoch": 0.23, "learning_rate": 4.475061650143072e-06, "loss": 0.9806, "step": 12391 }, { "epoch": 0.23, "learning_rate": 4.474967989715887e-06, "loss": 0.905, "step": 12392 }, { "epoch": 0.23, "learning_rate": 4.474874321914232e-06, "loss": 1.1292, "step": 12393 }, { "epoch": 0.23, "learning_rate": 4.474780646738458e-06, "loss": 0.9923, "step": 12394 }, { "epoch": 0.23, "learning_rate": 4.474686964188913e-06, "loss": 0.702, "step": 12395 }, { "epoch": 0.23, "learning_rate": 4.4745932742659474e-06, "loss": 0.8847, "step": 12396 }, { "epoch": 0.23, "learning_rate": 4.474499576969911e-06, "loss": 1.0789, "step": 12397 }, { "epoch": 0.23, "learning_rate": 4.474405872301153e-06, "loss": 0.8624, "step": 12398 }, { "epoch": 0.23, "learning_rate": 4.474312160260026e-06, "loss": 1.0632, "step": 12399 }, { "epoch": 0.23, "learning_rate": 4.474218440846876e-06, "loss": 1.188, "step": 12400 }, { "epoch": 0.23, "learning_rate": 4.474124714062056e-06, "loss": 0.9069, "step": 12401 }, { "epoch": 0.23, "learning_rate": 4.474030979905914e-06, "loss": 0.8825, "step": 12402 }, { "epoch": 0.23, "learning_rate": 4.473937238378802e-06, "loss": 0.7886, "step": 12403 }, { "epoch": 0.23, "learning_rate": 4.473843489481068e-06, "loss": 0.7952, "step": 12404 }, { "epoch": 0.23, "learning_rate": 4.4737497332130634e-06, "loss": 0.8544, "step": 12405 }, { "epoch": 0.23, "learning_rate": 4.473655969575137e-06, "loss": 0.9278, "step": 12406 }, { "epoch": 0.23, "learning_rate": 4.47356219856764e-06, "loss": 1.1327, "step": 12407 }, { "epoch": 0.23, "learning_rate": 4.473468420190922e-06, "loss": 0.7834, "step": 12408 }, { "epoch": 0.23, "learning_rate": 4.473374634445335e-06, "loss": 0.8869, "step": 12409 }, { "epoch": 0.23, "learning_rate": 4.473280841331226e-06, "loss": 0.685, "step": 12410 }, { "epoch": 0.23, "learning_rate": 4.4731870408489475e-06, "loss": 0.8262, "step": 12411 }, { "epoch": 0.23, "learning_rate": 4.473093232998849e-06, "loss": 1.1297, "step": 12412 }, { "epoch": 0.23, "learning_rate": 4.47299941778128e-06, "loss": 1.1016, "step": 12413 }, { "epoch": 0.23, "learning_rate": 4.472905595196593e-06, "loss": 1.1377, "step": 12414 }, { "epoch": 0.23, "learning_rate": 4.472811765245136e-06, "loss": 1.048, "step": 12415 }, { "epoch": 0.23, "learning_rate": 4.472717927927261e-06, "loss": 0.9786, "step": 12416 }, { "epoch": 0.23, "learning_rate": 4.472624083243317e-06, "loss": 0.9703, "step": 12417 }, { "epoch": 0.23, "learning_rate": 4.472530231193657e-06, "loss": 1.0458, "step": 12418 }, { "epoch": 0.23, "learning_rate": 4.472436371778628e-06, "loss": 1.0132, "step": 12419 }, { "epoch": 0.23, "learning_rate": 4.472342504998583e-06, "loss": 0.8735, "step": 12420 }, { "epoch": 0.23, "learning_rate": 4.472248630853871e-06, "loss": 1.0224, "step": 12421 }, { "epoch": 0.23, "learning_rate": 4.4721547493448426e-06, "loss": 1.0273, "step": 12422 }, { "epoch": 0.23, "learning_rate": 4.472060860471849e-06, "loss": 0.9083, "step": 12423 }, { "epoch": 0.23, "learning_rate": 4.471966964235241e-06, "loss": 1.0201, "step": 12424 }, { "epoch": 0.23, "learning_rate": 4.471873060635368e-06, "loss": 1.0268, "step": 12425 }, { "epoch": 0.23, "learning_rate": 4.471779149672583e-06, "loss": 0.8915, "step": 12426 }, { "epoch": 0.23, "learning_rate": 4.471685231347234e-06, "loss": 0.9256, "step": 12427 }, { "epoch": 0.23, "learning_rate": 4.4715913056596724e-06, "loss": 0.9593, "step": 12428 }, { "epoch": 0.23, "learning_rate": 4.4714973726102505e-06, "loss": 0.8426, "step": 12429 }, { "epoch": 0.23, "learning_rate": 4.471403432199317e-06, "loss": 0.9312, "step": 12430 }, { "epoch": 0.23, "learning_rate": 4.471309484427224e-06, "loss": 1.1666, "step": 12431 }, { "epoch": 0.23, "learning_rate": 4.4712155292943215e-06, "loss": 0.8407, "step": 12432 }, { "epoch": 0.23, "learning_rate": 4.471121566800961e-06, "loss": 0.7686, "step": 12433 }, { "epoch": 0.23, "learning_rate": 4.471027596947493e-06, "loss": 1.0103, "step": 12434 }, { "epoch": 0.23, "learning_rate": 4.470933619734268e-06, "loss": 0.8251, "step": 12435 }, { "epoch": 0.23, "learning_rate": 4.470839635161638e-06, "loss": 1.082, "step": 12436 }, { "epoch": 0.23, "learning_rate": 4.470745643229953e-06, "loss": 1.1784, "step": 12437 }, { "epoch": 0.23, "learning_rate": 4.470651643939564e-06, "loss": 0.9648, "step": 12438 }, { "epoch": 0.23, "learning_rate": 4.4705576372908215e-06, "loss": 1.0878, "step": 12439 }, { "epoch": 0.23, "learning_rate": 4.470463623284078e-06, "loss": 0.8859, "step": 12440 }, { "epoch": 0.23, "learning_rate": 4.4703696019196836e-06, "loss": 0.7926, "step": 12441 }, { "epoch": 0.23, "learning_rate": 4.470275573197989e-06, "loss": 0.8739, "step": 12442 }, { "epoch": 0.23, "learning_rate": 4.470181537119347e-06, "loss": 0.9573, "step": 12443 }, { "epoch": 0.23, "learning_rate": 4.470087493684106e-06, "loss": 1.1668, "step": 12444 }, { "epoch": 0.23, "learning_rate": 4.46999344289262e-06, "loss": 1.0507, "step": 12445 }, { "epoch": 0.23, "learning_rate": 4.469899384745239e-06, "loss": 0.858, "step": 12446 }, { "epoch": 0.23, "learning_rate": 4.469805319242313e-06, "loss": 0.915, "step": 12447 }, { "epoch": 0.23, "learning_rate": 4.469711246384196e-06, "loss": 1.0414, "step": 12448 }, { "epoch": 0.23, "learning_rate": 4.4696171661712355e-06, "loss": 1.085, "step": 12449 }, { "epoch": 0.23, "learning_rate": 4.469523078603786e-06, "loss": 1.0938, "step": 12450 }, { "epoch": 0.23, "learning_rate": 4.469428983682198e-06, "loss": 0.7517, "step": 12451 }, { "epoch": 0.23, "learning_rate": 4.469334881406822e-06, "loss": 0.9249, "step": 12452 }, { "epoch": 0.23, "learning_rate": 4.469240771778009e-06, "loss": 0.9885, "step": 12453 }, { "epoch": 0.23, "learning_rate": 4.469146654796113e-06, "loss": 1.074, "step": 12454 }, { "epoch": 0.23, "learning_rate": 4.4690525304614835e-06, "loss": 0.9348, "step": 12455 }, { "epoch": 0.24, "learning_rate": 4.468958398774472e-06, "loss": 0.9613, "step": 12456 }, { "epoch": 0.24, "learning_rate": 4.46886425973543e-06, "loss": 0.8238, "step": 12457 }, { "epoch": 0.24, "learning_rate": 4.468770113344709e-06, "loss": 1.0151, "step": 12458 }, { "epoch": 0.24, "learning_rate": 4.468675959602661e-06, "loss": 1.085, "step": 12459 }, { "epoch": 0.24, "learning_rate": 4.468581798509638e-06, "loss": 0.8795, "step": 12460 }, { "epoch": 0.24, "learning_rate": 4.4684876300659905e-06, "loss": 0.8827, "step": 12461 }, { "epoch": 0.24, "learning_rate": 4.46839345427207e-06, "loss": 0.8556, "step": 12462 }, { "epoch": 0.24, "learning_rate": 4.468299271128229e-06, "loss": 1.1865, "step": 12463 }, { "epoch": 0.24, "learning_rate": 4.468205080634819e-06, "loss": 0.9741, "step": 12464 }, { "epoch": 0.24, "learning_rate": 4.468110882792192e-06, "loss": 0.9977, "step": 12465 }, { "epoch": 0.24, "learning_rate": 4.4680166776006985e-06, "loss": 0.9039, "step": 12466 }, { "epoch": 0.24, "learning_rate": 4.467922465060691e-06, "loss": 0.7892, "step": 12467 }, { "epoch": 0.24, "learning_rate": 4.467828245172522e-06, "loss": 1.0654, "step": 12468 }, { "epoch": 0.24, "learning_rate": 4.467734017936543e-06, "loss": 1.0528, "step": 12469 }, { "epoch": 0.24, "learning_rate": 4.4676397833531045e-06, "loss": 0.9178, "step": 12470 }, { "epoch": 0.24, "learning_rate": 4.46754554142256e-06, "loss": 1.0089, "step": 12471 }, { "epoch": 0.24, "learning_rate": 4.467451292145261e-06, "loss": 0.8688, "step": 12472 }, { "epoch": 0.24, "learning_rate": 4.467357035521558e-06, "loss": 0.8446, "step": 12473 }, { "epoch": 0.24, "learning_rate": 4.467262771551805e-06, "loss": 1.0776, "step": 12474 }, { "epoch": 0.24, "learning_rate": 4.4671685002363525e-06, "loss": 1.0877, "step": 12475 }, { "epoch": 0.24, "learning_rate": 4.467074221575555e-06, "loss": 0.8087, "step": 12476 }, { "epoch": 0.24, "learning_rate": 4.4669799355697604e-06, "loss": 0.9046, "step": 12477 }, { "epoch": 0.24, "learning_rate": 4.466885642219324e-06, "loss": 0.9297, "step": 12478 }, { "epoch": 0.24, "learning_rate": 4.466791341524597e-06, "loss": 0.8289, "step": 12479 }, { "epoch": 0.24, "learning_rate": 4.4666970334859315e-06, "loss": 1.015, "step": 12480 }, { "epoch": 0.24, "learning_rate": 4.466602718103679e-06, "loss": 1.0241, "step": 12481 }, { "epoch": 0.24, "learning_rate": 4.466508395378193e-06, "loss": 0.9377, "step": 12482 }, { "epoch": 0.24, "learning_rate": 4.466414065309824e-06, "loss": 1.0049, "step": 12483 }, { "epoch": 0.24, "learning_rate": 4.466319727898926e-06, "loss": 1.0893, "step": 12484 }, { "epoch": 0.24, "learning_rate": 4.4662253831458506e-06, "loss": 1.0529, "step": 12485 }, { "epoch": 0.24, "learning_rate": 4.46613103105095e-06, "loss": 1.0026, "step": 12486 }, { "epoch": 0.24, "learning_rate": 4.466036671614576e-06, "loss": 0.9955, "step": 12487 }, { "epoch": 0.24, "learning_rate": 4.465942304837081e-06, "loss": 0.9711, "step": 12488 }, { "epoch": 0.24, "learning_rate": 4.465847930718818e-06, "loss": 0.9567, "step": 12489 }, { "epoch": 0.24, "learning_rate": 4.465753549260139e-06, "loss": 1.0319, "step": 12490 }, { "epoch": 0.24, "learning_rate": 4.465659160461396e-06, "loss": 0.9415, "step": 12491 }, { "epoch": 0.24, "learning_rate": 4.465564764322943e-06, "loss": 1.1025, "step": 12492 }, { "epoch": 0.24, "learning_rate": 4.465470360845131e-06, "loss": 1.1547, "step": 12493 }, { "epoch": 0.24, "learning_rate": 4.465375950028313e-06, "loss": 1.1276, "step": 12494 }, { "epoch": 0.24, "learning_rate": 4.4652815318728415e-06, "loss": 1.0254, "step": 12495 }, { "epoch": 0.24, "learning_rate": 4.465187106379069e-06, "loss": 0.8885, "step": 12496 }, { "epoch": 0.24, "learning_rate": 4.4650926735473474e-06, "loss": 0.8291, "step": 12497 }, { "epoch": 0.24, "learning_rate": 4.46499823337803e-06, "loss": 0.8862, "step": 12498 }, { "epoch": 0.24, "learning_rate": 4.464903785871471e-06, "loss": 0.9359, "step": 12499 }, { "epoch": 0.24, "learning_rate": 4.464809331028021e-06, "loss": 1.0764, "step": 12500 }, { "epoch": 0.24, "learning_rate": 4.464714868848032e-06, "loss": 0.9847, "step": 12501 }, { "epoch": 0.24, "learning_rate": 4.4646203993318594e-06, "loss": 0.8084, "step": 12502 }, { "epoch": 0.24, "learning_rate": 4.4645259224798535e-06, "loss": 0.9195, "step": 12503 }, { "epoch": 0.24, "learning_rate": 4.4644314382923686e-06, "loss": 0.7317, "step": 12504 }, { "epoch": 0.24, "learning_rate": 4.464336946769756e-06, "loss": 1.1198, "step": 12505 }, { "epoch": 0.24, "learning_rate": 4.46424244791237e-06, "loss": 1.1478, "step": 12506 }, { "epoch": 0.24, "learning_rate": 4.464147941720564e-06, "loss": 1.0641, "step": 12507 }, { "epoch": 0.24, "learning_rate": 4.464053428194688e-06, "loss": 0.9509, "step": 12508 }, { "epoch": 0.24, "learning_rate": 4.463958907335097e-06, "loss": 0.9286, "step": 12509 }, { "epoch": 0.24, "learning_rate": 4.463864379142145e-06, "loss": 0.798, "step": 12510 }, { "epoch": 0.24, "learning_rate": 4.463769843616183e-06, "loss": 1.1809, "step": 12511 }, { "epoch": 0.24, "learning_rate": 4.463675300757564e-06, "loss": 1.4047, "step": 12512 }, { "epoch": 0.24, "learning_rate": 4.463580750566643e-06, "loss": 1.0224, "step": 12513 }, { "epoch": 0.24, "learning_rate": 4.46348619304377e-06, "loss": 0.8723, "step": 12514 }, { "epoch": 0.24, "learning_rate": 4.463391628189301e-06, "loss": 0.9818, "step": 12515 }, { "epoch": 0.24, "learning_rate": 4.463297056003587e-06, "loss": 0.9677, "step": 12516 }, { "epoch": 0.24, "learning_rate": 4.463202476486982e-06, "loss": 0.7845, "step": 12517 }, { "epoch": 0.24, "learning_rate": 4.463107889639841e-06, "loss": 1.0186, "step": 12518 }, { "epoch": 0.24, "learning_rate": 4.463013295462513e-06, "loss": 1.0133, "step": 12519 }, { "epoch": 0.24, "learning_rate": 4.462918693955354e-06, "loss": 1.0722, "step": 12520 }, { "epoch": 0.24, "learning_rate": 4.4628240851187175e-06, "loss": 0.9231, "step": 12521 }, { "epoch": 0.24, "learning_rate": 4.4627294689529555e-06, "loss": 0.9288, "step": 12522 }, { "epoch": 0.24, "learning_rate": 4.462634845458422e-06, "loss": 0.9172, "step": 12523 }, { "epoch": 0.24, "learning_rate": 4.462540214635471e-06, "loss": 1.0588, "step": 12524 }, { "epoch": 0.24, "learning_rate": 4.462445576484454e-06, "loss": 1.073, "step": 12525 }, { "epoch": 0.24, "learning_rate": 4.462350931005726e-06, "loss": 1.0193, "step": 12526 }, { "epoch": 0.24, "learning_rate": 4.462256278199639e-06, "loss": 0.8484, "step": 12527 }, { "epoch": 0.24, "learning_rate": 4.462161618066547e-06, "loss": 0.8416, "step": 12528 }, { "epoch": 0.24, "learning_rate": 4.462066950606805e-06, "loss": 0.8062, "step": 12529 }, { "epoch": 0.24, "learning_rate": 4.461972275820764e-06, "loss": 0.8849, "step": 12530 }, { "epoch": 0.24, "learning_rate": 4.46187759370878e-06, "loss": 0.9064, "step": 12531 }, { "epoch": 0.24, "learning_rate": 4.461782904271204e-06, "loss": 0.9838, "step": 12532 }, { "epoch": 0.24, "learning_rate": 4.461688207508391e-06, "loss": 0.846, "step": 12533 }, { "epoch": 0.24, "learning_rate": 4.461593503420695e-06, "loss": 1.0729, "step": 12534 }, { "epoch": 0.24, "learning_rate": 4.461498792008469e-06, "loss": 0.9785, "step": 12535 }, { "epoch": 0.24, "learning_rate": 4.461404073272065e-06, "loss": 0.9113, "step": 12536 }, { "epoch": 0.24, "learning_rate": 4.46130934721184e-06, "loss": 1.038, "step": 12537 }, { "epoch": 0.24, "learning_rate": 4.461214613828145e-06, "loss": 0.9021, "step": 12538 }, { "epoch": 0.24, "learning_rate": 4.461119873121336e-06, "loss": 0.7744, "step": 12539 }, { "epoch": 0.24, "learning_rate": 4.461025125091765e-06, "loss": 0.9224, "step": 12540 }, { "epoch": 0.24, "learning_rate": 4.460930369739785e-06, "loss": 0.9039, "step": 12541 }, { "epoch": 0.24, "learning_rate": 4.460835607065753e-06, "loss": 0.9389, "step": 12542 }, { "epoch": 0.24, "learning_rate": 4.46074083707002e-06, "loss": 1.0046, "step": 12543 }, { "epoch": 0.24, "learning_rate": 4.460646059752941e-06, "loss": 1.1252, "step": 12544 }, { "epoch": 0.24, "learning_rate": 4.460551275114871e-06, "loss": 0.8877, "step": 12545 }, { "epoch": 0.24, "learning_rate": 4.46045648315616e-06, "loss": 1.0126, "step": 12546 }, { "epoch": 0.24, "learning_rate": 4.460361683877167e-06, "loss": 0.8279, "step": 12547 }, { "epoch": 0.24, "learning_rate": 4.460266877278242e-06, "loss": 0.9157, "step": 12548 }, { "epoch": 0.24, "learning_rate": 4.460172063359741e-06, "loss": 1.0827, "step": 12549 }, { "epoch": 0.24, "learning_rate": 4.460077242122019e-06, "loss": 1.0255, "step": 12550 }, { "epoch": 0.24, "learning_rate": 4.459982413565427e-06, "loss": 1.001, "step": 12551 }, { "epoch": 0.24, "learning_rate": 4.459887577690321e-06, "loss": 0.8588, "step": 12552 }, { "epoch": 0.24, "learning_rate": 4.459792734497055e-06, "loss": 0.9944, "step": 12553 }, { "epoch": 0.24, "learning_rate": 4.4596978839859835e-06, "loss": 0.8559, "step": 12554 }, { "epoch": 0.24, "learning_rate": 4.459603026157459e-06, "loss": 1.0941, "step": 12555 }, { "epoch": 0.24, "learning_rate": 4.459508161011839e-06, "loss": 1.0577, "step": 12556 }, { "epoch": 0.24, "learning_rate": 4.459413288549474e-06, "loss": 1.1182, "step": 12557 }, { "epoch": 0.24, "learning_rate": 4.45931840877072e-06, "loss": 0.918, "step": 12558 }, { "epoch": 0.24, "learning_rate": 4.459223521675932e-06, "loss": 1.0647, "step": 12559 }, { "epoch": 0.24, "learning_rate": 4.459128627265462e-06, "loss": 1.0329, "step": 12560 }, { "epoch": 0.24, "learning_rate": 4.459033725539666e-06, "loss": 0.8069, "step": 12561 }, { "epoch": 0.24, "learning_rate": 4.4589388164989e-06, "loss": 1.04, "step": 12562 }, { "epoch": 0.24, "learning_rate": 4.4588439001435145e-06, "loss": 1.0451, "step": 12563 }, { "epoch": 0.24, "learning_rate": 4.458748976473867e-06, "loss": 1.0115, "step": 12564 }, { "epoch": 0.24, "learning_rate": 4.45865404549031e-06, "loss": 0.9323, "step": 12565 }, { "epoch": 0.24, "learning_rate": 4.4585591071932e-06, "loss": 0.8703, "step": 12566 }, { "epoch": 0.24, "learning_rate": 4.45846416158289e-06, "loss": 0.8632, "step": 12567 }, { "epoch": 0.24, "learning_rate": 4.458369208659734e-06, "loss": 1.0872, "step": 12568 }, { "epoch": 0.24, "learning_rate": 4.458274248424088e-06, "loss": 1.2874, "step": 12569 }, { "epoch": 0.24, "learning_rate": 4.458179280876306e-06, "loss": 1.0663, "step": 12570 }, { "epoch": 0.24, "learning_rate": 4.458084306016743e-06, "loss": 1.0615, "step": 12571 }, { "epoch": 0.24, "learning_rate": 4.457989323845752e-06, "loss": 0.9567, "step": 12572 }, { "epoch": 0.24, "learning_rate": 4.457894334363691e-06, "loss": 0.9453, "step": 12573 }, { "epoch": 0.24, "learning_rate": 4.457799337570911e-06, "loss": 0.8807, "step": 12574 }, { "epoch": 0.24, "learning_rate": 4.457704333467768e-06, "loss": 0.9588, "step": 12575 }, { "epoch": 0.24, "learning_rate": 4.4576093220546176e-06, "loss": 0.8415, "step": 12576 }, { "epoch": 0.24, "learning_rate": 4.457514303331814e-06, "loss": 1.1174, "step": 12577 }, { "epoch": 0.24, "learning_rate": 4.457419277299712e-06, "loss": 0.9286, "step": 12578 }, { "epoch": 0.24, "learning_rate": 4.457324243958666e-06, "loss": 0.7658, "step": 12579 }, { "epoch": 0.24, "learning_rate": 4.457229203309033e-06, "loss": 0.9364, "step": 12580 }, { "epoch": 0.24, "learning_rate": 4.457134155351165e-06, "loss": 1.1826, "step": 12581 }, { "epoch": 0.24, "learning_rate": 4.457039100085417e-06, "loss": 1.0821, "step": 12582 }, { "epoch": 0.24, "learning_rate": 4.456944037512147e-06, "loss": 0.805, "step": 12583 }, { "epoch": 0.24, "learning_rate": 4.456848967631707e-06, "loss": 0.907, "step": 12584 }, { "epoch": 0.24, "learning_rate": 4.456753890444452e-06, "loss": 1.0745, "step": 12585 }, { "epoch": 0.24, "learning_rate": 4.45665880595074e-06, "loss": 1.1457, "step": 12586 }, { "epoch": 0.24, "learning_rate": 4.456563714150922e-06, "loss": 1.1499, "step": 12587 }, { "epoch": 0.24, "learning_rate": 4.456468615045356e-06, "loss": 1.2314, "step": 12588 }, { "epoch": 0.24, "learning_rate": 4.456373508634397e-06, "loss": 0.969, "step": 12589 }, { "epoch": 0.24, "learning_rate": 4.456278394918398e-06, "loss": 0.6375, "step": 12590 }, { "epoch": 0.24, "learning_rate": 4.4561832738977164e-06, "loss": 0.8526, "step": 12591 }, { "epoch": 0.24, "learning_rate": 4.456088145572705e-06, "loss": 0.9341, "step": 12592 }, { "epoch": 0.24, "learning_rate": 4.455993009943722e-06, "loss": 1.1373, "step": 12593 }, { "epoch": 0.24, "learning_rate": 4.455897867011121e-06, "loss": 1.0493, "step": 12594 }, { "epoch": 0.24, "learning_rate": 4.455802716775257e-06, "loss": 1.1137, "step": 12595 }, { "epoch": 0.24, "learning_rate": 4.455707559236485e-06, "loss": 0.8714, "step": 12596 }, { "epoch": 0.24, "learning_rate": 4.455612394395161e-06, "loss": 0.8831, "step": 12597 }, { "epoch": 0.24, "learning_rate": 4.455517222251642e-06, "loss": 0.8423, "step": 12598 }, { "epoch": 0.24, "learning_rate": 4.455422042806279e-06, "loss": 1.2034, "step": 12599 }, { "epoch": 0.24, "learning_rate": 4.4553268560594324e-06, "loss": 1.1372, "step": 12600 }, { "epoch": 0.24, "learning_rate": 4.455231662011454e-06, "loss": 1.1428, "step": 12601 }, { "epoch": 0.24, "learning_rate": 4.4551364606627e-06, "loss": 0.8925, "step": 12602 }, { "epoch": 0.24, "learning_rate": 4.455041252013528e-06, "loss": 0.8799, "step": 12603 }, { "epoch": 0.24, "learning_rate": 4.454946036064291e-06, "loss": 0.8788, "step": 12604 }, { "epoch": 0.24, "learning_rate": 4.454850812815345e-06, "loss": 1.122, "step": 12605 }, { "epoch": 0.24, "learning_rate": 4.454755582267046e-06, "loss": 1.2032, "step": 12606 }, { "epoch": 0.24, "learning_rate": 4.4546603444197514e-06, "loss": 0.8345, "step": 12607 }, { "epoch": 0.24, "learning_rate": 4.454565099273813e-06, "loss": 0.8785, "step": 12608 }, { "epoch": 0.24, "learning_rate": 4.454469846829589e-06, "loss": 1.0278, "step": 12609 }, { "epoch": 0.24, "learning_rate": 4.454374587087435e-06, "loss": 0.8112, "step": 12610 }, { "epoch": 0.24, "learning_rate": 4.454279320047706e-06, "loss": 0.8835, "step": 12611 }, { "epoch": 0.24, "learning_rate": 4.454184045710757e-06, "loss": 1.2227, "step": 12612 }, { "epoch": 0.24, "learning_rate": 4.454088764076946e-06, "loss": 0.9686, "step": 12613 }, { "epoch": 0.24, "learning_rate": 4.4539934751466275e-06, "loss": 0.9812, "step": 12614 }, { "epoch": 0.24, "learning_rate": 4.453898178920156e-06, "loss": 0.8412, "step": 12615 }, { "epoch": 0.24, "learning_rate": 4.45380287539789e-06, "loss": 0.9626, "step": 12616 }, { "epoch": 0.24, "learning_rate": 4.453707564580183e-06, "loss": 0.9584, "step": 12617 }, { "epoch": 0.24, "learning_rate": 4.4536122464673925e-06, "loss": 1.1169, "step": 12618 }, { "epoch": 0.24, "learning_rate": 4.453516921059873e-06, "loss": 1.1172, "step": 12619 }, { "epoch": 0.24, "learning_rate": 4.453421588357982e-06, "loss": 0.7516, "step": 12620 }, { "epoch": 0.24, "learning_rate": 4.453326248362074e-06, "loss": 0.9483, "step": 12621 }, { "epoch": 0.24, "learning_rate": 4.453230901072507e-06, "loss": 0.9653, "step": 12622 }, { "epoch": 0.24, "learning_rate": 4.453135546489634e-06, "loss": 0.8181, "step": 12623 }, { "epoch": 0.24, "learning_rate": 4.453040184613814e-06, "loss": 0.9312, "step": 12624 }, { "epoch": 0.24, "learning_rate": 4.452944815445401e-06, "loss": 1.0849, "step": 12625 }, { "epoch": 0.24, "learning_rate": 4.452849438984752e-06, "loss": 0.9941, "step": 12626 }, { "epoch": 0.24, "learning_rate": 4.452754055232223e-06, "loss": 0.9263, "step": 12627 }, { "epoch": 0.24, "learning_rate": 4.4526586641881715e-06, "loss": 0.9228, "step": 12628 }, { "epoch": 0.24, "learning_rate": 4.452563265852952e-06, "loss": 0.838, "step": 12629 }, { "epoch": 0.24, "learning_rate": 4.45246786022692e-06, "loss": 1.0536, "step": 12630 }, { "epoch": 0.24, "learning_rate": 4.452372447310434e-06, "loss": 0.8204, "step": 12631 }, { "epoch": 0.24, "learning_rate": 4.452277027103848e-06, "loss": 0.9998, "step": 12632 }, { "epoch": 0.24, "learning_rate": 4.45218159960752e-06, "loss": 0.9477, "step": 12633 }, { "epoch": 0.24, "learning_rate": 4.452086164821806e-06, "loss": 0.9362, "step": 12634 }, { "epoch": 0.24, "learning_rate": 4.451990722747062e-06, "loss": 0.9439, "step": 12635 }, { "epoch": 0.24, "learning_rate": 4.451895273383644e-06, "loss": 0.8545, "step": 12636 }, { "epoch": 0.24, "learning_rate": 4.45179981673191e-06, "loss": 1.0952, "step": 12637 }, { "epoch": 0.24, "learning_rate": 4.4517043527922144e-06, "loss": 0.7878, "step": 12638 }, { "epoch": 0.24, "learning_rate": 4.451608881564915e-06, "loss": 0.9744, "step": 12639 }, { "epoch": 0.24, "learning_rate": 4.451513403050367e-06, "loss": 0.9131, "step": 12640 }, { "epoch": 0.24, "learning_rate": 4.451417917248929e-06, "loss": 0.8382, "step": 12641 }, { "epoch": 0.24, "learning_rate": 4.451322424160956e-06, "loss": 1.0508, "step": 12642 }, { "epoch": 0.24, "learning_rate": 4.451226923786804e-06, "loss": 1.0408, "step": 12643 }, { "epoch": 0.24, "learning_rate": 4.451131416126831e-06, "loss": 1.0231, "step": 12644 }, { "epoch": 0.24, "learning_rate": 4.4510359011813946e-06, "loss": 0.8371, "step": 12645 }, { "epoch": 0.24, "learning_rate": 4.4509403789508484e-06, "loss": 0.8304, "step": 12646 }, { "epoch": 0.24, "learning_rate": 4.4508448494355505e-06, "loss": 0.8701, "step": 12647 }, { "epoch": 0.24, "learning_rate": 4.450749312635858e-06, "loss": 1.0718, "step": 12648 }, { "epoch": 0.24, "learning_rate": 4.450653768552128e-06, "loss": 1.0917, "step": 12649 }, { "epoch": 0.24, "learning_rate": 4.4505582171847164e-06, "loss": 1.157, "step": 12650 }, { "epoch": 0.24, "learning_rate": 4.45046265853398e-06, "loss": 1.0059, "step": 12651 }, { "epoch": 0.24, "learning_rate": 4.450367092600276e-06, "loss": 0.9103, "step": 12652 }, { "epoch": 0.24, "learning_rate": 4.450271519383961e-06, "loss": 0.9689, "step": 12653 }, { "epoch": 0.24, "learning_rate": 4.450175938885392e-06, "loss": 0.8389, "step": 12654 }, { "epoch": 0.24, "learning_rate": 4.450080351104925e-06, "loss": 1.2037, "step": 12655 }, { "epoch": 0.24, "learning_rate": 4.449984756042919e-06, "loss": 1.094, "step": 12656 }, { "epoch": 0.24, "learning_rate": 4.449889153699729e-06, "loss": 0.9131, "step": 12657 }, { "epoch": 0.24, "learning_rate": 4.4497935440757125e-06, "loss": 0.8341, "step": 12658 }, { "epoch": 0.24, "learning_rate": 4.4496979271712274e-06, "loss": 0.957, "step": 12659 }, { "epoch": 0.24, "learning_rate": 4.44960230298663e-06, "loss": 1.1054, "step": 12660 }, { "epoch": 0.24, "learning_rate": 4.449506671522277e-06, "loss": 1.0051, "step": 12661 }, { "epoch": 0.24, "learning_rate": 4.449411032778525e-06, "loss": 1.1106, "step": 12662 }, { "epoch": 0.24, "learning_rate": 4.449315386755733e-06, "loss": 1.1165, "step": 12663 }, { "epoch": 0.24, "learning_rate": 4.449219733454258e-06, "loss": 0.9308, "step": 12664 }, { "epoch": 0.24, "learning_rate": 4.449124072874455e-06, "loss": 0.97, "step": 12665 }, { "epoch": 0.24, "learning_rate": 4.449028405016683e-06, "loss": 0.8637, "step": 12666 }, { "epoch": 0.24, "learning_rate": 4.448932729881298e-06, "loss": 0.8425, "step": 12667 }, { "epoch": 0.24, "learning_rate": 4.448837047468659e-06, "loss": 1.2994, "step": 12668 }, { "epoch": 0.24, "learning_rate": 4.4487413577791215e-06, "loss": 0.9609, "step": 12669 }, { "epoch": 0.24, "learning_rate": 4.448645660813043e-06, "loss": 0.8292, "step": 12670 }, { "epoch": 0.24, "learning_rate": 4.448549956570783e-06, "loss": 0.7999, "step": 12671 }, { "epoch": 0.24, "learning_rate": 4.448454245052695e-06, "loss": 0.9099, "step": 12672 }, { "epoch": 0.24, "learning_rate": 4.4483585262591406e-06, "loss": 0.9155, "step": 12673 }, { "epoch": 0.24, "learning_rate": 4.448262800190474e-06, "loss": 1.132, "step": 12674 }, { "epoch": 0.24, "learning_rate": 4.448167066847055e-06, "loss": 0.9827, "step": 12675 }, { "epoch": 0.24, "learning_rate": 4.448071326229239e-06, "loss": 0.8301, "step": 12676 }, { "epoch": 0.24, "learning_rate": 4.447975578337385e-06, "loss": 0.9971, "step": 12677 }, { "epoch": 0.24, "learning_rate": 4.447879823171849e-06, "loss": 0.9422, "step": 12678 }, { "epoch": 0.24, "learning_rate": 4.4477840607329895e-06, "loss": 0.8305, "step": 12679 }, { "epoch": 0.24, "learning_rate": 4.447688291021165e-06, "loss": 0.9443, "step": 12680 }, { "epoch": 0.24, "learning_rate": 4.447592514036732e-06, "loss": 1.1672, "step": 12681 }, { "epoch": 0.24, "learning_rate": 4.447496729780047e-06, "loss": 1.0952, "step": 12682 }, { "epoch": 0.24, "learning_rate": 4.4474009382514695e-06, "loss": 0.8641, "step": 12683 }, { "epoch": 0.24, "learning_rate": 4.4473051394513575e-06, "loss": 0.9811, "step": 12684 }, { "epoch": 0.24, "learning_rate": 4.447209333380067e-06, "loss": 0.8215, "step": 12685 }, { "epoch": 0.24, "learning_rate": 4.4471135200379565e-06, "loss": 0.9172, "step": 12686 }, { "epoch": 0.24, "learning_rate": 4.447017699425384e-06, "loss": 1.0314, "step": 12687 }, { "epoch": 0.24, "learning_rate": 4.4469218715427075e-06, "loss": 1.1564, "step": 12688 }, { "epoch": 0.24, "learning_rate": 4.4468260363902835e-06, "loss": 0.9547, "step": 12689 }, { "epoch": 0.24, "learning_rate": 4.446730193968471e-06, "loss": 0.8815, "step": 12690 }, { "epoch": 0.24, "learning_rate": 4.446634344277629e-06, "loss": 0.968, "step": 12691 }, { "epoch": 0.24, "learning_rate": 4.446538487318113e-06, "loss": 0.8542, "step": 12692 }, { "epoch": 0.24, "learning_rate": 4.4464426230902815e-06, "loss": 0.8752, "step": 12693 }, { "epoch": 0.24, "learning_rate": 4.4463467515944934e-06, "loss": 1.0702, "step": 12694 }, { "epoch": 0.24, "learning_rate": 4.446250872831107e-06, "loss": 0.9078, "step": 12695 }, { "epoch": 0.24, "learning_rate": 4.446154986800478e-06, "loss": 1.0544, "step": 12696 }, { "epoch": 0.24, "learning_rate": 4.446059093502967e-06, "loss": 1.0035, "step": 12697 }, { "epoch": 0.24, "learning_rate": 4.4459631929389315e-06, "loss": 0.8549, "step": 12698 }, { "epoch": 0.24, "learning_rate": 4.445867285108728e-06, "loss": 1.126, "step": 12699 }, { "epoch": 0.24, "learning_rate": 4.445771370012716e-06, "loss": 1.0372, "step": 12700 }, { "epoch": 0.24, "learning_rate": 4.445675447651253e-06, "loss": 0.9163, "step": 12701 }, { "epoch": 0.24, "learning_rate": 4.4455795180246985e-06, "loss": 0.9429, "step": 12702 }, { "epoch": 0.24, "learning_rate": 4.445483581133408e-06, "loss": 1.0345, "step": 12703 }, { "epoch": 0.24, "learning_rate": 4.445387636977744e-06, "loss": 0.8944, "step": 12704 }, { "epoch": 0.24, "learning_rate": 4.445291685558061e-06, "loss": 0.825, "step": 12705 }, { "epoch": 0.24, "learning_rate": 4.445195726874718e-06, "loss": 0.9482, "step": 12706 }, { "epoch": 0.24, "learning_rate": 4.445099760928074e-06, "loss": 0.9149, "step": 12707 }, { "epoch": 0.24, "learning_rate": 4.445003787718487e-06, "loss": 0.8759, "step": 12708 }, { "epoch": 0.24, "learning_rate": 4.444907807246316e-06, "loss": 0.9008, "step": 12709 }, { "epoch": 0.24, "learning_rate": 4.444811819511918e-06, "loss": 1.0461, "step": 12710 }, { "epoch": 0.24, "learning_rate": 4.444715824515653e-06, "loss": 0.9869, "step": 12711 }, { "epoch": 0.24, "learning_rate": 4.444619822257879e-06, "loss": 0.9639, "step": 12712 }, { "epoch": 0.24, "learning_rate": 4.444523812738955e-06, "loss": 0.9536, "step": 12713 }, { "epoch": 0.24, "learning_rate": 4.444427795959236e-06, "loss": 0.8722, "step": 12714 }, { "epoch": 0.24, "learning_rate": 4.444331771919085e-06, "loss": 1.0563, "step": 12715 }, { "epoch": 0.24, "learning_rate": 4.444235740618859e-06, "loss": 1.1091, "step": 12716 }, { "epoch": 0.24, "learning_rate": 4.444139702058916e-06, "loss": 1.0176, "step": 12717 }, { "epoch": 0.24, "learning_rate": 4.444043656239615e-06, "loss": 1.2102, "step": 12718 }, { "epoch": 0.24, "learning_rate": 4.443947603161314e-06, "loss": 0.945, "step": 12719 }, { "epoch": 0.24, "learning_rate": 4.443851542824374e-06, "loss": 0.8447, "step": 12720 }, { "epoch": 0.24, "learning_rate": 4.4437554752291504e-06, "loss": 0.9464, "step": 12721 }, { "epoch": 0.24, "learning_rate": 4.4436594003760034e-06, "loss": 0.9949, "step": 12722 }, { "epoch": 0.24, "learning_rate": 4.443563318265292e-06, "loss": 0.8909, "step": 12723 }, { "epoch": 0.24, "learning_rate": 4.443467228897375e-06, "loss": 1.088, "step": 12724 }, { "epoch": 0.24, "learning_rate": 4.44337113227261e-06, "loss": 0.8788, "step": 12725 }, { "epoch": 0.24, "learning_rate": 4.443275028391359e-06, "loss": 1.0345, "step": 12726 }, { "epoch": 0.24, "learning_rate": 4.443178917253977e-06, "loss": 0.8629, "step": 12727 }, { "epoch": 0.24, "learning_rate": 4.443082798860825e-06, "loss": 0.9547, "step": 12728 }, { "epoch": 0.24, "learning_rate": 4.4429866732122604e-06, "loss": 0.9501, "step": 12729 }, { "epoch": 0.24, "learning_rate": 4.442890540308644e-06, "loss": 1.1937, "step": 12730 }, { "epoch": 0.24, "learning_rate": 4.442794400150334e-06, "loss": 1.0279, "step": 12731 }, { "epoch": 0.24, "learning_rate": 4.4426982527376885e-06, "loss": 1.1086, "step": 12732 }, { "epoch": 0.24, "learning_rate": 4.442602098071068e-06, "loss": 0.8995, "step": 12733 }, { "epoch": 0.24, "learning_rate": 4.442505936150831e-06, "loss": 0.9351, "step": 12734 }, { "epoch": 0.24, "learning_rate": 4.4424097669773355e-06, "loss": 0.982, "step": 12735 }, { "epoch": 0.24, "learning_rate": 4.442313590550943e-06, "loss": 0.6997, "step": 12736 }, { "epoch": 0.24, "learning_rate": 4.44221740687201e-06, "loss": 1.0052, "step": 12737 }, { "epoch": 0.24, "learning_rate": 4.442121215940897e-06, "loss": 0.9609, "step": 12738 }, { "epoch": 0.24, "learning_rate": 4.442025017757963e-06, "loss": 1.1359, "step": 12739 }, { "epoch": 0.24, "learning_rate": 4.441928812323566e-06, "loss": 1.136, "step": 12740 }, { "epoch": 0.24, "learning_rate": 4.441832599638067e-06, "loss": 0.9688, "step": 12741 }, { "epoch": 0.24, "learning_rate": 4.441736379701825e-06, "loss": 0.9623, "step": 12742 }, { "epoch": 0.24, "learning_rate": 4.4416401525152e-06, "loss": 1.2876, "step": 12743 }, { "epoch": 0.24, "learning_rate": 4.441543918078549e-06, "loss": 0.7691, "step": 12744 }, { "epoch": 0.24, "learning_rate": 4.441447676392232e-06, "loss": 0.9637, "step": 12745 }, { "epoch": 0.24, "learning_rate": 4.44135142745661e-06, "loss": 0.9384, "step": 12746 }, { "epoch": 0.24, "learning_rate": 4.441255171272041e-06, "loss": 0.9225, "step": 12747 }, { "epoch": 0.24, "learning_rate": 4.441158907838884e-06, "loss": 0.8506, "step": 12748 }, { "epoch": 0.24, "learning_rate": 4.4410626371574994e-06, "loss": 0.9481, "step": 12749 }, { "epoch": 0.24, "learning_rate": 4.440966359228247e-06, "loss": 1.1589, "step": 12750 }, { "epoch": 0.24, "learning_rate": 4.440870074051486e-06, "loss": 0.968, "step": 12751 }, { "epoch": 0.24, "learning_rate": 4.440773781627574e-06, "loss": 0.7489, "step": 12752 }, { "epoch": 0.24, "learning_rate": 4.440677481956873e-06, "loss": 0.9749, "step": 12753 }, { "epoch": 0.24, "learning_rate": 4.440581175039742e-06, "loss": 0.9961, "step": 12754 }, { "epoch": 0.24, "learning_rate": 4.440484860876541e-06, "loss": 0.9337, "step": 12755 }, { "epoch": 0.24, "learning_rate": 4.440388539467628e-06, "loss": 1.001, "step": 12756 }, { "epoch": 0.24, "learning_rate": 4.440292210813365e-06, "loss": 0.9594, "step": 12757 }, { "epoch": 0.24, "learning_rate": 4.44019587491411e-06, "loss": 0.9102, "step": 12758 }, { "epoch": 0.24, "learning_rate": 4.440099531770222e-06, "loss": 0.9265, "step": 12759 }, { "epoch": 0.24, "learning_rate": 4.440003181382062e-06, "loss": 0.9147, "step": 12760 }, { "epoch": 0.24, "learning_rate": 4.4399068237499896e-06, "loss": 1.0175, "step": 12761 }, { "epoch": 0.24, "learning_rate": 4.439810458874365e-06, "loss": 0.9735, "step": 12762 }, { "epoch": 0.24, "learning_rate": 4.439714086755548e-06, "loss": 1.0928, "step": 12763 }, { "epoch": 0.24, "learning_rate": 4.439617707393898e-06, "loss": 0.9091, "step": 12764 }, { "epoch": 0.24, "learning_rate": 4.439521320789775e-06, "loss": 0.9645, "step": 12765 }, { "epoch": 0.24, "learning_rate": 4.439424926943538e-06, "loss": 0.8288, "step": 12766 }, { "epoch": 0.24, "learning_rate": 4.439328525855548e-06, "loss": 0.9238, "step": 12767 }, { "epoch": 0.24, "learning_rate": 4.439232117526165e-06, "loss": 1.3696, "step": 12768 }, { "epoch": 0.24, "learning_rate": 4.439135701955749e-06, "loss": 1.0583, "step": 12769 }, { "epoch": 0.24, "learning_rate": 4.43903927914466e-06, "loss": 0.7943, "step": 12770 }, { "epoch": 0.24, "learning_rate": 4.438942849093257e-06, "loss": 0.6528, "step": 12771 }, { "epoch": 0.24, "learning_rate": 4.438846411801902e-06, "loss": 1.0519, "step": 12772 }, { "epoch": 0.24, "learning_rate": 4.438749967270952e-06, "loss": 0.7938, "step": 12773 }, { "epoch": 0.24, "learning_rate": 4.4386535155007705e-06, "loss": 1.1207, "step": 12774 }, { "epoch": 0.24, "learning_rate": 4.438557056491716e-06, "loss": 0.9832, "step": 12775 }, { "epoch": 0.24, "learning_rate": 4.438460590244149e-06, "loss": 0.9061, "step": 12776 }, { "epoch": 0.24, "learning_rate": 4.438364116758429e-06, "loss": 0.8408, "step": 12777 }, { "epoch": 0.24, "learning_rate": 4.4382676360349175e-06, "loss": 0.6863, "step": 12778 }, { "epoch": 0.24, "learning_rate": 4.438171148073974e-06, "loss": 0.7382, "step": 12779 }, { "epoch": 0.24, "learning_rate": 4.438074652875959e-06, "loss": 0.8508, "step": 12780 }, { "epoch": 0.24, "learning_rate": 4.4379781504412324e-06, "loss": 1.0897, "step": 12781 }, { "epoch": 0.24, "learning_rate": 4.437881640770154e-06, "loss": 1.0049, "step": 12782 }, { "epoch": 0.24, "learning_rate": 4.4377851238630855e-06, "loss": 0.8897, "step": 12783 }, { "epoch": 0.24, "learning_rate": 4.437688599720387e-06, "loss": 0.9194, "step": 12784 }, { "epoch": 0.24, "learning_rate": 4.437592068342419e-06, "loss": 0.8891, "step": 12785 }, { "epoch": 0.24, "learning_rate": 4.4374955297295415e-06, "loss": 0.946, "step": 12786 }, { "epoch": 0.24, "learning_rate": 4.437398983882115e-06, "loss": 1.3045, "step": 12787 }, { "epoch": 0.24, "learning_rate": 4.4373024308005e-06, "loss": 1.0177, "step": 12788 }, { "epoch": 0.24, "learning_rate": 4.437205870485056e-06, "loss": 0.7587, "step": 12789 }, { "epoch": 0.24, "learning_rate": 4.437109302936146e-06, "loss": 0.8701, "step": 12790 }, { "epoch": 0.24, "learning_rate": 4.43701272815413e-06, "loss": 0.8842, "step": 12791 }, { "epoch": 0.24, "learning_rate": 4.436916146139366e-06, "loss": 0.7505, "step": 12792 }, { "epoch": 0.24, "learning_rate": 4.436819556892218e-06, "loss": 0.9365, "step": 12793 }, { "epoch": 0.24, "learning_rate": 4.436722960413044e-06, "loss": 1.1244, "step": 12794 }, { "epoch": 0.24, "learning_rate": 4.436626356702206e-06, "loss": 0.9297, "step": 12795 }, { "epoch": 0.24, "learning_rate": 4.436529745760065e-06, "loss": 0.8643, "step": 12796 }, { "epoch": 0.24, "learning_rate": 4.436433127586981e-06, "loss": 0.8214, "step": 12797 }, { "epoch": 0.24, "learning_rate": 4.436336502183316e-06, "loss": 0.9219, "step": 12798 }, { "epoch": 0.24, "learning_rate": 4.436239869549429e-06, "loss": 1.2022, "step": 12799 }, { "epoch": 0.24, "learning_rate": 4.436143229685682e-06, "loss": 0.981, "step": 12800 }, { "epoch": 0.24, "learning_rate": 4.4360465825924345e-06, "loss": 0.8727, "step": 12801 }, { "epoch": 0.24, "learning_rate": 4.43594992827005e-06, "loss": 0.9882, "step": 12802 }, { "epoch": 0.24, "learning_rate": 4.435853266718888e-06, "loss": 0.902, "step": 12803 }, { "epoch": 0.24, "learning_rate": 4.435756597939308e-06, "loss": 0.8525, "step": 12804 }, { "epoch": 0.24, "learning_rate": 4.435659921931672e-06, "loss": 0.9583, "step": 12805 }, { "epoch": 0.24, "learning_rate": 4.435563238696342e-06, "loss": 1.2483, "step": 12806 }, { "epoch": 0.24, "learning_rate": 4.435466548233678e-06, "loss": 0.8343, "step": 12807 }, { "epoch": 0.24, "learning_rate": 4.435369850544041e-06, "loss": 0.7796, "step": 12808 }, { "epoch": 0.24, "learning_rate": 4.435273145627793e-06, "loss": 0.8602, "step": 12809 }, { "epoch": 0.24, "learning_rate": 4.435176433485294e-06, "loss": 0.7914, "step": 12810 }, { "epoch": 0.24, "learning_rate": 4.435079714116906e-06, "loss": 0.9529, "step": 12811 }, { "epoch": 0.24, "learning_rate": 4.434982987522989e-06, "loss": 0.8038, "step": 12812 }, { "epoch": 0.24, "learning_rate": 4.434886253703905e-06, "loss": 0.9321, "step": 12813 }, { "epoch": 0.24, "learning_rate": 4.434789512660015e-06, "loss": 0.8931, "step": 12814 }, { "epoch": 0.24, "learning_rate": 4.43469276439168e-06, "loss": 0.9847, "step": 12815 }, { "epoch": 0.24, "learning_rate": 4.4345960088992625e-06, "loss": 0.849, "step": 12816 }, { "epoch": 0.24, "learning_rate": 4.434499246183122e-06, "loss": 1.0519, "step": 12817 }, { "epoch": 0.24, "learning_rate": 4.4344024762436214e-06, "loss": 0.8176, "step": 12818 }, { "epoch": 0.24, "learning_rate": 4.434305699081121e-06, "loss": 1.056, "step": 12819 }, { "epoch": 0.24, "learning_rate": 4.434208914695982e-06, "loss": 1.0289, "step": 12820 }, { "epoch": 0.24, "learning_rate": 4.434112123088566e-06, "loss": 0.8155, "step": 12821 }, { "epoch": 0.24, "learning_rate": 4.434015324259236e-06, "loss": 1.0876, "step": 12822 }, { "epoch": 0.24, "learning_rate": 4.43391851820835e-06, "loss": 0.913, "step": 12823 }, { "epoch": 0.24, "learning_rate": 4.433821704936273e-06, "loss": 1.1602, "step": 12824 }, { "epoch": 0.24, "learning_rate": 4.433724884443365e-06, "loss": 0.9673, "step": 12825 }, { "epoch": 0.24, "learning_rate": 4.433628056729987e-06, "loss": 0.9223, "step": 12826 }, { "epoch": 0.24, "learning_rate": 4.433531221796501e-06, "loss": 0.8575, "step": 12827 }, { "epoch": 0.24, "learning_rate": 4.43343437964327e-06, "loss": 0.9138, "step": 12828 }, { "epoch": 0.24, "learning_rate": 4.433337530270652e-06, "loss": 0.9931, "step": 12829 }, { "epoch": 0.24, "learning_rate": 4.433240673679014e-06, "loss": 1.231, "step": 12830 }, { "epoch": 0.24, "learning_rate": 4.433143809868713e-06, "loss": 0.9948, "step": 12831 }, { "epoch": 0.24, "learning_rate": 4.433046938840111e-06, "loss": 0.9838, "step": 12832 }, { "epoch": 0.24, "learning_rate": 4.432950060593573e-06, "loss": 0.9685, "step": 12833 }, { "epoch": 0.24, "learning_rate": 4.4328531751294576e-06, "loss": 0.896, "step": 12834 }, { "epoch": 0.24, "learning_rate": 4.4327562824481285e-06, "loss": 0.8487, "step": 12835 }, { "epoch": 0.24, "learning_rate": 4.432659382549946e-06, "loss": 0.9007, "step": 12836 }, { "epoch": 0.24, "learning_rate": 4.4325624754352725e-06, "loss": 1.3157, "step": 12837 }, { "epoch": 0.24, "learning_rate": 4.432465561104471e-06, "loss": 0.7755, "step": 12838 }, { "epoch": 0.24, "learning_rate": 4.432368639557901e-06, "loss": 0.8148, "step": 12839 }, { "epoch": 0.24, "learning_rate": 4.432271710795927e-06, "loss": 0.9489, "step": 12840 }, { "epoch": 0.24, "learning_rate": 4.43217477481891e-06, "loss": 0.795, "step": 12841 }, { "epoch": 0.24, "learning_rate": 4.432077831627209e-06, "loss": 0.906, "step": 12842 }, { "epoch": 0.24, "learning_rate": 4.431980881221192e-06, "loss": 0.8342, "step": 12843 }, { "epoch": 0.24, "learning_rate": 4.431883923601216e-06, "loss": 1.2791, "step": 12844 }, { "epoch": 0.24, "learning_rate": 4.431786958767644e-06, "loss": 0.9211, "step": 12845 }, { "epoch": 0.24, "learning_rate": 4.43168998672084e-06, "loss": 0.7196, "step": 12846 }, { "epoch": 0.24, "learning_rate": 4.4315930074611635e-06, "loss": 0.6775, "step": 12847 }, { "epoch": 0.24, "learning_rate": 4.431496020988979e-06, "loss": 1.03, "step": 12848 }, { "epoch": 0.24, "learning_rate": 4.431399027304647e-06, "loss": 1.1946, "step": 12849 }, { "epoch": 0.24, "learning_rate": 4.4313020264085305e-06, "loss": 1.074, "step": 12850 }, { "epoch": 0.24, "learning_rate": 4.431205018300992e-06, "loss": 1.0889, "step": 12851 }, { "epoch": 0.24, "learning_rate": 4.431108002982392e-06, "loss": 0.9217, "step": 12852 }, { "epoch": 0.24, "learning_rate": 4.431010980453094e-06, "loss": 1.0031, "step": 12853 }, { "epoch": 0.24, "learning_rate": 4.430913950713461e-06, "loss": 0.9063, "step": 12854 }, { "epoch": 0.24, "learning_rate": 4.430816913763855e-06, "loss": 1.1575, "step": 12855 }, { "epoch": 0.24, "learning_rate": 4.4307198696046364e-06, "loss": 1.1064, "step": 12856 }, { "epoch": 0.24, "learning_rate": 4.43062281823617e-06, "loss": 1.0846, "step": 12857 }, { "epoch": 0.24, "learning_rate": 4.430525759658817e-06, "loss": 0.8343, "step": 12858 }, { "epoch": 0.24, "learning_rate": 4.43042869387294e-06, "loss": 1.0164, "step": 12859 }, { "epoch": 0.24, "learning_rate": 4.430331620878901e-06, "loss": 0.7443, "step": 12860 }, { "epoch": 0.24, "learning_rate": 4.430234540677064e-06, "loss": 1.0483, "step": 12861 }, { "epoch": 0.24, "learning_rate": 4.430137453267789e-06, "loss": 1.018, "step": 12862 }, { "epoch": 0.24, "learning_rate": 4.43004035865144e-06, "loss": 0.9445, "step": 12863 }, { "epoch": 0.24, "learning_rate": 4.42994325682838e-06, "loss": 0.966, "step": 12864 }, { "epoch": 0.24, "learning_rate": 4.429846147798972e-06, "loss": 1.0922, "step": 12865 }, { "epoch": 0.24, "learning_rate": 4.4297490315635766e-06, "loss": 1.0402, "step": 12866 }, { "epoch": 0.24, "learning_rate": 4.429651908122558e-06, "loss": 0.8368, "step": 12867 }, { "epoch": 0.24, "learning_rate": 4.429554777476278e-06, "loss": 1.0985, "step": 12868 }, { "epoch": 0.24, "learning_rate": 4.429457639625099e-06, "loss": 0.9311, "step": 12869 }, { "epoch": 0.24, "learning_rate": 4.429360494569385e-06, "loss": 1.0135, "step": 12870 }, { "epoch": 0.24, "learning_rate": 4.4292633423094985e-06, "loss": 0.8302, "step": 12871 }, { "epoch": 0.24, "learning_rate": 4.429166182845801e-06, "loss": 1.0213, "step": 12872 }, { "epoch": 0.24, "learning_rate": 4.429069016178656e-06, "loss": 0.8809, "step": 12873 }, { "epoch": 0.24, "learning_rate": 4.428971842308427e-06, "loss": 0.9068, "step": 12874 }, { "epoch": 0.24, "learning_rate": 4.428874661235477e-06, "loss": 1.3248, "step": 12875 }, { "epoch": 0.24, "learning_rate": 4.428777472960167e-06, "loss": 0.7805, "step": 12876 }, { "epoch": 0.24, "learning_rate": 4.428680277482861e-06, "loss": 1.0204, "step": 12877 }, { "epoch": 0.24, "learning_rate": 4.428583074803923e-06, "loss": 1.0471, "step": 12878 }, { "epoch": 0.24, "learning_rate": 4.4284858649237136e-06, "loss": 0.8517, "step": 12879 }, { "epoch": 0.24, "learning_rate": 4.4283886478425986e-06, "loss": 1.0482, "step": 12880 }, { "epoch": 0.24, "learning_rate": 4.428291423560939e-06, "loss": 0.9649, "step": 12881 }, { "epoch": 0.24, "learning_rate": 4.428194192079098e-06, "loss": 1.0337, "step": 12882 }, { "epoch": 0.24, "learning_rate": 4.428096953397439e-06, "loss": 0.8622, "step": 12883 }, { "epoch": 0.24, "learning_rate": 4.427999707516325e-06, "loss": 0.8356, "step": 12884 }, { "epoch": 0.24, "learning_rate": 4.42790245443612e-06, "loss": 0.9745, "step": 12885 }, { "epoch": 0.24, "learning_rate": 4.427805194157185e-06, "loss": 0.8611, "step": 12886 }, { "epoch": 0.24, "learning_rate": 4.427707926679885e-06, "loss": 0.9008, "step": 12887 }, { "epoch": 0.24, "learning_rate": 4.427610652004584e-06, "loss": 1.0677, "step": 12888 }, { "epoch": 0.24, "learning_rate": 4.427513370131642e-06, "loss": 0.8824, "step": 12889 }, { "epoch": 0.24, "learning_rate": 4.4274160810614255e-06, "loss": 1.0099, "step": 12890 }, { "epoch": 0.24, "learning_rate": 4.427318784794295e-06, "loss": 0.8551, "step": 12891 }, { "epoch": 0.24, "learning_rate": 4.427221481330617e-06, "loss": 0.9623, "step": 12892 }, { "epoch": 0.24, "learning_rate": 4.427124170670752e-06, "loss": 1.1782, "step": 12893 }, { "epoch": 0.24, "learning_rate": 4.427026852815065e-06, "loss": 1.1448, "step": 12894 }, { "epoch": 0.24, "learning_rate": 4.426929527763919e-06, "loss": 0.7607, "step": 12895 }, { "epoch": 0.24, "learning_rate": 4.426832195517677e-06, "loss": 0.9434, "step": 12896 }, { "epoch": 0.24, "learning_rate": 4.426734856076702e-06, "loss": 0.8201, "step": 12897 }, { "epoch": 0.24, "learning_rate": 4.426637509441358e-06, "loss": 0.891, "step": 12898 }, { "epoch": 0.24, "learning_rate": 4.42654015561201e-06, "loss": 1.0043, "step": 12899 }, { "epoch": 0.24, "learning_rate": 4.42644279458902e-06, "loss": 1.0601, "step": 12900 }, { "epoch": 0.24, "learning_rate": 4.42634542637275e-06, "loss": 0.7498, "step": 12901 }, { "epoch": 0.24, "learning_rate": 4.4262480509635666e-06, "loss": 1.0098, "step": 12902 }, { "epoch": 0.24, "learning_rate": 4.4261506683618316e-06, "loss": 0.9983, "step": 12903 }, { "epoch": 0.24, "learning_rate": 4.4260532785679085e-06, "loss": 0.8596, "step": 12904 }, { "epoch": 0.24, "learning_rate": 4.425955881582162e-06, "loss": 0.9526, "step": 12905 }, { "epoch": 0.24, "learning_rate": 4.425858477404957e-06, "loss": 1.1453, "step": 12906 }, { "epoch": 0.24, "learning_rate": 4.425761066036654e-06, "loss": 0.8611, "step": 12907 }, { "epoch": 0.24, "learning_rate": 4.425663647477617e-06, "loss": 0.7775, "step": 12908 }, { "epoch": 0.24, "learning_rate": 4.425566221728213e-06, "loss": 1.0219, "step": 12909 }, { "epoch": 0.24, "learning_rate": 4.425468788788803e-06, "loss": 0.8959, "step": 12910 }, { "epoch": 0.24, "learning_rate": 4.42537134865975e-06, "loss": 0.8001, "step": 12911 }, { "epoch": 0.24, "learning_rate": 4.425273901341421e-06, "loss": 1.0647, "step": 12912 }, { "epoch": 0.24, "learning_rate": 4.425176446834179e-06, "loss": 0.9811, "step": 12913 }, { "epoch": 0.24, "learning_rate": 4.425078985138386e-06, "loss": 0.9346, "step": 12914 }, { "epoch": 0.24, "learning_rate": 4.4249815162544075e-06, "loss": 0.8678, "step": 12915 }, { "epoch": 0.24, "learning_rate": 4.424884040182608e-06, "loss": 0.9795, "step": 12916 }, { "epoch": 0.24, "learning_rate": 4.424786556923349e-06, "loss": 0.8161, "step": 12917 }, { "epoch": 0.24, "learning_rate": 4.4246890664769965e-06, "loss": 0.9885, "step": 12918 }, { "epoch": 0.24, "learning_rate": 4.424591568843914e-06, "loss": 0.8386, "step": 12919 }, { "epoch": 0.24, "learning_rate": 4.424494064024465e-06, "loss": 0.9866, "step": 12920 }, { "epoch": 0.24, "learning_rate": 4.424396552019016e-06, "loss": 0.8882, "step": 12921 }, { "epoch": 0.24, "learning_rate": 4.424299032827928e-06, "loss": 0.8581, "step": 12922 }, { "epoch": 0.24, "learning_rate": 4.424201506451566e-06, "loss": 0.9999, "step": 12923 }, { "epoch": 0.24, "learning_rate": 4.424103972890295e-06, "loss": 1.0482, "step": 12924 }, { "epoch": 0.24, "learning_rate": 4.424006432144478e-06, "loss": 0.9909, "step": 12925 }, { "epoch": 0.24, "learning_rate": 4.423908884214482e-06, "loss": 0.7685, "step": 12926 }, { "epoch": 0.24, "learning_rate": 4.423811329100668e-06, "loss": 0.8193, "step": 12927 }, { "epoch": 0.24, "learning_rate": 4.423713766803401e-06, "loss": 0.9706, "step": 12928 }, { "epoch": 0.24, "learning_rate": 4.423616197323046e-06, "loss": 0.9157, "step": 12929 }, { "epoch": 0.24, "learning_rate": 4.423518620659968e-06, "loss": 1.0177, "step": 12930 }, { "epoch": 0.24, "learning_rate": 4.42342103681453e-06, "loss": 1.1722, "step": 12931 }, { "epoch": 0.24, "learning_rate": 4.423323445787097e-06, "loss": 1.1445, "step": 12932 }, { "epoch": 0.24, "learning_rate": 4.423225847578032e-06, "loss": 0.7659, "step": 12933 }, { "epoch": 0.24, "learning_rate": 4.423128242187702e-06, "loss": 1.037, "step": 12934 }, { "epoch": 0.24, "learning_rate": 4.42303062961647e-06, "loss": 0.881, "step": 12935 }, { "epoch": 0.24, "learning_rate": 4.4229330098647e-06, "loss": 1.0655, "step": 12936 }, { "epoch": 0.24, "learning_rate": 4.422835382932758e-06, "loss": 0.9102, "step": 12937 }, { "epoch": 0.24, "learning_rate": 4.422737748821006e-06, "loss": 0.9844, "step": 12938 }, { "epoch": 0.24, "learning_rate": 4.422640107529811e-06, "loss": 0.7503, "step": 12939 }, { "epoch": 0.24, "learning_rate": 4.4225424590595375e-06, "loss": 0.9661, "step": 12940 }, { "epoch": 0.24, "learning_rate": 4.422444803410549e-06, "loss": 0.9426, "step": 12941 }, { "epoch": 0.24, "learning_rate": 4.4223471405832105e-06, "loss": 1.0522, "step": 12942 }, { "epoch": 0.24, "learning_rate": 4.422249470577886e-06, "loss": 0.9153, "step": 12943 }, { "epoch": 0.24, "learning_rate": 4.422151793394942e-06, "loss": 1.0456, "step": 12944 }, { "epoch": 0.24, "learning_rate": 4.422054109034741e-06, "loss": 1.0422, "step": 12945 }, { "epoch": 0.24, "learning_rate": 4.42195641749765e-06, "loss": 0.9271, "step": 12946 }, { "epoch": 0.24, "learning_rate": 4.421858718784033e-06, "loss": 0.9736, "step": 12947 }, { "epoch": 0.24, "learning_rate": 4.421761012894253e-06, "loss": 0.7717, "step": 12948 }, { "epoch": 0.24, "learning_rate": 4.421663299828677e-06, "loss": 1.0726, "step": 12949 }, { "epoch": 0.24, "learning_rate": 4.421565579587669e-06, "loss": 1.1823, "step": 12950 }, { "epoch": 0.24, "learning_rate": 4.421467852171594e-06, "loss": 0.8534, "step": 12951 }, { "epoch": 0.24, "learning_rate": 4.421370117580818e-06, "loss": 0.7413, "step": 12952 }, { "epoch": 0.24, "learning_rate": 4.4212723758157035e-06, "loss": 0.7895, "step": 12953 }, { "epoch": 0.24, "learning_rate": 4.4211746268766175e-06, "loss": 0.7694, "step": 12954 }, { "epoch": 0.24, "learning_rate": 4.421076870763924e-06, "loss": 1.0332, "step": 12955 }, { "epoch": 0.24, "learning_rate": 4.420979107477989e-06, "loss": 1.1041, "step": 12956 }, { "epoch": 0.24, "learning_rate": 4.420881337019176e-06, "loss": 1.035, "step": 12957 }, { "epoch": 0.24, "learning_rate": 4.420783559387852e-06, "loss": 0.7477, "step": 12958 }, { "epoch": 0.24, "learning_rate": 4.420685774584381e-06, "loss": 0.8851, "step": 12959 }, { "epoch": 0.24, "learning_rate": 4.420587982609127e-06, "loss": 0.8184, "step": 12960 }, { "epoch": 0.24, "learning_rate": 4.420490183462458e-06, "loss": 0.772, "step": 12961 }, { "epoch": 0.24, "learning_rate": 4.420392377144737e-06, "loss": 1.2176, "step": 12962 }, { "epoch": 0.24, "learning_rate": 4.420294563656329e-06, "loss": 0.982, "step": 12963 }, { "epoch": 0.24, "learning_rate": 4.4201967429976e-06, "loss": 0.9376, "step": 12964 }, { "epoch": 0.24, "learning_rate": 4.420098915168915e-06, "loss": 1.1158, "step": 12965 }, { "epoch": 0.24, "learning_rate": 4.4200010801706404e-06, "loss": 0.9417, "step": 12966 }, { "epoch": 0.24, "learning_rate": 4.419903238003141e-06, "loss": 0.9675, "step": 12967 }, { "epoch": 0.24, "learning_rate": 4.419805388666781e-06, "loss": 1.0295, "step": 12968 }, { "epoch": 0.24, "learning_rate": 4.4197075321619265e-06, "loss": 1.234, "step": 12969 }, { "epoch": 0.24, "learning_rate": 4.419609668488944e-06, "loss": 0.9233, "step": 12970 }, { "epoch": 0.24, "learning_rate": 4.419511797648196e-06, "loss": 0.9241, "step": 12971 }, { "epoch": 0.24, "learning_rate": 4.419413919640051e-06, "loss": 0.8805, "step": 12972 }, { "epoch": 0.24, "learning_rate": 4.419316034464873e-06, "loss": 0.8773, "step": 12973 }, { "epoch": 0.24, "learning_rate": 4.419218142123028e-06, "loss": 1.0834, "step": 12974 }, { "epoch": 0.24, "learning_rate": 4.419120242614882e-06, "loss": 1.1169, "step": 12975 }, { "epoch": 0.24, "learning_rate": 4.419022335940798e-06, "loss": 0.982, "step": 12976 }, { "epoch": 0.24, "learning_rate": 4.418924422101145e-06, "loss": 0.8285, "step": 12977 }, { "epoch": 0.24, "learning_rate": 4.418826501096286e-06, "loss": 0.9247, "step": 12978 }, { "epoch": 0.24, "learning_rate": 4.4187285729265884e-06, "loss": 0.8424, "step": 12979 }, { "epoch": 0.24, "learning_rate": 4.418630637592417e-06, "loss": 1.0203, "step": 12980 }, { "epoch": 0.24, "learning_rate": 4.418532695094137e-06, "loss": 1.0469, "step": 12981 }, { "epoch": 0.24, "learning_rate": 4.418434745432116e-06, "loss": 1.1478, "step": 12982 }, { "epoch": 0.24, "learning_rate": 4.4183367886067176e-06, "loss": 0.8442, "step": 12983 }, { "epoch": 0.24, "learning_rate": 4.418238824618309e-06, "loss": 1.0438, "step": 12984 }, { "epoch": 0.24, "learning_rate": 4.418140853467255e-06, "loss": 0.7484, "step": 12985 }, { "epoch": 0.25, "learning_rate": 4.418042875153922e-06, "loss": 0.949, "step": 12986 }, { "epoch": 0.25, "learning_rate": 4.417944889678675e-06, "loss": 1.2595, "step": 12987 }, { "epoch": 0.25, "learning_rate": 4.417846897041881e-06, "loss": 0.842, "step": 12988 }, { "epoch": 0.25, "learning_rate": 4.417748897243906e-06, "loss": 0.9236, "step": 12989 }, { "epoch": 0.25, "learning_rate": 4.417650890285116e-06, "loss": 0.7504, "step": 12990 }, { "epoch": 0.25, "learning_rate": 4.417552876165875e-06, "loss": 0.8712, "step": 12991 }, { "epoch": 0.25, "learning_rate": 4.417454854886551e-06, "loss": 0.7993, "step": 12992 }, { "epoch": 0.25, "learning_rate": 4.417356826447509e-06, "loss": 1.0764, "step": 12993 }, { "epoch": 0.25, "learning_rate": 4.417258790849116e-06, "loss": 0.9805, "step": 12994 }, { "epoch": 0.25, "learning_rate": 4.417160748091736e-06, "loss": 0.8418, "step": 12995 }, { "epoch": 0.25, "learning_rate": 4.417062698175738e-06, "loss": 0.7886, "step": 12996 }, { "epoch": 0.25, "learning_rate": 4.416964641101487e-06, "loss": 0.9854, "step": 12997 }, { "epoch": 0.25, "learning_rate": 4.416866576869348e-06, "loss": 0.7365, "step": 12998 }, { "epoch": 0.25, "learning_rate": 4.416768505479688e-06, "loss": 1.0707, "step": 12999 }, { "epoch": 0.25, "learning_rate": 4.4166704269328735e-06, "loss": 1.0607, "step": 13000 }, { "epoch": 0.25, "learning_rate": 4.4165723412292695e-06, "loss": 1.2159, "step": 13001 }, { "epoch": 0.25, "learning_rate": 4.416474248369244e-06, "loss": 0.8916, "step": 13002 }, { "epoch": 0.25, "learning_rate": 4.416376148353162e-06, "loss": 0.8528, "step": 13003 }, { "epoch": 0.25, "learning_rate": 4.416278041181391e-06, "loss": 0.9449, "step": 13004 }, { "epoch": 0.25, "learning_rate": 4.416179926854296e-06, "loss": 0.9293, "step": 13005 }, { "epoch": 0.25, "learning_rate": 4.416081805372243e-06, "loss": 1.1522, "step": 13006 }, { "epoch": 0.25, "learning_rate": 4.415983676735601e-06, "loss": 1.1212, "step": 13007 }, { "epoch": 0.25, "learning_rate": 4.415885540944733e-06, "loss": 0.9141, "step": 13008 }, { "epoch": 0.25, "learning_rate": 4.415787398000008e-06, "loss": 0.8819, "step": 13009 }, { "epoch": 0.25, "learning_rate": 4.415689247901792e-06, "loss": 0.9307, "step": 13010 }, { "epoch": 0.25, "learning_rate": 4.41559109065045e-06, "loss": 0.9164, "step": 13011 }, { "epoch": 0.25, "learning_rate": 4.4154929262463505e-06, "loss": 1.0427, "step": 13012 }, { "epoch": 0.25, "learning_rate": 4.415394754689859e-06, "loss": 0.9369, "step": 13013 }, { "epoch": 0.25, "learning_rate": 4.415296575981343e-06, "loss": 0.9231, "step": 13014 }, { "epoch": 0.25, "learning_rate": 4.415198390121167e-06, "loss": 0.8076, "step": 13015 }, { "epoch": 0.25, "learning_rate": 4.415100197109699e-06, "loss": 0.8442, "step": 13016 }, { "epoch": 0.25, "learning_rate": 4.4150019969473065e-06, "loss": 0.959, "step": 13017 }, { "epoch": 0.25, "learning_rate": 4.414903789634355e-06, "loss": 0.977, "step": 13018 }, { "epoch": 0.25, "learning_rate": 4.414805575171211e-06, "loss": 0.9861, "step": 13019 }, { "epoch": 0.25, "learning_rate": 4.4147073535582415e-06, "loss": 0.8072, "step": 13020 }, { "epoch": 0.25, "learning_rate": 4.414609124795813e-06, "loss": 0.7446, "step": 13021 }, { "epoch": 0.25, "learning_rate": 4.414510888884294e-06, "loss": 1.0936, "step": 13022 }, { "epoch": 0.25, "learning_rate": 4.41441264582405e-06, "loss": 0.869, "step": 13023 }, { "epoch": 0.25, "learning_rate": 4.414314395615447e-06, "loss": 1.1665, "step": 13024 }, { "epoch": 0.25, "learning_rate": 4.414216138258853e-06, "loss": 1.0955, "step": 13025 }, { "epoch": 0.25, "learning_rate": 4.414117873754635e-06, "loss": 0.8942, "step": 13026 }, { "epoch": 0.25, "learning_rate": 4.4140196021031595e-06, "loss": 0.9442, "step": 13027 }, { "epoch": 0.25, "learning_rate": 4.4139213233047935e-06, "loss": 1.0964, "step": 13028 }, { "epoch": 0.25, "learning_rate": 4.413823037359904e-06, "loss": 0.8784, "step": 13029 }, { "epoch": 0.25, "learning_rate": 4.413724744268857e-06, "loss": 0.8244, "step": 13030 }, { "epoch": 0.25, "learning_rate": 4.413626444032022e-06, "loss": 1.062, "step": 13031 }, { "epoch": 0.25, "learning_rate": 4.413528136649764e-06, "loss": 0.9515, "step": 13032 }, { "epoch": 0.25, "learning_rate": 4.41342982212245e-06, "loss": 0.8013, "step": 13033 }, { "epoch": 0.25, "learning_rate": 4.413331500450449e-06, "loss": 1.0355, "step": 13034 }, { "epoch": 0.25, "learning_rate": 4.413233171634125e-06, "loss": 0.8363, "step": 13035 }, { "epoch": 0.25, "learning_rate": 4.413134835673848e-06, "loss": 0.9504, "step": 13036 }, { "epoch": 0.25, "learning_rate": 4.413036492569984e-06, "loss": 1.1118, "step": 13037 }, { "epoch": 0.25, "learning_rate": 4.412938142322901e-06, "loss": 0.8965, "step": 13038 }, { "epoch": 0.25, "learning_rate": 4.412839784932965e-06, "loss": 0.9735, "step": 13039 }, { "epoch": 0.25, "learning_rate": 4.412741420400543e-06, "loss": 0.9442, "step": 13040 }, { "epoch": 0.25, "learning_rate": 4.412643048726005e-06, "loss": 0.9535, "step": 13041 }, { "epoch": 0.25, "learning_rate": 4.412544669909716e-06, "loss": 1.0082, "step": 13042 }, { "epoch": 0.25, "learning_rate": 4.412446283952044e-06, "loss": 1.0336, "step": 13043 }, { "epoch": 0.25, "learning_rate": 4.412347890853355e-06, "loss": 0.9593, "step": 13044 }, { "epoch": 0.25, "learning_rate": 4.412249490614018e-06, "loss": 0.841, "step": 13045 }, { "epoch": 0.25, "learning_rate": 4.412151083234401e-06, "loss": 0.8622, "step": 13046 }, { "epoch": 0.25, "learning_rate": 4.41205266871487e-06, "loss": 0.9004, "step": 13047 }, { "epoch": 0.25, "learning_rate": 4.411954247055793e-06, "loss": 0.9032, "step": 13048 }, { "epoch": 0.25, "learning_rate": 4.411855818257537e-06, "loss": 1.0672, "step": 13049 }, { "epoch": 0.25, "learning_rate": 4.41175738232047e-06, "loss": 1.103, "step": 13050 }, { "epoch": 0.25, "learning_rate": 4.41165893924496e-06, "loss": 0.9504, "step": 13051 }, { "epoch": 0.25, "learning_rate": 4.4115604890313745e-06, "loss": 1.0255, "step": 13052 }, { "epoch": 0.25, "learning_rate": 4.41146203168008e-06, "loss": 0.9955, "step": 13053 }, { "epoch": 0.25, "learning_rate": 4.411363567191445e-06, "loss": 0.8628, "step": 13054 }, { "epoch": 0.25, "learning_rate": 4.411265095565837e-06, "loss": 0.8992, "step": 13055 }, { "epoch": 0.25, "learning_rate": 4.4111666168036244e-06, "loss": 1.0754, "step": 13056 }, { "epoch": 0.25, "learning_rate": 4.411068130905174e-06, "loss": 0.9512, "step": 13057 }, { "epoch": 0.25, "learning_rate": 4.410969637870854e-06, "loss": 1.0721, "step": 13058 }, { "epoch": 0.25, "learning_rate": 4.41087113770103e-06, "loss": 0.8434, "step": 13059 }, { "epoch": 0.25, "learning_rate": 4.410772630396074e-06, "loss": 0.9258, "step": 13060 }, { "epoch": 0.25, "learning_rate": 4.41067411595635e-06, "loss": 0.842, "step": 13061 }, { "epoch": 0.25, "learning_rate": 4.4105755943822295e-06, "loss": 1.2136, "step": 13062 }, { "epoch": 0.25, "learning_rate": 4.410477065674077e-06, "loss": 0.8988, "step": 13063 }, { "epoch": 0.25, "learning_rate": 4.410378529832261e-06, "loss": 0.9265, "step": 13064 }, { "epoch": 0.25, "learning_rate": 4.410279986857151e-06, "loss": 0.9439, "step": 13065 }, { "epoch": 0.25, "learning_rate": 4.410181436749115e-06, "loss": 0.968, "step": 13066 }, { "epoch": 0.25, "learning_rate": 4.4100828795085185e-06, "loss": 1.0228, "step": 13067 }, { "epoch": 0.25, "learning_rate": 4.409984315135732e-06, "loss": 1.1523, "step": 13068 }, { "epoch": 0.25, "learning_rate": 4.409885743631122e-06, "loss": 0.9865, "step": 13069 }, { "epoch": 0.25, "learning_rate": 4.409787164995057e-06, "loss": 0.684, "step": 13070 }, { "epoch": 0.25, "learning_rate": 4.4096885792279066e-06, "loss": 0.9446, "step": 13071 }, { "epoch": 0.25, "learning_rate": 4.409589986330037e-06, "loss": 0.8088, "step": 13072 }, { "epoch": 0.25, "learning_rate": 4.409491386301816e-06, "loss": 0.7845, "step": 13073 }, { "epoch": 0.25, "learning_rate": 4.409392779143614e-06, "loss": 0.9304, "step": 13074 }, { "epoch": 0.25, "learning_rate": 4.409294164855797e-06, "loss": 1.1826, "step": 13075 }, { "epoch": 0.25, "learning_rate": 4.409195543438735e-06, "loss": 0.8774, "step": 13076 }, { "epoch": 0.25, "learning_rate": 4.409096914892795e-06, "loss": 0.9337, "step": 13077 }, { "epoch": 0.25, "learning_rate": 4.408998279218345e-06, "loss": 0.9823, "step": 13078 }, { "epoch": 0.25, "learning_rate": 4.408899636415755e-06, "loss": 0.8538, "step": 13079 }, { "epoch": 0.25, "learning_rate": 4.408800986485392e-06, "loss": 1.1265, "step": 13080 }, { "epoch": 0.25, "learning_rate": 4.408702329427625e-06, "loss": 1.0281, "step": 13081 }, { "epoch": 0.25, "learning_rate": 4.40860366524282e-06, "loss": 1.003, "step": 13082 }, { "epoch": 0.25, "learning_rate": 4.408504993931349e-06, "loss": 0.8363, "step": 13083 }, { "epoch": 0.25, "learning_rate": 4.40840631549358e-06, "loss": 0.7631, "step": 13084 }, { "epoch": 0.25, "learning_rate": 4.408307629929878e-06, "loss": 0.9511, "step": 13085 }, { "epoch": 0.25, "learning_rate": 4.408208937240616e-06, "loss": 1.1776, "step": 13086 }, { "epoch": 0.25, "learning_rate": 4.408110237426158e-06, "loss": 1.1384, "step": 13087 }, { "epoch": 0.25, "learning_rate": 4.408011530486876e-06, "loss": 1.0859, "step": 13088 }, { "epoch": 0.25, "learning_rate": 4.4079128164231375e-06, "loss": 0.8802, "step": 13089 }, { "epoch": 0.25, "learning_rate": 4.407814095235312e-06, "loss": 0.9359, "step": 13090 }, { "epoch": 0.25, "learning_rate": 4.407715366923766e-06, "loss": 0.9516, "step": 13091 }, { "epoch": 0.25, "learning_rate": 4.40761663148887e-06, "loss": 0.9, "step": 13092 }, { "epoch": 0.25, "learning_rate": 4.407517888930991e-06, "loss": 1.2676, "step": 13093 }, { "epoch": 0.25, "learning_rate": 4.407419139250499e-06, "loss": 0.8759, "step": 13094 }, { "epoch": 0.25, "learning_rate": 4.4073203824477625e-06, "loss": 1.0294, "step": 13095 }, { "epoch": 0.25, "learning_rate": 4.407221618523151e-06, "loss": 0.9417, "step": 13096 }, { "epoch": 0.25, "learning_rate": 4.407122847477031e-06, "loss": 0.915, "step": 13097 }, { "epoch": 0.25, "learning_rate": 4.407024069309775e-06, "loss": 0.9, "step": 13098 }, { "epoch": 0.25, "learning_rate": 4.4069252840217475e-06, "loss": 1.0076, "step": 13099 }, { "epoch": 0.25, "learning_rate": 4.40682649161332e-06, "loss": 1.1075, "step": 13100 }, { "epoch": 0.25, "learning_rate": 4.4067276920848614e-06, "loss": 0.8323, "step": 13101 }, { "epoch": 0.25, "learning_rate": 4.4066288854367394e-06, "loss": 1.038, "step": 13102 }, { "epoch": 0.25, "learning_rate": 4.406530071669324e-06, "loss": 1.0884, "step": 13103 }, { "epoch": 0.25, "learning_rate": 4.406431250782983e-06, "loss": 0.943, "step": 13104 }, { "epoch": 0.25, "learning_rate": 4.406332422778087e-06, "loss": 1.0775, "step": 13105 }, { "epoch": 0.25, "learning_rate": 4.406233587655004e-06, "loss": 1.0001, "step": 13106 }, { "epoch": 0.25, "learning_rate": 4.406134745414104e-06, "loss": 0.7849, "step": 13107 }, { "epoch": 0.25, "learning_rate": 4.406035896055754e-06, "loss": 0.9022, "step": 13108 }, { "epoch": 0.25, "learning_rate": 4.405937039580325e-06, "loss": 0.9081, "step": 13109 }, { "epoch": 0.25, "learning_rate": 4.405838175988185e-06, "loss": 0.9684, "step": 13110 }, { "epoch": 0.25, "learning_rate": 4.405739305279704e-06, "loss": 0.8931, "step": 13111 }, { "epoch": 0.25, "learning_rate": 4.4056404274552514e-06, "loss": 0.9959, "step": 13112 }, { "epoch": 0.25, "learning_rate": 4.405541542515195e-06, "loss": 1.0927, "step": 13113 }, { "epoch": 0.25, "learning_rate": 4.4054426504599056e-06, "loss": 0.8813, "step": 13114 }, { "epoch": 0.25, "learning_rate": 4.405343751289751e-06, "loss": 1.0454, "step": 13115 }, { "epoch": 0.25, "learning_rate": 4.405244845005102e-06, "loss": 0.8987, "step": 13116 }, { "epoch": 0.25, "learning_rate": 4.405145931606328e-06, "loss": 0.8093, "step": 13117 }, { "epoch": 0.25, "learning_rate": 4.405047011093795e-06, "loss": 0.7545, "step": 13118 }, { "epoch": 0.25, "learning_rate": 4.4049480834678764e-06, "loss": 0.8662, "step": 13119 }, { "epoch": 0.25, "learning_rate": 4.40484914872894e-06, "loss": 0.9451, "step": 13120 }, { "epoch": 0.25, "learning_rate": 4.404750206877355e-06, "loss": 0.9649, "step": 13121 }, { "epoch": 0.25, "learning_rate": 4.404651257913491e-06, "loss": 0.9973, "step": 13122 }, { "epoch": 0.25, "learning_rate": 4.404552301837719e-06, "loss": 0.9975, "step": 13123 }, { "epoch": 0.25, "learning_rate": 4.404453338650406e-06, "loss": 0.9256, "step": 13124 }, { "epoch": 0.25, "learning_rate": 4.404354368351922e-06, "loss": 0.9601, "step": 13125 }, { "epoch": 0.25, "learning_rate": 4.404255390942638e-06, "loss": 0.9764, "step": 13126 }, { "epoch": 0.25, "learning_rate": 4.404156406422923e-06, "loss": 0.6864, "step": 13127 }, { "epoch": 0.25, "learning_rate": 4.404057414793146e-06, "loss": 0.8193, "step": 13128 }, { "epoch": 0.25, "learning_rate": 4.403958416053677e-06, "loss": 0.7624, "step": 13129 }, { "epoch": 0.25, "learning_rate": 4.403859410204886e-06, "loss": 1.1183, "step": 13130 }, { "epoch": 0.25, "learning_rate": 4.403760397247141e-06, "loss": 1.1442, "step": 13131 }, { "epoch": 0.25, "learning_rate": 4.403661377180814e-06, "loss": 0.9778, "step": 13132 }, { "epoch": 0.25, "learning_rate": 4.4035623500062745e-06, "loss": 1.0007, "step": 13133 }, { "epoch": 0.25, "learning_rate": 4.403463315723891e-06, "loss": 1.0168, "step": 13134 }, { "epoch": 0.25, "learning_rate": 4.403364274334033e-06, "loss": 0.8909, "step": 13135 }, { "epoch": 0.25, "learning_rate": 4.403265225837072e-06, "loss": 0.9664, "step": 13136 }, { "epoch": 0.25, "learning_rate": 4.403166170233377e-06, "loss": 1.1144, "step": 13137 }, { "epoch": 0.25, "learning_rate": 4.403067107523318e-06, "loss": 1.0107, "step": 13138 }, { "epoch": 0.25, "learning_rate": 4.402968037707264e-06, "loss": 0.8737, "step": 13139 }, { "epoch": 0.25, "learning_rate": 4.4028689607855865e-06, "loss": 0.7913, "step": 13140 }, { "epoch": 0.25, "learning_rate": 4.402769876758654e-06, "loss": 0.9966, "step": 13141 }, { "epoch": 0.25, "learning_rate": 4.402670785626838e-06, "loss": 0.707, "step": 13142 }, { "epoch": 0.25, "learning_rate": 4.402571687390507e-06, "loss": 1.0035, "step": 13143 }, { "epoch": 0.25, "learning_rate": 4.402472582050031e-06, "loss": 1.2803, "step": 13144 }, { "epoch": 0.25, "learning_rate": 4.402373469605782e-06, "loss": 0.8965, "step": 13145 }, { "epoch": 0.25, "learning_rate": 4.402274350058128e-06, "loss": 0.917, "step": 13146 }, { "epoch": 0.25, "learning_rate": 4.40217522340744e-06, "loss": 0.8482, "step": 13147 }, { "epoch": 0.25, "learning_rate": 4.402076089654088e-06, "loss": 0.7571, "step": 13148 }, { "epoch": 0.25, "learning_rate": 4.401976948798442e-06, "loss": 1.162, "step": 13149 }, { "epoch": 0.25, "learning_rate": 4.401877800840873e-06, "loss": 1.0237, "step": 13150 }, { "epoch": 0.25, "learning_rate": 4.4017786457817516e-06, "loss": 0.9004, "step": 13151 }, { "epoch": 0.25, "learning_rate": 4.401679483621445e-06, "loss": 0.9618, "step": 13152 }, { "epoch": 0.25, "learning_rate": 4.401580314360326e-06, "loss": 0.7392, "step": 13153 }, { "epoch": 0.25, "learning_rate": 4.401481137998765e-06, "loss": 0.852, "step": 13154 }, { "epoch": 0.25, "learning_rate": 4.401381954537132e-06, "loss": 0.8623, "step": 13155 }, { "epoch": 0.25, "learning_rate": 4.401282763975796e-06, "loss": 0.9271, "step": 13156 }, { "epoch": 0.25, "learning_rate": 4.4011835663151295e-06, "loss": 1.0564, "step": 13157 }, { "epoch": 0.25, "learning_rate": 4.401084361555501e-06, "loss": 0.7731, "step": 13158 }, { "epoch": 0.25, "learning_rate": 4.400985149697282e-06, "loss": 1.0154, "step": 13159 }, { "epoch": 0.25, "learning_rate": 4.400885930740843e-06, "loss": 0.8113, "step": 13160 }, { "epoch": 0.25, "learning_rate": 4.4007867046865536e-06, "loss": 0.7009, "step": 13161 }, { "epoch": 0.25, "learning_rate": 4.400687471534786e-06, "loss": 1.0158, "step": 13162 }, { "epoch": 0.25, "learning_rate": 4.400588231285909e-06, "loss": 1.0547, "step": 13163 }, { "epoch": 0.25, "learning_rate": 4.400488983940294e-06, "loss": 0.8632, "step": 13164 }, { "epoch": 0.25, "learning_rate": 4.400389729498311e-06, "loss": 0.9259, "step": 13165 }, { "epoch": 0.25, "learning_rate": 4.4002904679603315e-06, "loss": 0.9949, "step": 13166 }, { "epoch": 0.25, "learning_rate": 4.400191199326726e-06, "loss": 0.9239, "step": 13167 }, { "epoch": 0.25, "learning_rate": 4.400091923597863e-06, "loss": 0.8693, "step": 13168 }, { "epoch": 0.25, "learning_rate": 4.399992640774117e-06, "loss": 1.2078, "step": 13169 }, { "epoch": 0.25, "learning_rate": 4.399893350855856e-06, "loss": 1.0904, "step": 13170 }, { "epoch": 0.25, "learning_rate": 4.399794053843451e-06, "loss": 0.9248, "step": 13171 }, { "epoch": 0.25, "learning_rate": 4.399694749737274e-06, "loss": 0.9233, "step": 13172 }, { "epoch": 0.25, "learning_rate": 4.399595438537695e-06, "loss": 1.0031, "step": 13173 }, { "epoch": 0.25, "learning_rate": 4.399496120245085e-06, "loss": 0.9764, "step": 13174 }, { "epoch": 0.25, "learning_rate": 4.3993967948598144e-06, "loss": 1.024, "step": 13175 }, { "epoch": 0.25, "learning_rate": 4.399297462382254e-06, "loss": 0.8939, "step": 13176 }, { "epoch": 0.25, "learning_rate": 4.3991981228127755e-06, "loss": 0.9697, "step": 13177 }, { "epoch": 0.25, "learning_rate": 4.39909877615175e-06, "loss": 0.8006, "step": 13178 }, { "epoch": 0.25, "learning_rate": 4.398999422399547e-06, "loss": 0.8748, "step": 13179 }, { "epoch": 0.25, "learning_rate": 4.398900061556539e-06, "loss": 0.9792, "step": 13180 }, { "epoch": 0.25, "learning_rate": 4.398800693623096e-06, "loss": 1.1987, "step": 13181 }, { "epoch": 0.25, "learning_rate": 4.39870131859959e-06, "loss": 0.9667, "step": 13182 }, { "epoch": 0.25, "learning_rate": 4.398601936486391e-06, "loss": 1.0033, "step": 13183 }, { "epoch": 0.25, "learning_rate": 4.398502547283871e-06, "loss": 1.1215, "step": 13184 }, { "epoch": 0.25, "learning_rate": 4.3984031509924e-06, "loss": 0.7683, "step": 13185 }, { "epoch": 0.25, "learning_rate": 4.398303747612351e-06, "loss": 0.9803, "step": 13186 }, { "epoch": 0.25, "learning_rate": 4.398204337144092e-06, "loss": 0.9715, "step": 13187 }, { "epoch": 0.25, "learning_rate": 4.398104919587998e-06, "loss": 0.7698, "step": 13188 }, { "epoch": 0.25, "learning_rate": 4.398005494944437e-06, "loss": 0.9115, "step": 13189 }, { "epoch": 0.25, "learning_rate": 4.397906063213783e-06, "loss": 0.861, "step": 13190 }, { "epoch": 0.25, "learning_rate": 4.3978066243964054e-06, "loss": 0.9249, "step": 13191 }, { "epoch": 0.25, "learning_rate": 4.3977071784926765e-06, "loss": 1.0164, "step": 13192 }, { "epoch": 0.25, "learning_rate": 4.397607725502966e-06, "loss": 1.1481, "step": 13193 }, { "epoch": 0.25, "learning_rate": 4.397508265427647e-06, "loss": 1.0198, "step": 13194 }, { "epoch": 0.25, "learning_rate": 4.397408798267091e-06, "loss": 0.9167, "step": 13195 }, { "epoch": 0.25, "learning_rate": 4.397309324021668e-06, "loss": 1.0494, "step": 13196 }, { "epoch": 0.25, "learning_rate": 4.3972098426917506e-06, "loss": 0.9223, "step": 13197 }, { "epoch": 0.25, "learning_rate": 4.39711035427771e-06, "loss": 0.868, "step": 13198 }, { "epoch": 0.25, "learning_rate": 4.397010858779916e-06, "loss": 1.0217, "step": 13199 }, { "epoch": 0.25, "learning_rate": 4.396911356198743e-06, "loss": 1.1621, "step": 13200 }, { "epoch": 0.25, "learning_rate": 4.396811846534561e-06, "loss": 1.1643, "step": 13201 }, { "epoch": 0.25, "learning_rate": 4.396712329787742e-06, "loss": 1.0067, "step": 13202 }, { "epoch": 0.25, "learning_rate": 4.396612805958657e-06, "loss": 0.79, "step": 13203 }, { "epoch": 0.25, "learning_rate": 4.396513275047678e-06, "loss": 0.824, "step": 13204 }, { "epoch": 0.25, "learning_rate": 4.396413737055176e-06, "loss": 0.8864, "step": 13205 }, { "epoch": 0.25, "learning_rate": 4.396314191981524e-06, "loss": 1.0128, "step": 13206 }, { "epoch": 0.25, "learning_rate": 4.396214639827093e-06, "loss": 0.7257, "step": 13207 }, { "epoch": 0.25, "learning_rate": 4.396115080592254e-06, "loss": 0.976, "step": 13208 }, { "epoch": 0.25, "learning_rate": 4.39601551427738e-06, "loss": 1.0889, "step": 13209 }, { "epoch": 0.25, "learning_rate": 4.395915940882842e-06, "loss": 0.9295, "step": 13210 }, { "epoch": 0.25, "learning_rate": 4.395816360409012e-06, "loss": 1.0695, "step": 13211 }, { "epoch": 0.25, "learning_rate": 4.395716772856262e-06, "loss": 0.9412, "step": 13212 }, { "epoch": 0.25, "learning_rate": 4.395617178224964e-06, "loss": 1.0545, "step": 13213 }, { "epoch": 0.25, "learning_rate": 4.395517576515488e-06, "loss": 0.9604, "step": 13214 }, { "epoch": 0.25, "learning_rate": 4.3954179677282086e-06, "loss": 1.0778, "step": 13215 }, { "epoch": 0.25, "learning_rate": 4.395318351863497e-06, "loss": 0.8616, "step": 13216 }, { "epoch": 0.25, "learning_rate": 4.395218728921724e-06, "loss": 0.7758, "step": 13217 }, { "epoch": 0.25, "learning_rate": 4.3951190989032625e-06, "loss": 1.0039, "step": 13218 }, { "epoch": 0.25, "learning_rate": 4.395019461808485e-06, "loss": 1.1008, "step": 13219 }, { "epoch": 0.25, "learning_rate": 4.394919817637763e-06, "loss": 0.9664, "step": 13220 }, { "epoch": 0.25, "learning_rate": 4.394820166391468e-06, "loss": 1.019, "step": 13221 }, { "epoch": 0.25, "learning_rate": 4.3947205080699724e-06, "loss": 0.8177, "step": 13222 }, { "epoch": 0.25, "learning_rate": 4.394620842673649e-06, "loss": 1.0078, "step": 13223 }, { "epoch": 0.25, "learning_rate": 4.394521170202869e-06, "loss": 0.9402, "step": 13224 }, { "epoch": 0.25, "learning_rate": 4.394421490658005e-06, "loss": 1.0461, "step": 13225 }, { "epoch": 0.25, "learning_rate": 4.39432180403943e-06, "loss": 0.8729, "step": 13226 }, { "epoch": 0.25, "learning_rate": 4.394222110347515e-06, "loss": 0.7079, "step": 13227 }, { "epoch": 0.25, "learning_rate": 4.394122409582633e-06, "loss": 0.8466, "step": 13228 }, { "epoch": 0.25, "learning_rate": 4.394022701745155e-06, "loss": 0.805, "step": 13229 }, { "epoch": 0.25, "learning_rate": 4.3939229868354546e-06, "loss": 0.9323, "step": 13230 }, { "epoch": 0.25, "learning_rate": 4.393823264853905e-06, "loss": 1.0673, "step": 13231 }, { "epoch": 0.25, "learning_rate": 4.393723535800877e-06, "loss": 1.0162, "step": 13232 }, { "epoch": 0.25, "learning_rate": 4.393623799676743e-06, "loss": 0.9489, "step": 13233 }, { "epoch": 0.25, "learning_rate": 4.393524056481875e-06, "loss": 1.004, "step": 13234 }, { "epoch": 0.25, "learning_rate": 4.393424306216647e-06, "loss": 0.9794, "step": 13235 }, { "epoch": 0.25, "learning_rate": 4.393324548881431e-06, "loss": 0.8007, "step": 13236 }, { "epoch": 0.25, "learning_rate": 4.393224784476599e-06, "loss": 1.0909, "step": 13237 }, { "epoch": 0.25, "learning_rate": 4.393125013002524e-06, "loss": 1.0767, "step": 13238 }, { "epoch": 0.25, "learning_rate": 4.393025234459577e-06, "loss": 0.8052, "step": 13239 }, { "epoch": 0.25, "learning_rate": 4.392925448848133e-06, "loss": 0.9921, "step": 13240 }, { "epoch": 0.25, "learning_rate": 4.392825656168563e-06, "loss": 0.7363, "step": 13241 }, { "epoch": 0.25, "learning_rate": 4.392725856421241e-06, "loss": 0.9429, "step": 13242 }, { "epoch": 0.25, "learning_rate": 4.3926260496065375e-06, "loss": 1.1069, "step": 13243 }, { "epoch": 0.25, "learning_rate": 4.392526235724827e-06, "loss": 1.0341, "step": 13244 }, { "epoch": 0.25, "learning_rate": 4.39242641477648e-06, "loss": 1.1028, "step": 13245 }, { "epoch": 0.25, "learning_rate": 4.392326586761872e-06, "loss": 0.739, "step": 13246 }, { "epoch": 0.25, "learning_rate": 4.3922267516813755e-06, "loss": 0.9805, "step": 13247 }, { "epoch": 0.25, "learning_rate": 4.392126909535361e-06, "loss": 0.7396, "step": 13248 }, { "epoch": 0.25, "learning_rate": 4.3920270603242035e-06, "loss": 1.2463, "step": 13249 }, { "epoch": 0.25, "learning_rate": 4.391927204048274e-06, "loss": 1.1628, "step": 13250 }, { "epoch": 0.25, "learning_rate": 4.391827340707947e-06, "loss": 0.8589, "step": 13251 }, { "epoch": 0.25, "learning_rate": 4.391727470303594e-06, "loss": 1.1477, "step": 13252 }, { "epoch": 0.25, "learning_rate": 4.39162759283559e-06, "loss": 1.187, "step": 13253 }, { "epoch": 0.25, "learning_rate": 4.391527708304305e-06, "loss": 0.8011, "step": 13254 }, { "epoch": 0.25, "learning_rate": 4.391427816710115e-06, "loss": 0.8423, "step": 13255 }, { "epoch": 0.25, "learning_rate": 4.391327918053391e-06, "loss": 1.1964, "step": 13256 }, { "epoch": 0.25, "learning_rate": 4.391228012334506e-06, "loss": 0.9045, "step": 13257 }, { "epoch": 0.25, "learning_rate": 4.391128099553834e-06, "loss": 1.1796, "step": 13258 }, { "epoch": 0.25, "learning_rate": 4.391028179711747e-06, "loss": 0.8549, "step": 13259 }, { "epoch": 0.25, "learning_rate": 4.390928252808619e-06, "loss": 0.8998, "step": 13260 }, { "epoch": 0.25, "learning_rate": 4.390828318844824e-06, "loss": 0.9647, "step": 13261 }, { "epoch": 0.25, "learning_rate": 4.3907283778207335e-06, "loss": 0.9536, "step": 13262 }, { "epoch": 0.25, "learning_rate": 4.390628429736721e-06, "loss": 1.0036, "step": 13263 }, { "epoch": 0.25, "learning_rate": 4.39052847459316e-06, "loss": 0.8909, "step": 13264 }, { "epoch": 0.25, "learning_rate": 4.390428512390423e-06, "loss": 1.0156, "step": 13265 }, { "epoch": 0.25, "learning_rate": 4.3903285431288845e-06, "loss": 0.9582, "step": 13266 }, { "epoch": 0.25, "learning_rate": 4.390228566808917e-06, "loss": 0.8588, "step": 13267 }, { "epoch": 0.25, "learning_rate": 4.390128583430894e-06, "loss": 0.9146, "step": 13268 }, { "epoch": 0.25, "learning_rate": 4.390028592995189e-06, "loss": 0.9747, "step": 13269 }, { "epoch": 0.25, "learning_rate": 4.389928595502175e-06, "loss": 0.9771, "step": 13270 }, { "epoch": 0.25, "learning_rate": 4.389828590952226e-06, "loss": 1.0271, "step": 13271 }, { "epoch": 0.25, "learning_rate": 4.389728579345715e-06, "loss": 0.9919, "step": 13272 }, { "epoch": 0.25, "learning_rate": 4.389628560683015e-06, "loss": 0.8427, "step": 13273 }, { "epoch": 0.25, "learning_rate": 4.389528534964499e-06, "loss": 1.0774, "step": 13274 }, { "epoch": 0.25, "learning_rate": 4.389428502190543e-06, "loss": 1.002, "step": 13275 }, { "epoch": 0.25, "learning_rate": 4.3893284623615185e-06, "loss": 1.0699, "step": 13276 }, { "epoch": 0.25, "learning_rate": 4.389228415477798e-06, "loss": 0.7403, "step": 13277 }, { "epoch": 0.25, "learning_rate": 4.389128361539758e-06, "loss": 0.9425, "step": 13278 }, { "epoch": 0.25, "learning_rate": 4.389028300547771e-06, "loss": 0.7719, "step": 13279 }, { "epoch": 0.25, "learning_rate": 4.38892823250221e-06, "loss": 0.9368, "step": 13280 }, { "epoch": 0.25, "learning_rate": 4.3888281574034475e-06, "loss": 1.0657, "step": 13281 }, { "epoch": 0.25, "learning_rate": 4.3887280752518605e-06, "loss": 1.1281, "step": 13282 }, { "epoch": 0.25, "learning_rate": 4.3886279860478195e-06, "loss": 0.9742, "step": 13283 }, { "epoch": 0.25, "learning_rate": 4.388527889791699e-06, "loss": 0.8681, "step": 13284 }, { "epoch": 0.25, "learning_rate": 4.388427786483875e-06, "loss": 0.8943, "step": 13285 }, { "epoch": 0.25, "learning_rate": 4.388327676124719e-06, "loss": 0.8102, "step": 13286 }, { "epoch": 0.25, "learning_rate": 4.388227558714604e-06, "loss": 1.2555, "step": 13287 }, { "epoch": 0.25, "learning_rate": 4.388127434253906e-06, "loss": 1.1219, "step": 13288 }, { "epoch": 0.25, "learning_rate": 4.388027302742999e-06, "loss": 0.8293, "step": 13289 }, { "epoch": 0.25, "learning_rate": 4.387927164182255e-06, "loss": 0.96, "step": 13290 }, { "epoch": 0.25, "learning_rate": 4.387827018572049e-06, "loss": 0.8662, "step": 13291 }, { "epoch": 0.25, "learning_rate": 4.387726865912755e-06, "loss": 0.8535, "step": 13292 }, { "epoch": 0.25, "learning_rate": 4.387626706204746e-06, "loss": 1.0072, "step": 13293 }, { "epoch": 0.25, "learning_rate": 4.387526539448398e-06, "loss": 1.0198, "step": 13294 }, { "epoch": 0.25, "learning_rate": 4.387426365644083e-06, "loss": 0.9312, "step": 13295 }, { "epoch": 0.25, "learning_rate": 4.387326184792175e-06, "loss": 0.9252, "step": 13296 }, { "epoch": 0.25, "learning_rate": 4.3872259968930505e-06, "loss": 1.0452, "step": 13297 }, { "epoch": 0.25, "learning_rate": 4.387125801947082e-06, "loss": 0.8224, "step": 13298 }, { "epoch": 0.25, "learning_rate": 4.3870255999546424e-06, "loss": 1.0845, "step": 13299 }, { "epoch": 0.25, "learning_rate": 4.386925390916108e-06, "loss": 1.1947, "step": 13300 }, { "epoch": 0.25, "learning_rate": 4.386825174831852e-06, "loss": 1.0589, "step": 13301 }, { "epoch": 0.25, "learning_rate": 4.386724951702247e-06, "loss": 1.0188, "step": 13302 }, { "epoch": 0.25, "learning_rate": 4.386624721527671e-06, "loss": 0.845, "step": 13303 }, { "epoch": 0.25, "learning_rate": 4.386524484308495e-06, "loss": 0.8857, "step": 13304 }, { "epoch": 0.25, "learning_rate": 4.386424240045094e-06, "loss": 1.0544, "step": 13305 }, { "epoch": 0.25, "learning_rate": 4.386323988737844e-06, "loss": 0.9668, "step": 13306 }, { "epoch": 0.25, "learning_rate": 4.386223730387118e-06, "loss": 0.958, "step": 13307 }, { "epoch": 0.25, "learning_rate": 4.386123464993289e-06, "loss": 0.875, "step": 13308 }, { "epoch": 0.25, "learning_rate": 4.386023192556734e-06, "loss": 1.1151, "step": 13309 }, { "epoch": 0.25, "learning_rate": 4.3859229130778265e-06, "loss": 0.8202, "step": 13310 }, { "epoch": 0.25, "learning_rate": 4.38582262655694e-06, "loss": 0.8204, "step": 13311 }, { "epoch": 0.25, "learning_rate": 4.38572233299445e-06, "loss": 1.1177, "step": 13312 }, { "epoch": 0.25, "learning_rate": 4.385622032390731e-06, "loss": 1.1166, "step": 13313 }, { "epoch": 0.25, "learning_rate": 4.385521724746156e-06, "loss": 0.9691, "step": 13314 }, { "epoch": 0.25, "learning_rate": 4.385421410061101e-06, "loss": 0.9857, "step": 13315 }, { "epoch": 0.25, "learning_rate": 4.385321088335941e-06, "loss": 0.9966, "step": 13316 }, { "epoch": 0.25, "learning_rate": 4.385220759571049e-06, "loss": 0.9297, "step": 13317 }, { "epoch": 0.25, "learning_rate": 4.385120423766801e-06, "loss": 1.1941, "step": 13318 }, { "epoch": 0.25, "learning_rate": 4.385020080923571e-06, "loss": 1.0504, "step": 13319 }, { "epoch": 0.25, "learning_rate": 4.384919731041733e-06, "loss": 0.9847, "step": 13320 }, { "epoch": 0.25, "learning_rate": 4.384819374121664e-06, "loss": 0.8526, "step": 13321 }, { "epoch": 0.25, "learning_rate": 4.384719010163736e-06, "loss": 0.9111, "step": 13322 }, { "epoch": 0.25, "learning_rate": 4.384618639168326e-06, "loss": 0.8096, "step": 13323 }, { "epoch": 0.25, "learning_rate": 4.3845182611358075e-06, "loss": 0.9886, "step": 13324 }, { "epoch": 0.25, "learning_rate": 4.3844178760665556e-06, "loss": 1.0965, "step": 13325 }, { "epoch": 0.25, "learning_rate": 4.384317483960945e-06, "loss": 0.829, "step": 13326 }, { "epoch": 0.25, "learning_rate": 4.38421708481935e-06, "loss": 0.973, "step": 13327 }, { "epoch": 0.25, "learning_rate": 4.384116678642147e-06, "loss": 1.0671, "step": 13328 }, { "epoch": 0.25, "learning_rate": 4.38401626542971e-06, "loss": 0.9239, "step": 13329 }, { "epoch": 0.25, "learning_rate": 4.383915845182414e-06, "loss": 0.8374, "step": 13330 }, { "epoch": 0.25, "learning_rate": 4.383815417900635e-06, "loss": 1.0779, "step": 13331 }, { "epoch": 0.25, "learning_rate": 4.383714983584745e-06, "loss": 0.9986, "step": 13332 }, { "epoch": 0.25, "learning_rate": 4.383614542235121e-06, "loss": 0.9388, "step": 13333 }, { "epoch": 0.25, "learning_rate": 4.38351409385214e-06, "loss": 0.8129, "step": 13334 }, { "epoch": 0.25, "learning_rate": 4.3834136384361745e-06, "loss": 0.9569, "step": 13335 }, { "epoch": 0.25, "learning_rate": 4.383313175987599e-06, "loss": 0.9232, "step": 13336 }, { "epoch": 0.25, "learning_rate": 4.383212706506791e-06, "loss": 1.0951, "step": 13337 }, { "epoch": 0.25, "learning_rate": 4.383112229994124e-06, "loss": 0.9687, "step": 13338 }, { "epoch": 0.25, "learning_rate": 4.383011746449975e-06, "loss": 1.0157, "step": 13339 }, { "epoch": 0.25, "learning_rate": 4.3829112558747155e-06, "loss": 0.9056, "step": 13340 }, { "epoch": 0.25, "learning_rate": 4.382810758268725e-06, "loss": 0.929, "step": 13341 }, { "epoch": 0.25, "learning_rate": 4.382710253632376e-06, "loss": 0.9768, "step": 13342 }, { "epoch": 0.25, "learning_rate": 4.382609741966044e-06, "loss": 0.9176, "step": 13343 }, { "epoch": 0.25, "learning_rate": 4.382509223270106e-06, "loss": 1.0607, "step": 13344 }, { "epoch": 0.25, "learning_rate": 4.382408697544936e-06, "loss": 0.9931, "step": 13345 }, { "epoch": 0.25, "learning_rate": 4.38230816479091e-06, "loss": 1.0405, "step": 13346 }, { "epoch": 0.25, "learning_rate": 4.382207625008403e-06, "loss": 0.9933, "step": 13347 }, { "epoch": 0.25, "learning_rate": 4.38210707819779e-06, "loss": 0.9891, "step": 13348 }, { "epoch": 0.25, "learning_rate": 4.382006524359447e-06, "loss": 1.066, "step": 13349 }, { "epoch": 0.25, "learning_rate": 4.38190596349375e-06, "loss": 1.1458, "step": 13350 }, { "epoch": 0.25, "learning_rate": 4.381805395601073e-06, "loss": 0.8331, "step": 13351 }, { "epoch": 0.25, "learning_rate": 4.381704820681792e-06, "loss": 0.9208, "step": 13352 }, { "epoch": 0.25, "learning_rate": 4.381604238736284e-06, "loss": 1.002, "step": 13353 }, { "epoch": 0.25, "learning_rate": 4.381503649764923e-06, "loss": 1.0743, "step": 13354 }, { "epoch": 0.25, "learning_rate": 4.3814030537680844e-06, "loss": 0.8951, "step": 13355 }, { "epoch": 0.25, "learning_rate": 4.3813024507461455e-06, "loss": 0.9911, "step": 13356 }, { "epoch": 0.25, "learning_rate": 4.38120184069948e-06, "loss": 0.9916, "step": 13357 }, { "epoch": 0.25, "learning_rate": 4.381101223628466e-06, "loss": 1.097, "step": 13358 }, { "epoch": 0.25, "learning_rate": 4.381000599533476e-06, "loss": 0.7565, "step": 13359 }, { "epoch": 0.25, "learning_rate": 4.3808999684148875e-06, "loss": 0.8489, "step": 13360 }, { "epoch": 0.25, "learning_rate": 4.380799330273078e-06, "loss": 0.7341, "step": 13361 }, { "epoch": 0.25, "learning_rate": 4.38069868510842e-06, "loss": 1.0488, "step": 13362 }, { "epoch": 0.25, "learning_rate": 4.38059803292129e-06, "loss": 0.9495, "step": 13363 }, { "epoch": 0.25, "learning_rate": 4.380497373712066e-06, "loss": 1.1187, "step": 13364 }, { "epoch": 0.25, "learning_rate": 4.380396707481123e-06, "loss": 0.9961, "step": 13365 }, { "epoch": 0.25, "learning_rate": 4.3802960342288344e-06, "loss": 0.8496, "step": 13366 }, { "epoch": 0.25, "learning_rate": 4.38019535395558e-06, "loss": 0.8651, "step": 13367 }, { "epoch": 0.25, "learning_rate": 4.380094666661733e-06, "loss": 1.1212, "step": 13368 }, { "epoch": 0.25, "learning_rate": 4.37999397234767e-06, "loss": 0.9509, "step": 13369 }, { "epoch": 0.25, "learning_rate": 4.379893271013768e-06, "loss": 1.0093, "step": 13370 }, { "epoch": 0.25, "learning_rate": 4.379792562660401e-06, "loss": 0.7699, "step": 13371 }, { "epoch": 0.25, "learning_rate": 4.379691847287947e-06, "loss": 1.04, "step": 13372 }, { "epoch": 0.25, "learning_rate": 4.37959112489678e-06, "loss": 0.8614, "step": 13373 }, { "epoch": 0.25, "learning_rate": 4.379490395487278e-06, "loss": 1.0865, "step": 13374 }, { "epoch": 0.25, "learning_rate": 4.379389659059817e-06, "loss": 1.0098, "step": 13375 }, { "epoch": 0.25, "learning_rate": 4.3792889156147726e-06, "loss": 0.7678, "step": 13376 }, { "epoch": 0.25, "learning_rate": 4.379188165152521e-06, "loss": 0.8018, "step": 13377 }, { "epoch": 0.25, "learning_rate": 4.379087407673438e-06, "loss": 0.85, "step": 13378 }, { "epoch": 0.25, "learning_rate": 4.3789866431779005e-06, "loss": 0.8882, "step": 13379 }, { "epoch": 0.25, "learning_rate": 4.378885871666284e-06, "loss": 1.1049, "step": 13380 }, { "epoch": 0.25, "learning_rate": 4.378785093138966e-06, "loss": 0.8671, "step": 13381 }, { "epoch": 0.25, "learning_rate": 4.378684307596321e-06, "loss": 1.0507, "step": 13382 }, { "epoch": 0.25, "learning_rate": 4.3785835150387275e-06, "loss": 0.9867, "step": 13383 }, { "epoch": 0.25, "learning_rate": 4.378482715466561e-06, "loss": 0.9198, "step": 13384 }, { "epoch": 0.25, "learning_rate": 4.378381908880197e-06, "loss": 0.9975, "step": 13385 }, { "epoch": 0.25, "learning_rate": 4.378281095280013e-06, "loss": 0.7938, "step": 13386 }, { "epoch": 0.25, "learning_rate": 4.378180274666384e-06, "loss": 0.9969, "step": 13387 }, { "epoch": 0.25, "learning_rate": 4.378079447039688e-06, "loss": 1.015, "step": 13388 }, { "epoch": 0.25, "learning_rate": 4.377978612400301e-06, "loss": 0.9578, "step": 13389 }, { "epoch": 0.25, "learning_rate": 4.377877770748599e-06, "loss": 0.8022, "step": 13390 }, { "epoch": 0.25, "learning_rate": 4.37777692208496e-06, "loss": 0.9147, "step": 13391 }, { "epoch": 0.25, "learning_rate": 4.377676066409759e-06, "loss": 0.914, "step": 13392 }, { "epoch": 0.25, "learning_rate": 4.377575203723372e-06, "loss": 1.0071, "step": 13393 }, { "epoch": 0.25, "learning_rate": 4.377474334026178e-06, "loss": 1.1877, "step": 13394 }, { "epoch": 0.25, "learning_rate": 4.3773734573185525e-06, "loss": 0.7941, "step": 13395 }, { "epoch": 0.25, "learning_rate": 4.3772725736008716e-06, "loss": 1.0146, "step": 13396 }, { "epoch": 0.25, "learning_rate": 4.3771716828735135e-06, "loss": 0.9619, "step": 13397 }, { "epoch": 0.25, "learning_rate": 4.377070785136853e-06, "loss": 0.8765, "step": 13398 }, { "epoch": 0.25, "learning_rate": 4.376969880391267e-06, "loss": 0.8637, "step": 13399 }, { "epoch": 0.25, "learning_rate": 4.3768689686371344e-06, "loss": 1.0304, "step": 13400 }, { "epoch": 0.25, "learning_rate": 4.37676804987483e-06, "loss": 0.9108, "step": 13401 }, { "epoch": 0.25, "learning_rate": 4.376667124104731e-06, "loss": 0.8994, "step": 13402 }, { "epoch": 0.25, "learning_rate": 4.376566191327214e-06, "loss": 1.0839, "step": 13403 }, { "epoch": 0.25, "learning_rate": 4.376465251542657e-06, "loss": 0.7409, "step": 13404 }, { "epoch": 0.25, "learning_rate": 4.376364304751437e-06, "loss": 1.0279, "step": 13405 }, { "epoch": 0.25, "learning_rate": 4.3762633509539295e-06, "loss": 1.1027, "step": 13406 }, { "epoch": 0.25, "learning_rate": 4.3761623901505125e-06, "loss": 0.9135, "step": 13407 }, { "epoch": 0.25, "learning_rate": 4.376061422341563e-06, "loss": 0.8759, "step": 13408 }, { "epoch": 0.25, "learning_rate": 4.375960447527456e-06, "loss": 0.996, "step": 13409 }, { "epoch": 0.25, "learning_rate": 4.3758594657085716e-06, "loss": 0.868, "step": 13410 }, { "epoch": 0.25, "learning_rate": 4.375758476885286e-06, "loss": 0.7745, "step": 13411 }, { "epoch": 0.25, "learning_rate": 4.375657481057974e-06, "loss": 1.257, "step": 13412 }, { "epoch": 0.25, "learning_rate": 4.375556478227016e-06, "loss": 0.7054, "step": 13413 }, { "epoch": 0.25, "learning_rate": 4.3754554683927875e-06, "loss": 0.9774, "step": 13414 }, { "epoch": 0.25, "learning_rate": 4.375354451555665e-06, "loss": 0.8421, "step": 13415 }, { "epoch": 0.25, "learning_rate": 4.375253427716027e-06, "loss": 0.9219, "step": 13416 }, { "epoch": 0.25, "learning_rate": 4.3751523968742496e-06, "loss": 0.7966, "step": 13417 }, { "epoch": 0.25, "learning_rate": 4.375051359030712e-06, "loss": 1.0113, "step": 13418 }, { "epoch": 0.25, "learning_rate": 4.374950314185789e-06, "loss": 0.9412, "step": 13419 }, { "epoch": 0.25, "learning_rate": 4.374849262339859e-06, "loss": 0.7044, "step": 13420 }, { "epoch": 0.25, "learning_rate": 4.3747482034932996e-06, "loss": 1.0508, "step": 13421 }, { "epoch": 0.25, "learning_rate": 4.3746471376464875e-06, "loss": 1.0289, "step": 13422 }, { "epoch": 0.25, "learning_rate": 4.3745460647998e-06, "loss": 0.7975, "step": 13423 }, { "epoch": 0.25, "learning_rate": 4.3744449849536165e-06, "loss": 1.041, "step": 13424 }, { "epoch": 0.25, "learning_rate": 4.374343898108312e-06, "loss": 1.2325, "step": 13425 }, { "epoch": 0.25, "learning_rate": 4.374242804264265e-06, "loss": 1.0344, "step": 13426 }, { "epoch": 0.25, "learning_rate": 4.3741417034218524e-06, "loss": 1.0887, "step": 13427 }, { "epoch": 0.25, "learning_rate": 4.374040595581453e-06, "loss": 0.929, "step": 13428 }, { "epoch": 0.25, "learning_rate": 4.373939480743443e-06, "loss": 0.783, "step": 13429 }, { "epoch": 0.25, "learning_rate": 4.3738383589082006e-06, "loss": 1.0605, "step": 13430 }, { "epoch": 0.25, "learning_rate": 4.373737230076103e-06, "loss": 1.1138, "step": 13431 }, { "epoch": 0.25, "learning_rate": 4.373636094247529e-06, "loss": 1.0135, "step": 13432 }, { "epoch": 0.25, "learning_rate": 4.373534951422854e-06, "loss": 0.8811, "step": 13433 }, { "epoch": 0.25, "learning_rate": 4.373433801602457e-06, "loss": 0.9613, "step": 13434 }, { "epoch": 0.25, "learning_rate": 4.373332644786716e-06, "loss": 0.791, "step": 13435 }, { "epoch": 0.25, "learning_rate": 4.373231480976009e-06, "loss": 1.0286, "step": 13436 }, { "epoch": 0.25, "learning_rate": 4.373130310170712e-06, "loss": 1.2081, "step": 13437 }, { "epoch": 0.25, "learning_rate": 4.373029132371204e-06, "loss": 1.137, "step": 13438 }, { "epoch": 0.25, "learning_rate": 4.372927947577863e-06, "loss": 0.9862, "step": 13439 }, { "epoch": 0.25, "learning_rate": 4.3728267557910666e-06, "loss": 0.9051, "step": 13440 }, { "epoch": 0.25, "learning_rate": 4.372725557011192e-06, "loss": 0.8912, "step": 13441 }, { "epoch": 0.25, "learning_rate": 4.372624351238618e-06, "loss": 0.9845, "step": 13442 }, { "epoch": 0.25, "learning_rate": 4.372523138473722e-06, "loss": 1.0167, "step": 13443 }, { "epoch": 0.25, "learning_rate": 4.372421918716882e-06, "loss": 1.0531, "step": 13444 }, { "epoch": 0.25, "learning_rate": 4.372320691968476e-06, "loss": 0.9414, "step": 13445 }, { "epoch": 0.25, "learning_rate": 4.372219458228882e-06, "loss": 1.0386, "step": 13446 }, { "epoch": 0.25, "learning_rate": 4.3721182174984776e-06, "loss": 0.8171, "step": 13447 }, { "epoch": 0.25, "learning_rate": 4.372016969777641e-06, "loss": 0.725, "step": 13448 }, { "epoch": 0.25, "learning_rate": 4.371915715066751e-06, "loss": 1.1631, "step": 13449 }, { "epoch": 0.25, "learning_rate": 4.371814453366185e-06, "loss": 1.1026, "step": 13450 }, { "epoch": 0.25, "learning_rate": 4.3717131846763215e-06, "loss": 1.0397, "step": 13451 }, { "epoch": 0.25, "learning_rate": 4.371611908997538e-06, "loss": 0.7309, "step": 13452 }, { "epoch": 0.25, "learning_rate": 4.371510626330213e-06, "loss": 0.9318, "step": 13453 }, { "epoch": 0.25, "learning_rate": 4.371409336674725e-06, "loss": 0.9788, "step": 13454 }, { "epoch": 0.25, "learning_rate": 4.3713080400314515e-06, "loss": 1.1407, "step": 13455 }, { "epoch": 0.25, "learning_rate": 4.3712067364007716e-06, "loss": 0.9505, "step": 13456 }, { "epoch": 0.25, "learning_rate": 4.3711054257830625e-06, "loss": 0.8477, "step": 13457 }, { "epoch": 0.25, "learning_rate": 4.371004108178704e-06, "loss": 0.7779, "step": 13458 }, { "epoch": 0.25, "learning_rate": 4.3709027835880725e-06, "loss": 0.8235, "step": 13459 }, { "epoch": 0.25, "learning_rate": 4.370801452011548e-06, "loss": 0.7424, "step": 13460 }, { "epoch": 0.25, "learning_rate": 4.370700113449508e-06, "loss": 1.1868, "step": 13461 }, { "epoch": 0.25, "learning_rate": 4.370598767902331e-06, "loss": 1.1208, "step": 13462 }, { "epoch": 0.25, "learning_rate": 4.370497415370396e-06, "loss": 0.9726, "step": 13463 }, { "epoch": 0.25, "learning_rate": 4.3703960558540806e-06, "loss": 0.905, "step": 13464 }, { "epoch": 0.25, "learning_rate": 4.370294689353764e-06, "loss": 1.0074, "step": 13465 }, { "epoch": 0.25, "learning_rate": 4.370193315869824e-06, "loss": 0.8943, "step": 13466 }, { "epoch": 0.25, "learning_rate": 4.37009193540264e-06, "loss": 0.9376, "step": 13467 }, { "epoch": 0.25, "learning_rate": 4.3699905479525896e-06, "loss": 0.9507, "step": 13468 }, { "epoch": 0.25, "learning_rate": 4.369889153520051e-06, "loss": 1.2487, "step": 13469 }, { "epoch": 0.25, "learning_rate": 4.369787752105405e-06, "loss": 0.9113, "step": 13470 }, { "epoch": 0.25, "learning_rate": 4.36968634370903e-06, "loss": 0.8796, "step": 13471 }, { "epoch": 0.25, "learning_rate": 4.369584928331301e-06, "loss": 0.9218, "step": 13472 }, { "epoch": 0.25, "learning_rate": 4.3694835059726005e-06, "loss": 0.9313, "step": 13473 }, { "epoch": 0.25, "learning_rate": 4.369382076633305e-06, "loss": 0.8912, "step": 13474 }, { "epoch": 0.25, "learning_rate": 4.369280640313795e-06, "loss": 0.9562, "step": 13475 }, { "epoch": 0.25, "learning_rate": 4.369179197014448e-06, "loss": 1.0312, "step": 13476 }, { "epoch": 0.25, "learning_rate": 4.369077746735644e-06, "loss": 0.8266, "step": 13477 }, { "epoch": 0.25, "learning_rate": 4.36897628947776e-06, "loss": 0.7773, "step": 13478 }, { "epoch": 0.25, "learning_rate": 4.368874825241176e-06, "loss": 0.6764, "step": 13479 }, { "epoch": 0.25, "learning_rate": 4.368773354026271e-06, "loss": 1.1561, "step": 13480 }, { "epoch": 0.25, "learning_rate": 4.368671875833424e-06, "loss": 1.2173, "step": 13481 }, { "epoch": 0.25, "learning_rate": 4.368570390663013e-06, "loss": 0.8704, "step": 13482 }, { "epoch": 0.25, "learning_rate": 4.368468898515418e-06, "loss": 1.0916, "step": 13483 }, { "epoch": 0.25, "learning_rate": 4.368367399391016e-06, "loss": 0.9751, "step": 13484 }, { "epoch": 0.25, "learning_rate": 4.368265893290189e-06, "loss": 0.8448, "step": 13485 }, { "epoch": 0.25, "learning_rate": 4.368164380213313e-06, "loss": 0.8753, "step": 13486 }, { "epoch": 0.25, "learning_rate": 4.36806286016077e-06, "loss": 1.0391, "step": 13487 }, { "epoch": 0.25, "learning_rate": 4.3679613331329365e-06, "loss": 0.9677, "step": 13488 }, { "epoch": 0.25, "learning_rate": 4.367859799130193e-06, "loss": 0.783, "step": 13489 }, { "epoch": 0.25, "learning_rate": 4.367758258152917e-06, "loss": 1.025, "step": 13490 }, { "epoch": 0.25, "learning_rate": 4.367656710201491e-06, "loss": 0.8823, "step": 13491 }, { "epoch": 0.25, "learning_rate": 4.3675551552762915e-06, "loss": 0.908, "step": 13492 }, { "epoch": 0.25, "learning_rate": 4.367453593377698e-06, "loss": 0.8577, "step": 13493 }, { "epoch": 0.25, "learning_rate": 4.36735202450609e-06, "loss": 1.0851, "step": 13494 }, { "epoch": 0.25, "learning_rate": 4.367250448661847e-06, "loss": 0.9572, "step": 13495 }, { "epoch": 0.25, "learning_rate": 4.367148865845348e-06, "loss": 1.0181, "step": 13496 }, { "epoch": 0.25, "learning_rate": 4.367047276056972e-06, "loss": 0.7643, "step": 13497 }, { "epoch": 0.25, "learning_rate": 4.366945679297099e-06, "loss": 0.9407, "step": 13498 }, { "epoch": 0.25, "learning_rate": 4.366844075566109e-06, "loss": 1.1148, "step": 13499 }, { "epoch": 0.25, "learning_rate": 4.366742464864379e-06, "loss": 1.2686, "step": 13500 }, { "epoch": 0.25, "learning_rate": 4.36664084719229e-06, "loss": 1.0352, "step": 13501 }, { "epoch": 0.25, "learning_rate": 4.366539222550222e-06, "loss": 0.9112, "step": 13502 }, { "epoch": 0.25, "learning_rate": 4.366437590938554e-06, "loss": 1.042, "step": 13503 }, { "epoch": 0.25, "learning_rate": 4.366335952357665e-06, "loss": 0.7245, "step": 13504 }, { "epoch": 0.25, "learning_rate": 4.366234306807934e-06, "loss": 1.1074, "step": 13505 }, { "epoch": 0.25, "learning_rate": 4.366132654289742e-06, "loss": 1.1718, "step": 13506 }, { "epoch": 0.25, "learning_rate": 4.366030994803468e-06, "loss": 0.7762, "step": 13507 }, { "epoch": 0.25, "learning_rate": 4.365929328349491e-06, "loss": 0.8809, "step": 13508 }, { "epoch": 0.25, "learning_rate": 4.365827654928192e-06, "loss": 0.8164, "step": 13509 }, { "epoch": 0.25, "learning_rate": 4.365725974539949e-06, "loss": 0.9131, "step": 13510 }, { "epoch": 0.25, "learning_rate": 4.365624287185143e-06, "loss": 0.9457, "step": 13511 }, { "epoch": 0.25, "learning_rate": 4.365522592864152e-06, "loss": 1.2611, "step": 13512 }, { "epoch": 0.25, "learning_rate": 4.365420891577357e-06, "loss": 0.9656, "step": 13513 }, { "epoch": 0.25, "learning_rate": 4.365319183325139e-06, "loss": 0.9926, "step": 13514 }, { "epoch": 0.25, "learning_rate": 4.365217468107875e-06, "loss": 1.0084, "step": 13515 }, { "epoch": 0.26, "learning_rate": 4.3651157459259465e-06, "loss": 0.7119, "step": 13516 }, { "epoch": 0.26, "learning_rate": 4.365014016779733e-06, "loss": 0.9881, "step": 13517 }, { "epoch": 0.26, "learning_rate": 4.364912280669615e-06, "loss": 1.095, "step": 13518 }, { "epoch": 0.26, "learning_rate": 4.364810537595971e-06, "loss": 1.076, "step": 13519 }, { "epoch": 0.26, "learning_rate": 4.364708787559182e-06, "loss": 0.9831, "step": 13520 }, { "epoch": 0.26, "learning_rate": 4.364607030559627e-06, "loss": 0.9299, "step": 13521 }, { "epoch": 0.26, "learning_rate": 4.364505266597687e-06, "loss": 0.7886, "step": 13522 }, { "epoch": 0.26, "learning_rate": 4.364403495673742e-06, "loss": 0.8873, "step": 13523 }, { "epoch": 0.26, "learning_rate": 4.36430171778817e-06, "loss": 1.0837, "step": 13524 }, { "epoch": 0.26, "learning_rate": 4.364199932941353e-06, "loss": 0.9247, "step": 13525 }, { "epoch": 0.26, "learning_rate": 4.364098141133671e-06, "loss": 0.6618, "step": 13526 }, { "epoch": 0.26, "learning_rate": 4.363996342365504e-06, "loss": 0.9041, "step": 13527 }, { "epoch": 0.26, "learning_rate": 4.363894536637232e-06, "loss": 0.765, "step": 13528 }, { "epoch": 0.26, "learning_rate": 4.363792723949235e-06, "loss": 0.8721, "step": 13529 }, { "epoch": 0.26, "learning_rate": 4.363690904301891e-06, "loss": 0.9937, "step": 13530 }, { "epoch": 0.26, "learning_rate": 4.363589077695584e-06, "loss": 1.2221, "step": 13531 }, { "epoch": 0.26, "learning_rate": 4.363487244130693e-06, "loss": 1.2186, "step": 13532 }, { "epoch": 0.26, "learning_rate": 4.363385403607597e-06, "loss": 0.9083, "step": 13533 }, { "epoch": 0.26, "learning_rate": 4.3632835561266775e-06, "loss": 1.0673, "step": 13534 }, { "epoch": 0.26, "learning_rate": 4.363181701688315e-06, "loss": 0.949, "step": 13535 }, { "epoch": 0.26, "learning_rate": 4.363079840292887e-06, "loss": 0.8144, "step": 13536 }, { "epoch": 0.26, "learning_rate": 4.362977971940778e-06, "loss": 0.8977, "step": 13537 }, { "epoch": 0.26, "learning_rate": 4.362876096632365e-06, "loss": 1.019, "step": 13538 }, { "epoch": 0.26, "learning_rate": 4.3627742143680306e-06, "loss": 0.8908, "step": 13539 }, { "epoch": 0.26, "learning_rate": 4.362672325148154e-06, "loss": 0.9793, "step": 13540 }, { "epoch": 0.26, "learning_rate": 4.362570428973117e-06, "loss": 1.0048, "step": 13541 }, { "epoch": 0.26, "learning_rate": 4.362468525843298e-06, "loss": 1.0027, "step": 13542 }, { "epoch": 0.26, "learning_rate": 4.362366615759079e-06, "loss": 1.0593, "step": 13543 }, { "epoch": 0.26, "learning_rate": 4.36226469872084e-06, "loss": 1.1904, "step": 13544 }, { "epoch": 0.26, "learning_rate": 4.362162774728962e-06, "loss": 0.9559, "step": 13545 }, { "epoch": 0.26, "learning_rate": 4.3620608437838245e-06, "loss": 0.834, "step": 13546 }, { "epoch": 0.26, "learning_rate": 4.36195890588581e-06, "loss": 0.7135, "step": 13547 }, { "epoch": 0.26, "learning_rate": 4.361856961035297e-06, "loss": 0.7819, "step": 13548 }, { "epoch": 0.26, "learning_rate": 4.361755009232667e-06, "loss": 1.1948, "step": 13549 }, { "epoch": 0.26, "learning_rate": 4.361653050478302e-06, "loss": 1.1761, "step": 13550 }, { "epoch": 0.26, "learning_rate": 4.361551084772582e-06, "loss": 0.855, "step": 13551 }, { "epoch": 0.26, "learning_rate": 4.3614491121158865e-06, "loss": 0.9318, "step": 13552 }, { "epoch": 0.26, "learning_rate": 4.361347132508597e-06, "loss": 0.9077, "step": 13553 }, { "epoch": 0.26, "learning_rate": 4.361245145951095e-06, "loss": 0.9199, "step": 13554 }, { "epoch": 0.26, "learning_rate": 4.36114315244376e-06, "loss": 1.1678, "step": 13555 }, { "epoch": 0.26, "learning_rate": 4.361041151986973e-06, "loss": 1.1115, "step": 13556 }, { "epoch": 0.26, "learning_rate": 4.360939144581117e-06, "loss": 1.2119, "step": 13557 }, { "epoch": 0.26, "learning_rate": 4.360837130226571e-06, "loss": 1.0394, "step": 13558 }, { "epoch": 0.26, "learning_rate": 4.360735108923715e-06, "loss": 0.8788, "step": 13559 }, { "epoch": 0.26, "learning_rate": 4.360633080672931e-06, "loss": 0.8731, "step": 13560 }, { "epoch": 0.26, "learning_rate": 4.360531045474602e-06, "loss": 1.0041, "step": 13561 }, { "epoch": 0.26, "learning_rate": 4.360429003329105e-06, "loss": 1.1509, "step": 13562 }, { "epoch": 0.26, "learning_rate": 4.360326954236825e-06, "loss": 1.0024, "step": 13563 }, { "epoch": 0.26, "learning_rate": 4.36022489819814e-06, "loss": 1.102, "step": 13564 }, { "epoch": 0.26, "learning_rate": 4.360122835213433e-06, "loss": 0.9382, "step": 13565 }, { "epoch": 0.26, "learning_rate": 4.360020765283084e-06, "loss": 0.8457, "step": 13566 }, { "epoch": 0.26, "learning_rate": 4.359918688407474e-06, "loss": 0.8735, "step": 13567 }, { "epoch": 0.26, "learning_rate": 4.359816604586985e-06, "loss": 0.9187, "step": 13568 }, { "epoch": 0.26, "learning_rate": 4.3597145138219984e-06, "loss": 1.0712, "step": 13569 }, { "epoch": 0.26, "learning_rate": 4.359612416112894e-06, "loss": 1.0265, "step": 13570 }, { "epoch": 0.26, "learning_rate": 4.359510311460054e-06, "loss": 0.9319, "step": 13571 }, { "epoch": 0.26, "learning_rate": 4.35940819986386e-06, "loss": 0.8814, "step": 13572 }, { "epoch": 0.26, "learning_rate": 4.3593060813246926e-06, "loss": 0.7692, "step": 13573 }, { "epoch": 0.26, "learning_rate": 4.359203955842933e-06, "loss": 0.8446, "step": 13574 }, { "epoch": 0.26, "learning_rate": 4.359101823418964e-06, "loss": 0.8272, "step": 13575 }, { "epoch": 0.26, "learning_rate": 4.358999684053164e-06, "loss": 0.9086, "step": 13576 }, { "epoch": 0.26, "learning_rate": 4.358897537745917e-06, "loss": 0.838, "step": 13577 }, { "epoch": 0.26, "learning_rate": 4.358795384497605e-06, "loss": 1.0031, "step": 13578 }, { "epoch": 0.26, "learning_rate": 4.358693224308606e-06, "loss": 0.7607, "step": 13579 }, { "epoch": 0.26, "learning_rate": 4.358591057179304e-06, "loss": 0.9095, "step": 13580 }, { "epoch": 0.26, "learning_rate": 4.35848888311008e-06, "loss": 1.0654, "step": 13581 }, { "epoch": 0.26, "learning_rate": 4.358386702101316e-06, "loss": 0.878, "step": 13582 }, { "epoch": 0.26, "learning_rate": 4.358284514153392e-06, "loss": 0.7389, "step": 13583 }, { "epoch": 0.26, "learning_rate": 4.358182319266692e-06, "loss": 0.9938, "step": 13584 }, { "epoch": 0.26, "learning_rate": 4.358080117441595e-06, "loss": 0.807, "step": 13585 }, { "epoch": 0.26, "learning_rate": 4.357977908678485e-06, "loss": 1.0314, "step": 13586 }, { "epoch": 0.26, "learning_rate": 4.357875692977741e-06, "loss": 1.2562, "step": 13587 }, { "epoch": 0.26, "learning_rate": 4.357773470339746e-06, "loss": 1.0096, "step": 13588 }, { "epoch": 0.26, "learning_rate": 4.357671240764884e-06, "loss": 1.1044, "step": 13589 }, { "epoch": 0.26, "learning_rate": 4.357569004253533e-06, "loss": 0.8178, "step": 13590 }, { "epoch": 0.26, "learning_rate": 4.357466760806076e-06, "loss": 0.7728, "step": 13591 }, { "epoch": 0.26, "learning_rate": 4.357364510422896e-06, "loss": 0.9529, "step": 13592 }, { "epoch": 0.26, "learning_rate": 4.357262253104374e-06, "loss": 1.138, "step": 13593 }, { "epoch": 0.26, "learning_rate": 4.357159988850891e-06, "loss": 0.9534, "step": 13594 }, { "epoch": 0.26, "learning_rate": 4.3570577176628295e-06, "loss": 0.8092, "step": 13595 }, { "epoch": 0.26, "learning_rate": 4.356955439540572e-06, "loss": 0.973, "step": 13596 }, { "epoch": 0.26, "learning_rate": 4.3568531544844985e-06, "loss": 0.9182, "step": 13597 }, { "epoch": 0.26, "learning_rate": 4.3567508624949936e-06, "loss": 0.8521, "step": 13598 }, { "epoch": 0.26, "learning_rate": 4.356648563572438e-06, "loss": 1.0163, "step": 13599 }, { "epoch": 0.26, "learning_rate": 4.3565462577172126e-06, "loss": 1.2392, "step": 13600 }, { "epoch": 0.26, "learning_rate": 4.3564439449297005e-06, "loss": 0.7794, "step": 13601 }, { "epoch": 0.26, "learning_rate": 4.356341625210284e-06, "loss": 0.8752, "step": 13602 }, { "epoch": 0.26, "learning_rate": 4.356239298559345e-06, "loss": 1.0536, "step": 13603 }, { "epoch": 0.26, "learning_rate": 4.356136964977265e-06, "loss": 0.918, "step": 13604 }, { "epoch": 0.26, "learning_rate": 4.356034624464427e-06, "loss": 0.7324, "step": 13605 }, { "epoch": 0.26, "learning_rate": 4.355932277021212e-06, "loss": 1.1343, "step": 13606 }, { "epoch": 0.26, "learning_rate": 4.355829922648004e-06, "loss": 0.9991, "step": 13607 }, { "epoch": 0.26, "learning_rate": 4.355727561345182e-06, "loss": 1.0239, "step": 13608 }, { "epoch": 0.26, "learning_rate": 4.355625193113131e-06, "loss": 0.8965, "step": 13609 }, { "epoch": 0.26, "learning_rate": 4.355522817952233e-06, "loss": 0.8948, "step": 13610 }, { "epoch": 0.26, "learning_rate": 4.3554204358628695e-06, "loss": 0.9282, "step": 13611 }, { "epoch": 0.26, "learning_rate": 4.355318046845423e-06, "loss": 1.0958, "step": 13612 }, { "epoch": 0.26, "learning_rate": 4.355215650900275e-06, "loss": 0.7977, "step": 13613 }, { "epoch": 0.26, "learning_rate": 4.355113248027809e-06, "loss": 0.6687, "step": 13614 }, { "epoch": 0.26, "learning_rate": 4.355010838228407e-06, "loss": 0.7854, "step": 13615 }, { "epoch": 0.26, "learning_rate": 4.354908421502453e-06, "loss": 0.8984, "step": 13616 }, { "epoch": 0.26, "learning_rate": 4.354805997850325e-06, "loss": 0.8351, "step": 13617 }, { "epoch": 0.26, "learning_rate": 4.35470356727241e-06, "loss": 1.0901, "step": 13618 }, { "epoch": 0.26, "learning_rate": 4.354601129769089e-06, "loss": 1.0604, "step": 13619 }, { "epoch": 0.26, "learning_rate": 4.354498685340744e-06, "loss": 0.955, "step": 13620 }, { "epoch": 0.26, "learning_rate": 4.354396233987757e-06, "loss": 0.8524, "step": 13621 }, { "epoch": 0.26, "learning_rate": 4.354293775710512e-06, "loss": 0.9791, "step": 13622 }, { "epoch": 0.26, "learning_rate": 4.354191310509391e-06, "loss": 0.8774, "step": 13623 }, { "epoch": 0.26, "learning_rate": 4.3540888383847765e-06, "loss": 0.9556, "step": 13624 }, { "epoch": 0.26, "learning_rate": 4.35398635933705e-06, "loss": 0.9566, "step": 13625 }, { "epoch": 0.26, "learning_rate": 4.353883873366597e-06, "loss": 0.8059, "step": 13626 }, { "epoch": 0.26, "learning_rate": 4.3537813804737976e-06, "loss": 0.9379, "step": 13627 }, { "epoch": 0.26, "learning_rate": 4.353678880659035e-06, "loss": 0.7243, "step": 13628 }, { "epoch": 0.26, "learning_rate": 4.353576373922692e-06, "loss": 1.0541, "step": 13629 }, { "epoch": 0.26, "learning_rate": 4.353473860265153e-06, "loss": 0.8653, "step": 13630 }, { "epoch": 0.26, "learning_rate": 4.353371339686798e-06, "loss": 1.0532, "step": 13631 }, { "epoch": 0.26, "learning_rate": 4.353268812188012e-06, "loss": 1.1319, "step": 13632 }, { "epoch": 0.26, "learning_rate": 4.3531662777691775e-06, "loss": 0.8006, "step": 13633 }, { "epoch": 0.26, "learning_rate": 4.353063736430677e-06, "loss": 1.0526, "step": 13634 }, { "epoch": 0.26, "learning_rate": 4.352961188172893e-06, "loss": 0.903, "step": 13635 }, { "epoch": 0.26, "learning_rate": 4.3528586329962075e-06, "loss": 0.9008, "step": 13636 }, { "epoch": 0.26, "learning_rate": 4.352756070901006e-06, "loss": 1.0803, "step": 13637 }, { "epoch": 0.26, "learning_rate": 4.352653501887671e-06, "loss": 0.9485, "step": 13638 }, { "epoch": 0.26, "learning_rate": 4.3525509259565825e-06, "loss": 0.9381, "step": 13639 }, { "epoch": 0.26, "learning_rate": 4.352448343108127e-06, "loss": 0.8438, "step": 13640 }, { "epoch": 0.26, "learning_rate": 4.352345753342686e-06, "loss": 1.0429, "step": 13641 }, { "epoch": 0.26, "learning_rate": 4.3522431566606415e-06, "loss": 0.944, "step": 13642 }, { "epoch": 0.26, "learning_rate": 4.352140553062379e-06, "loss": 0.8542, "step": 13643 }, { "epoch": 0.26, "learning_rate": 4.352037942548281e-06, "loss": 1.0194, "step": 13644 }, { "epoch": 0.26, "learning_rate": 4.351935325118729e-06, "loss": 0.927, "step": 13645 }, { "epoch": 0.26, "learning_rate": 4.351832700774108e-06, "loss": 0.9784, "step": 13646 }, { "epoch": 0.26, "learning_rate": 4.3517300695148e-06, "loss": 0.8251, "step": 13647 }, { "epoch": 0.26, "learning_rate": 4.351627431341189e-06, "loss": 0.7908, "step": 13648 }, { "epoch": 0.26, "learning_rate": 4.351524786253658e-06, "loss": 1.1415, "step": 13649 }, { "epoch": 0.26, "learning_rate": 4.35142213425259e-06, "loss": 1.092, "step": 13650 }, { "epoch": 0.26, "learning_rate": 4.351319475338368e-06, "loss": 1.0222, "step": 13651 }, { "epoch": 0.26, "learning_rate": 4.351216809511377e-06, "loss": 0.9378, "step": 13652 }, { "epoch": 0.26, "learning_rate": 4.351114136771999e-06, "loss": 0.9729, "step": 13653 }, { "epoch": 0.26, "learning_rate": 4.3510114571206165e-06, "loss": 0.9385, "step": 13654 }, { "epoch": 0.26, "learning_rate": 4.350908770557615e-06, "loss": 0.8503, "step": 13655 }, { "epoch": 0.26, "learning_rate": 4.3508060770833775e-06, "loss": 1.0067, "step": 13656 }, { "epoch": 0.26, "learning_rate": 4.3507033766982856e-06, "loss": 0.8893, "step": 13657 }, { "epoch": 0.26, "learning_rate": 4.350600669402724e-06, "loss": 0.8127, "step": 13658 }, { "epoch": 0.26, "learning_rate": 4.350497955197077e-06, "loss": 0.8838, "step": 13659 }, { "epoch": 0.26, "learning_rate": 4.350395234081727e-06, "loss": 0.8136, "step": 13660 }, { "epoch": 0.26, "learning_rate": 4.350292506057058e-06, "loss": 1.0861, "step": 13661 }, { "epoch": 0.26, "learning_rate": 4.350189771123453e-06, "loss": 1.127, "step": 13662 }, { "epoch": 0.26, "learning_rate": 4.350087029281297e-06, "loss": 1.1052, "step": 13663 }, { "epoch": 0.26, "learning_rate": 4.3499842805309715e-06, "loss": 0.7998, "step": 13664 }, { "epoch": 0.26, "learning_rate": 4.349881524872862e-06, "loss": 0.9989, "step": 13665 }, { "epoch": 0.26, "learning_rate": 4.349778762307352e-06, "loss": 0.9793, "step": 13666 }, { "epoch": 0.26, "learning_rate": 4.349675992834826e-06, "loss": 0.7872, "step": 13667 }, { "epoch": 0.26, "learning_rate": 4.349573216455664e-06, "loss": 1.0599, "step": 13668 }, { "epoch": 0.26, "learning_rate": 4.349470433170254e-06, "loss": 0.9026, "step": 13669 }, { "epoch": 0.26, "learning_rate": 4.349367642978977e-06, "loss": 1.053, "step": 13670 }, { "epoch": 0.26, "learning_rate": 4.349264845882218e-06, "loss": 1.0873, "step": 13671 }, { "epoch": 0.26, "learning_rate": 4.3491620418803625e-06, "loss": 0.89, "step": 13672 }, { "epoch": 0.26, "learning_rate": 4.349059230973791e-06, "loss": 0.8679, "step": 13673 }, { "epoch": 0.26, "learning_rate": 4.348956413162889e-06, "loss": 0.8995, "step": 13674 }, { "epoch": 0.26, "learning_rate": 4.348853588448041e-06, "loss": 1.3474, "step": 13675 }, { "epoch": 0.26, "learning_rate": 4.348750756829631e-06, "loss": 1.0066, "step": 13676 }, { "epoch": 0.26, "learning_rate": 4.348647918308042e-06, "loss": 0.9093, "step": 13677 }, { "epoch": 0.26, "learning_rate": 4.348545072883658e-06, "loss": 0.9433, "step": 13678 }, { "epoch": 0.26, "learning_rate": 4.348442220556863e-06, "loss": 0.9188, "step": 13679 }, { "epoch": 0.26, "learning_rate": 4.348339361328042e-06, "loss": 0.8676, "step": 13680 }, { "epoch": 0.26, "learning_rate": 4.348236495197578e-06, "loss": 1.1405, "step": 13681 }, { "epoch": 0.26, "learning_rate": 4.348133622165856e-06, "loss": 0.9822, "step": 13682 }, { "epoch": 0.26, "learning_rate": 4.34803074223326e-06, "loss": 0.8932, "step": 13683 }, { "epoch": 0.26, "learning_rate": 4.347927855400173e-06, "loss": 0.8927, "step": 13684 }, { "epoch": 0.26, "learning_rate": 4.347824961666981e-06, "loss": 0.8216, "step": 13685 }, { "epoch": 0.26, "learning_rate": 4.347722061034066e-06, "loss": 1.0206, "step": 13686 }, { "epoch": 0.26, "learning_rate": 4.3476191535018145e-06, "loss": 1.0213, "step": 13687 }, { "epoch": 0.26, "learning_rate": 4.347516239070609e-06, "loss": 1.0026, "step": 13688 }, { "epoch": 0.26, "learning_rate": 4.347413317740835e-06, "loss": 0.8473, "step": 13689 }, { "epoch": 0.26, "learning_rate": 4.347310389512877e-06, "loss": 1.0275, "step": 13690 }, { "epoch": 0.26, "learning_rate": 4.3472074543871176e-06, "loss": 1.0104, "step": 13691 }, { "epoch": 0.26, "learning_rate": 4.3471045123639435e-06, "loss": 0.8268, "step": 13692 }, { "epoch": 0.26, "learning_rate": 4.347001563443736e-06, "loss": 0.8845, "step": 13693 }, { "epoch": 0.26, "learning_rate": 4.346898607626883e-06, "loss": 0.962, "step": 13694 }, { "epoch": 0.26, "learning_rate": 4.346795644913766e-06, "loss": 0.8711, "step": 13695 }, { "epoch": 0.26, "learning_rate": 4.346692675304771e-06, "loss": 0.6369, "step": 13696 }, { "epoch": 0.26, "learning_rate": 4.346589698800282e-06, "loss": 0.9523, "step": 13697 }, { "epoch": 0.26, "learning_rate": 4.346486715400684e-06, "loss": 0.9506, "step": 13698 }, { "epoch": 0.26, "learning_rate": 4.346383725106361e-06, "loss": 1.1414, "step": 13699 }, { "epoch": 0.26, "learning_rate": 4.346280727917699e-06, "loss": 1.194, "step": 13700 }, { "epoch": 0.26, "learning_rate": 4.346177723835079e-06, "loss": 0.9901, "step": 13701 }, { "epoch": 0.26, "learning_rate": 4.34607471285889e-06, "loss": 0.9237, "step": 13702 }, { "epoch": 0.26, "learning_rate": 4.345971694989514e-06, "loss": 0.9011, "step": 13703 }, { "epoch": 0.26, "learning_rate": 4.345868670227335e-06, "loss": 1.0197, "step": 13704 }, { "epoch": 0.26, "learning_rate": 4.345765638572741e-06, "loss": 0.8645, "step": 13705 }, { "epoch": 0.26, "learning_rate": 4.345662600026114e-06, "loss": 0.8988, "step": 13706 }, { "epoch": 0.26, "learning_rate": 4.345559554587839e-06, "loss": 0.864, "step": 13707 }, { "epoch": 0.26, "learning_rate": 4.345456502258302e-06, "loss": 0.91, "step": 13708 }, { "epoch": 0.26, "learning_rate": 4.345353443037887e-06, "loss": 0.7651, "step": 13709 }, { "epoch": 0.26, "learning_rate": 4.345250376926977e-06, "loss": 0.8854, "step": 13710 }, { "epoch": 0.26, "learning_rate": 4.345147303925961e-06, "loss": 0.9111, "step": 13711 }, { "epoch": 0.26, "learning_rate": 4.34504422403522e-06, "loss": 1.1913, "step": 13712 }, { "epoch": 0.26, "learning_rate": 4.344941137255141e-06, "loss": 1.1018, "step": 13713 }, { "epoch": 0.26, "learning_rate": 4.344838043586108e-06, "loss": 1.0092, "step": 13714 }, { "epoch": 0.26, "learning_rate": 4.344734943028507e-06, "loss": 0.7988, "step": 13715 }, { "epoch": 0.26, "learning_rate": 4.3446318355827225e-06, "loss": 1.1699, "step": 13716 }, { "epoch": 0.26, "learning_rate": 4.344528721249139e-06, "loss": 1.0196, "step": 13717 }, { "epoch": 0.26, "learning_rate": 4.344425600028141e-06, "loss": 1.0778, "step": 13718 }, { "epoch": 0.26, "learning_rate": 4.344322471920115e-06, "loss": 1.1382, "step": 13719 }, { "epoch": 0.26, "learning_rate": 4.344219336925445e-06, "loss": 0.9482, "step": 13720 }, { "epoch": 0.26, "learning_rate": 4.344116195044517e-06, "loss": 1.0147, "step": 13721 }, { "epoch": 0.26, "learning_rate": 4.344013046277715e-06, "loss": 0.8788, "step": 13722 }, { "epoch": 0.26, "learning_rate": 4.3439098906254255e-06, "loss": 0.9845, "step": 13723 }, { "epoch": 0.26, "learning_rate": 4.343806728088033e-06, "loss": 0.9366, "step": 13724 }, { "epoch": 0.26, "learning_rate": 4.343703558665923e-06, "loss": 1.0612, "step": 13725 }, { "epoch": 0.26, "learning_rate": 4.34360038235948e-06, "loss": 0.7134, "step": 13726 }, { "epoch": 0.26, "learning_rate": 4.3434971991690895e-06, "loss": 0.985, "step": 13727 }, { "epoch": 0.26, "learning_rate": 4.3433940090951374e-06, "loss": 0.9307, "step": 13728 }, { "epoch": 0.26, "learning_rate": 4.343290812138008e-06, "loss": 0.8461, "step": 13729 }, { "epoch": 0.26, "learning_rate": 4.343187608298088e-06, "loss": 0.9073, "step": 13730 }, { "epoch": 0.26, "learning_rate": 4.343084397575761e-06, "loss": 1.0177, "step": 13731 }, { "epoch": 0.26, "learning_rate": 4.342981179971415e-06, "loss": 0.9335, "step": 13732 }, { "epoch": 0.26, "learning_rate": 4.342877955485431e-06, "loss": 0.8671, "step": 13733 }, { "epoch": 0.26, "learning_rate": 4.3427747241182e-06, "loss": 0.9745, "step": 13734 }, { "epoch": 0.26, "learning_rate": 4.342671485870103e-06, "loss": 0.8482, "step": 13735 }, { "epoch": 0.26, "learning_rate": 4.342568240741528e-06, "loss": 0.8711, "step": 13736 }, { "epoch": 0.26, "learning_rate": 4.3424649887328605e-06, "loss": 1.1406, "step": 13737 }, { "epoch": 0.26, "learning_rate": 4.342361729844484e-06, "loss": 0.8766, "step": 13738 }, { "epoch": 0.26, "learning_rate": 4.342258464076785e-06, "loss": 0.8063, "step": 13739 }, { "epoch": 0.26, "learning_rate": 4.34215519143015e-06, "loss": 1.1083, "step": 13740 }, { "epoch": 0.26, "learning_rate": 4.342051911904964e-06, "loss": 0.7955, "step": 13741 }, { "epoch": 0.26, "learning_rate": 4.341948625501613e-06, "loss": 0.9384, "step": 13742 }, { "epoch": 0.26, "learning_rate": 4.341845332220481e-06, "loss": 0.9583, "step": 13743 }, { "epoch": 0.26, "learning_rate": 4.3417420320619565e-06, "loss": 1.037, "step": 13744 }, { "epoch": 0.26, "learning_rate": 4.341638725026422e-06, "loss": 0.8647, "step": 13745 }, { "epoch": 0.26, "learning_rate": 4.341535411114267e-06, "loss": 0.9531, "step": 13746 }, { "epoch": 0.26, "learning_rate": 4.341432090325874e-06, "loss": 1.038, "step": 13747 }, { "epoch": 0.26, "learning_rate": 4.34132876266163e-06, "loss": 0.8609, "step": 13748 }, { "epoch": 0.26, "learning_rate": 4.3412254281219215e-06, "loss": 1.0022, "step": 13749 }, { "epoch": 0.26, "learning_rate": 4.341122086707133e-06, "loss": 0.8677, "step": 13750 }, { "epoch": 0.26, "learning_rate": 4.341018738417652e-06, "loss": 0.9462, "step": 13751 }, { "epoch": 0.26, "learning_rate": 4.340915383253863e-06, "loss": 0.7295, "step": 13752 }, { "epoch": 0.26, "learning_rate": 4.340812021216152e-06, "loss": 0.8619, "step": 13753 }, { "epoch": 0.26, "learning_rate": 4.340708652304906e-06, "loss": 0.8471, "step": 13754 }, { "epoch": 0.26, "learning_rate": 4.34060527652051e-06, "loss": 0.9219, "step": 13755 }, { "epoch": 0.26, "learning_rate": 4.34050189386335e-06, "loss": 0.8806, "step": 13756 }, { "epoch": 0.26, "learning_rate": 4.340398504333813e-06, "loss": 0.9951, "step": 13757 }, { "epoch": 0.26, "learning_rate": 4.340295107932284e-06, "loss": 0.924, "step": 13758 }, { "epoch": 0.26, "learning_rate": 4.340191704659149e-06, "loss": 0.771, "step": 13759 }, { "epoch": 0.26, "learning_rate": 4.3400882945147956e-06, "loss": 0.881, "step": 13760 }, { "epoch": 0.26, "learning_rate": 4.339984877499609e-06, "loss": 1.0699, "step": 13761 }, { "epoch": 0.26, "learning_rate": 4.3398814536139745e-06, "loss": 0.9473, "step": 13762 }, { "epoch": 0.26, "learning_rate": 4.3397780228582795e-06, "loss": 1.1976, "step": 13763 }, { "epoch": 0.26, "learning_rate": 4.339674585232909e-06, "loss": 0.8724, "step": 13764 }, { "epoch": 0.26, "learning_rate": 4.339571140738251e-06, "loss": 0.7998, "step": 13765 }, { "epoch": 0.26, "learning_rate": 4.33946768937469e-06, "loss": 0.8987, "step": 13766 }, { "epoch": 0.26, "learning_rate": 4.339364231142614e-06, "loss": 0.9086, "step": 13767 }, { "epoch": 0.26, "learning_rate": 4.339260766042408e-06, "loss": 1.2087, "step": 13768 }, { "epoch": 0.26, "learning_rate": 4.339157294074458e-06, "loss": 1.0603, "step": 13769 }, { "epoch": 0.26, "learning_rate": 4.339053815239152e-06, "loss": 1.0575, "step": 13770 }, { "epoch": 0.26, "learning_rate": 4.338950329536875e-06, "loss": 0.927, "step": 13771 }, { "epoch": 0.26, "learning_rate": 4.338846836968014e-06, "loss": 0.9146, "step": 13772 }, { "epoch": 0.26, "learning_rate": 4.3387433375329544e-06, "loss": 0.9765, "step": 13773 }, { "epoch": 0.26, "learning_rate": 4.338639831232084e-06, "loss": 0.8573, "step": 13774 }, { "epoch": 0.26, "learning_rate": 4.33853631806579e-06, "loss": 1.2731, "step": 13775 }, { "epoch": 0.26, "learning_rate": 4.338432798034457e-06, "loss": 1.0639, "step": 13776 }, { "epoch": 0.26, "learning_rate": 4.338329271138472e-06, "loss": 0.9093, "step": 13777 }, { "epoch": 0.26, "learning_rate": 4.338225737378222e-06, "loss": 0.9438, "step": 13778 }, { "epoch": 0.26, "learning_rate": 4.338122196754094e-06, "loss": 0.8675, "step": 13779 }, { "epoch": 0.26, "learning_rate": 4.338018649266473e-06, "loss": 1.0454, "step": 13780 }, { "epoch": 0.26, "learning_rate": 4.337915094915748e-06, "loss": 0.9164, "step": 13781 }, { "epoch": 0.26, "learning_rate": 4.337811533702303e-06, "loss": 1.1727, "step": 13782 }, { "epoch": 0.26, "learning_rate": 4.337707965626527e-06, "loss": 0.6686, "step": 13783 }, { "epoch": 0.26, "learning_rate": 4.337604390688805e-06, "loss": 0.8633, "step": 13784 }, { "epoch": 0.26, "learning_rate": 4.337500808889525e-06, "loss": 0.9879, "step": 13785 }, { "epoch": 0.26, "learning_rate": 4.337397220229074e-06, "loss": 1.0553, "step": 13786 }, { "epoch": 0.26, "learning_rate": 4.337293624707838e-06, "loss": 1.2258, "step": 13787 }, { "epoch": 0.26, "learning_rate": 4.337190022326203e-06, "loss": 0.9578, "step": 13788 }, { "epoch": 0.26, "learning_rate": 4.337086413084558e-06, "loss": 1.0133, "step": 13789 }, { "epoch": 0.26, "learning_rate": 4.3369827969832875e-06, "loss": 1.0009, "step": 13790 }, { "epoch": 0.26, "learning_rate": 4.33687917402278e-06, "loss": 0.7864, "step": 13791 }, { "epoch": 0.26, "learning_rate": 4.336775544203422e-06, "loss": 0.8445, "step": 13792 }, { "epoch": 0.26, "learning_rate": 4.3366719075256e-06, "loss": 0.9308, "step": 13793 }, { "epoch": 0.26, "learning_rate": 4.336568263989702e-06, "loss": 1.1966, "step": 13794 }, { "epoch": 0.26, "learning_rate": 4.336464613596114e-06, "loss": 1.057, "step": 13795 }, { "epoch": 0.26, "learning_rate": 4.336360956345224e-06, "loss": 0.9178, "step": 13796 }, { "epoch": 0.26, "learning_rate": 4.336257292237418e-06, "loss": 0.8359, "step": 13797 }, { "epoch": 0.26, "learning_rate": 4.3361536212730846e-06, "loss": 0.8366, "step": 13798 }, { "epoch": 0.26, "learning_rate": 4.336049943452608e-06, "loss": 1.1142, "step": 13799 }, { "epoch": 0.26, "learning_rate": 4.335946258776379e-06, "loss": 0.8631, "step": 13800 }, { "epoch": 0.26, "learning_rate": 4.335842567244782e-06, "loss": 1.0541, "step": 13801 }, { "epoch": 0.26, "learning_rate": 4.335738868858205e-06, "loss": 0.9717, "step": 13802 }, { "epoch": 0.26, "learning_rate": 4.335635163617036e-06, "loss": 0.9043, "step": 13803 }, { "epoch": 0.26, "learning_rate": 4.3355314515216614e-06, "loss": 0.907, "step": 13804 }, { "epoch": 0.26, "learning_rate": 4.335427732572468e-06, "loss": 0.9636, "step": 13805 }, { "epoch": 0.26, "learning_rate": 4.335324006769844e-06, "loss": 1.3369, "step": 13806 }, { "epoch": 0.26, "learning_rate": 4.335220274114177e-06, "loss": 0.9088, "step": 13807 }, { "epoch": 0.26, "learning_rate": 4.335116534605853e-06, "loss": 0.8146, "step": 13808 }, { "epoch": 0.26, "learning_rate": 4.335012788245261e-06, "loss": 1.2247, "step": 13809 }, { "epoch": 0.26, "learning_rate": 4.3349090350327874e-06, "loss": 0.8127, "step": 13810 }, { "epoch": 0.26, "learning_rate": 4.33480527496882e-06, "loss": 1.1346, "step": 13811 }, { "epoch": 0.26, "learning_rate": 4.334701508053744e-06, "loss": 0.9883, "step": 13812 }, { "epoch": 0.26, "learning_rate": 4.334597734287951e-06, "loss": 0.9081, "step": 13813 }, { "epoch": 0.26, "learning_rate": 4.334493953671825e-06, "loss": 0.9669, "step": 13814 }, { "epoch": 0.26, "learning_rate": 4.334390166205755e-06, "loss": 0.7039, "step": 13815 }, { "epoch": 0.26, "learning_rate": 4.33428637189013e-06, "loss": 0.9384, "step": 13816 }, { "epoch": 0.26, "learning_rate": 4.334182570725334e-06, "loss": 0.8074, "step": 13817 }, { "epoch": 0.26, "learning_rate": 4.334078762711757e-06, "loss": 1.0319, "step": 13818 }, { "epoch": 0.26, "learning_rate": 4.333974947849786e-06, "loss": 0.9118, "step": 13819 }, { "epoch": 0.26, "learning_rate": 4.333871126139809e-06, "loss": 0.9967, "step": 13820 }, { "epoch": 0.26, "learning_rate": 4.333767297582213e-06, "loss": 0.9581, "step": 13821 }, { "epoch": 0.26, "learning_rate": 4.333663462177388e-06, "loss": 0.9504, "step": 13822 }, { "epoch": 0.26, "learning_rate": 4.333559619925718e-06, "loss": 1.0743, "step": 13823 }, { "epoch": 0.26, "learning_rate": 4.333455770827592e-06, "loss": 0.9903, "step": 13824 }, { "epoch": 0.26, "learning_rate": 4.3333519148834e-06, "loss": 1.0779, "step": 13825 }, { "epoch": 0.26, "learning_rate": 4.333248052093527e-06, "loss": 0.8745, "step": 13826 }, { "epoch": 0.26, "learning_rate": 4.333144182458363e-06, "loss": 0.8754, "step": 13827 }, { "epoch": 0.26, "learning_rate": 4.333040305978295e-06, "loss": 1.2324, "step": 13828 }, { "epoch": 0.26, "learning_rate": 4.332936422653709e-06, "loss": 0.8294, "step": 13829 }, { "epoch": 0.26, "learning_rate": 4.332832532484996e-06, "loss": 0.9556, "step": 13830 }, { "epoch": 0.26, "learning_rate": 4.3327286354725426e-06, "loss": 1.0555, "step": 13831 }, { "epoch": 0.26, "learning_rate": 4.332624731616737e-06, "loss": 1.0466, "step": 13832 }, { "epoch": 0.26, "learning_rate": 4.332520820917966e-06, "loss": 0.7478, "step": 13833 }, { "epoch": 0.26, "learning_rate": 4.332416903376618e-06, "loss": 0.8415, "step": 13834 }, { "epoch": 0.26, "learning_rate": 4.332312978993082e-06, "loss": 0.7479, "step": 13835 }, { "epoch": 0.26, "learning_rate": 4.332209047767746e-06, "loss": 1.0392, "step": 13836 }, { "epoch": 0.26, "learning_rate": 4.332105109700997e-06, "loss": 0.9638, "step": 13837 }, { "epoch": 0.26, "learning_rate": 4.332001164793223e-06, "loss": 0.7698, "step": 13838 }, { "epoch": 0.26, "learning_rate": 4.331897213044815e-06, "loss": 0.9222, "step": 13839 }, { "epoch": 0.26, "learning_rate": 4.331793254456157e-06, "loss": 0.7993, "step": 13840 }, { "epoch": 0.26, "learning_rate": 4.3316892890276395e-06, "loss": 1.0004, "step": 13841 }, { "epoch": 0.26, "learning_rate": 4.331585316759651e-06, "loss": 0.9348, "step": 13842 }, { "epoch": 0.26, "learning_rate": 4.331481337652579e-06, "loss": 1.0458, "step": 13843 }, { "epoch": 0.26, "learning_rate": 4.331377351706811e-06, "loss": 1.1152, "step": 13844 }, { "epoch": 0.26, "learning_rate": 4.331273358922737e-06, "loss": 0.986, "step": 13845 }, { "epoch": 0.26, "learning_rate": 4.331169359300745e-06, "loss": 0.7633, "step": 13846 }, { "epoch": 0.26, "learning_rate": 4.33106535284122e-06, "loss": 0.9194, "step": 13847 }, { "epoch": 0.26, "learning_rate": 4.330961339544555e-06, "loss": 0.8573, "step": 13848 }, { "epoch": 0.26, "learning_rate": 4.330857319411137e-06, "loss": 1.0107, "step": 13849 }, { "epoch": 0.26, "learning_rate": 4.330753292441354e-06, "loss": 1.0757, "step": 13850 }, { "epoch": 0.26, "learning_rate": 4.3306492586355935e-06, "loss": 1.0034, "step": 13851 }, { "epoch": 0.26, "learning_rate": 4.330545217994245e-06, "loss": 0.7964, "step": 13852 }, { "epoch": 0.26, "learning_rate": 4.3304411705176965e-06, "loss": 0.9543, "step": 13853 }, { "epoch": 0.26, "learning_rate": 4.330337116206337e-06, "loss": 1.0582, "step": 13854 }, { "epoch": 0.26, "learning_rate": 4.330233055060555e-06, "loss": 0.85, "step": 13855 }, { "epoch": 0.26, "learning_rate": 4.330128987080739e-06, "loss": 1.0845, "step": 13856 }, { "epoch": 0.26, "learning_rate": 4.330024912267277e-06, "loss": 1.046, "step": 13857 }, { "epoch": 0.26, "learning_rate": 4.3299208306205586e-06, "loss": 1.0941, "step": 13858 }, { "epoch": 0.26, "learning_rate": 4.329816742140971e-06, "loss": 1.0638, "step": 13859 }, { "epoch": 0.26, "learning_rate": 4.329712646828905e-06, "loss": 0.7437, "step": 13860 }, { "epoch": 0.26, "learning_rate": 4.329608544684748e-06, "loss": 0.9264, "step": 13861 }, { "epoch": 0.26, "learning_rate": 4.329504435708888e-06, "loss": 1.0472, "step": 13862 }, { "epoch": 0.26, "learning_rate": 4.3294003199017144e-06, "loss": 1.0077, "step": 13863 }, { "epoch": 0.26, "learning_rate": 4.329296197263617e-06, "loss": 0.998, "step": 13864 }, { "epoch": 0.26, "learning_rate": 4.329192067794983e-06, "loss": 0.9386, "step": 13865 }, { "epoch": 0.26, "learning_rate": 4.329087931496202e-06, "loss": 0.7653, "step": 13866 }, { "epoch": 0.26, "learning_rate": 4.328983788367664e-06, "loss": 0.8234, "step": 13867 }, { "epoch": 0.26, "learning_rate": 4.328879638409755e-06, "loss": 1.0718, "step": 13868 }, { "epoch": 0.26, "learning_rate": 4.328775481622866e-06, "loss": 1.0224, "step": 13869 }, { "epoch": 0.26, "learning_rate": 4.328671318007385e-06, "loss": 0.985, "step": 13870 }, { "epoch": 0.26, "learning_rate": 4.328567147563703e-06, "loss": 1.0071, "step": 13871 }, { "epoch": 0.26, "learning_rate": 4.3284629702922055e-06, "loss": 0.8532, "step": 13872 }, { "epoch": 0.26, "learning_rate": 4.328358786193284e-06, "loss": 1.0216, "step": 13873 }, { "epoch": 0.26, "learning_rate": 4.328254595267326e-06, "loss": 1.0053, "step": 13874 }, { "epoch": 0.26, "learning_rate": 4.328150397514722e-06, "loss": 1.1714, "step": 13875 }, { "epoch": 0.26, "learning_rate": 4.328046192935861e-06, "loss": 0.9019, "step": 13876 }, { "epoch": 0.26, "learning_rate": 4.327941981531132e-06, "loss": 0.8896, "step": 13877 }, { "epoch": 0.26, "learning_rate": 4.327837763300923e-06, "loss": 0.9451, "step": 13878 }, { "epoch": 0.26, "learning_rate": 4.327733538245623e-06, "loss": 0.841, "step": 13879 }, { "epoch": 0.26, "learning_rate": 4.3276293063656235e-06, "loss": 0.973, "step": 13880 }, { "epoch": 0.26, "learning_rate": 4.327525067661311e-06, "loss": 1.028, "step": 13881 }, { "epoch": 0.26, "learning_rate": 4.327420822133076e-06, "loss": 1.064, "step": 13882 }, { "epoch": 0.26, "learning_rate": 4.327316569781309e-06, "loss": 0.9767, "step": 13883 }, { "epoch": 0.26, "learning_rate": 4.327212310606397e-06, "loss": 0.7549, "step": 13884 }, { "epoch": 0.26, "learning_rate": 4.32710804460873e-06, "loss": 0.7747, "step": 13885 }, { "epoch": 0.26, "learning_rate": 4.327003771788698e-06, "loss": 0.9406, "step": 13886 }, { "epoch": 0.26, "learning_rate": 4.32689949214669e-06, "loss": 1.0183, "step": 13887 }, { "epoch": 0.26, "learning_rate": 4.326795205683095e-06, "loss": 1.0891, "step": 13888 }, { "epoch": 0.26, "learning_rate": 4.3266909123983025e-06, "loss": 0.9623, "step": 13889 }, { "epoch": 0.26, "learning_rate": 4.326586612292703e-06, "loss": 0.8558, "step": 13890 }, { "epoch": 0.26, "learning_rate": 4.3264823053666845e-06, "loss": 0.874, "step": 13891 }, { "epoch": 0.26, "learning_rate": 4.326377991620637e-06, "loss": 0.952, "step": 13892 }, { "epoch": 0.26, "learning_rate": 4.32627367105495e-06, "loss": 1.3231, "step": 13893 }, { "epoch": 0.26, "learning_rate": 4.326169343670014e-06, "loss": 0.9623, "step": 13894 }, { "epoch": 0.26, "learning_rate": 4.326065009466217e-06, "loss": 0.881, "step": 13895 }, { "epoch": 0.26, "learning_rate": 4.325960668443949e-06, "loss": 1.0655, "step": 13896 }, { "epoch": 0.26, "learning_rate": 4.325856320603599e-06, "loss": 1.0129, "step": 13897 }, { "epoch": 0.26, "learning_rate": 4.325751965945559e-06, "loss": 0.7003, "step": 13898 }, { "epoch": 0.26, "learning_rate": 4.325647604470218e-06, "loss": 1.0579, "step": 13899 }, { "epoch": 0.26, "learning_rate": 4.3255432361779625e-06, "loss": 1.1392, "step": 13900 }, { "epoch": 0.26, "learning_rate": 4.325438861069185e-06, "loss": 1.0051, "step": 13901 }, { "epoch": 0.26, "learning_rate": 4.325334479144276e-06, "loss": 0.9975, "step": 13902 }, { "epoch": 0.26, "learning_rate": 4.325230090403624e-06, "loss": 0.9759, "step": 13903 }, { "epoch": 0.26, "learning_rate": 4.325125694847617e-06, "loss": 0.7267, "step": 13904 }, { "epoch": 0.26, "learning_rate": 4.325021292476649e-06, "loss": 1.0497, "step": 13905 }, { "epoch": 0.26, "learning_rate": 4.324916883291106e-06, "loss": 0.9777, "step": 13906 }, { "epoch": 0.26, "learning_rate": 4.3248124672913794e-06, "loss": 1.0078, "step": 13907 }, { "epoch": 0.26, "learning_rate": 4.324708044477859e-06, "loss": 0.6399, "step": 13908 }, { "epoch": 0.26, "learning_rate": 4.324603614850934e-06, "loss": 0.8958, "step": 13909 }, { "epoch": 0.26, "learning_rate": 4.3244991784109965e-06, "loss": 0.8756, "step": 13910 }, { "epoch": 0.26, "learning_rate": 4.324394735158435e-06, "loss": 0.8856, "step": 13911 }, { "epoch": 0.26, "learning_rate": 4.324290285093638e-06, "loss": 0.8765, "step": 13912 }, { "epoch": 0.26, "learning_rate": 4.324185828216999e-06, "loss": 0.915, "step": 13913 }, { "epoch": 0.26, "learning_rate": 4.324081364528904e-06, "loss": 0.986, "step": 13914 }, { "epoch": 0.26, "learning_rate": 4.323976894029747e-06, "loss": 0.8071, "step": 13915 }, { "epoch": 0.26, "learning_rate": 4.323872416719915e-06, "loss": 0.9716, "step": 13916 }, { "epoch": 0.26, "learning_rate": 4.323767932599799e-06, "loss": 0.8554, "step": 13917 }, { "epoch": 0.26, "learning_rate": 4.32366344166979e-06, "loss": 1.0267, "step": 13918 }, { "epoch": 0.26, "learning_rate": 4.323558943930278e-06, "loss": 1.0209, "step": 13919 }, { "epoch": 0.26, "learning_rate": 4.3234544393816525e-06, "loss": 0.7468, "step": 13920 }, { "epoch": 0.26, "learning_rate": 4.3233499280243035e-06, "loss": 1.022, "step": 13921 }, { "epoch": 0.26, "learning_rate": 4.323245409858623e-06, "loss": 0.8266, "step": 13922 }, { "epoch": 0.26, "learning_rate": 4.3231408848849985e-06, "loss": 0.76, "step": 13923 }, { "epoch": 0.26, "learning_rate": 4.323036353103823e-06, "loss": 1.0985, "step": 13924 }, { "epoch": 0.26, "learning_rate": 4.322931814515485e-06, "loss": 1.1885, "step": 13925 }, { "epoch": 0.26, "learning_rate": 4.322827269120376e-06, "loss": 0.9331, "step": 13926 }, { "epoch": 0.26, "learning_rate": 4.322722716918886e-06, "loss": 0.9536, "step": 13927 }, { "epoch": 0.26, "learning_rate": 4.3226181579114045e-06, "loss": 0.8796, "step": 13928 }, { "epoch": 0.26, "learning_rate": 4.322513592098323e-06, "loss": 0.918, "step": 13929 }, { "epoch": 0.26, "learning_rate": 4.3224090194800315e-06, "loss": 0.9708, "step": 13930 }, { "epoch": 0.26, "learning_rate": 4.322304440056922e-06, "loss": 1.1612, "step": 13931 }, { "epoch": 0.26, "learning_rate": 4.322199853829382e-06, "loss": 1.0243, "step": 13932 }, { "epoch": 0.26, "learning_rate": 4.322095260797804e-06, "loss": 0.9763, "step": 13933 }, { "epoch": 0.26, "learning_rate": 4.321990660962578e-06, "loss": 1.1606, "step": 13934 }, { "epoch": 0.26, "learning_rate": 4.321886054324095e-06, "loss": 0.9761, "step": 13935 }, { "epoch": 0.26, "learning_rate": 4.321781440882745e-06, "loss": 0.849, "step": 13936 }, { "epoch": 0.26, "learning_rate": 4.321676820638919e-06, "loss": 1.1897, "step": 13937 }, { "epoch": 0.26, "learning_rate": 4.321572193593008e-06, "loss": 1.0078, "step": 13938 }, { "epoch": 0.26, "learning_rate": 4.321467559745402e-06, "loss": 0.8353, "step": 13939 }, { "epoch": 0.26, "learning_rate": 4.321362919096492e-06, "loss": 0.9996, "step": 13940 }, { "epoch": 0.26, "learning_rate": 4.321258271646669e-06, "loss": 0.8234, "step": 13941 }, { "epoch": 0.26, "learning_rate": 4.321153617396323e-06, "loss": 0.8954, "step": 13942 }, { "epoch": 0.26, "learning_rate": 4.321048956345846e-06, "loss": 1.025, "step": 13943 }, { "epoch": 0.26, "learning_rate": 4.320944288495628e-06, "loss": 0.9287, "step": 13944 }, { "epoch": 0.26, "learning_rate": 4.320839613846059e-06, "loss": 0.8923, "step": 13945 }, { "epoch": 0.26, "learning_rate": 4.320734932397531e-06, "loss": 0.9697, "step": 13946 }, { "epoch": 0.26, "learning_rate": 4.320630244150435e-06, "loss": 1.0363, "step": 13947 }, { "epoch": 0.26, "learning_rate": 4.3205255491051615e-06, "loss": 0.8024, "step": 13948 }, { "epoch": 0.26, "learning_rate": 4.3204208472621e-06, "loss": 0.7822, "step": 13949 }, { "epoch": 0.26, "learning_rate": 4.320316138621645e-06, "loss": 1.0603, "step": 13950 }, { "epoch": 0.26, "learning_rate": 4.320211423184184e-06, "loss": 0.8972, "step": 13951 }, { "epoch": 0.26, "learning_rate": 4.32010670095011e-06, "loss": 0.9807, "step": 13952 }, { "epoch": 0.26, "learning_rate": 4.320001971919812e-06, "loss": 1.0823, "step": 13953 }, { "epoch": 0.26, "learning_rate": 4.319897236093684e-06, "loss": 0.9044, "step": 13954 }, { "epoch": 0.26, "learning_rate": 4.3197924934721145e-06, "loss": 1.0106, "step": 13955 }, { "epoch": 0.26, "learning_rate": 4.319687744055497e-06, "loss": 0.9753, "step": 13956 }, { "epoch": 0.26, "learning_rate": 4.31958298784422e-06, "loss": 1.0349, "step": 13957 }, { "epoch": 0.26, "learning_rate": 4.319478224838677e-06, "loss": 0.7776, "step": 13958 }, { "epoch": 0.26, "learning_rate": 4.319373455039256e-06, "loss": 1.0752, "step": 13959 }, { "epoch": 0.26, "learning_rate": 4.319268678446352e-06, "loss": 0.8597, "step": 13960 }, { "epoch": 0.26, "learning_rate": 4.3191638950603546e-06, "loss": 0.7242, "step": 13961 }, { "epoch": 0.26, "learning_rate": 4.319059104881654e-06, "loss": 1.0005, "step": 13962 }, { "epoch": 0.26, "learning_rate": 4.3189543079106434e-06, "loss": 0.961, "step": 13963 }, { "epoch": 0.26, "learning_rate": 4.318849504147713e-06, "loss": 0.9977, "step": 13964 }, { "epoch": 0.26, "learning_rate": 4.318744693593254e-06, "loss": 0.8449, "step": 13965 }, { "epoch": 0.26, "learning_rate": 4.318639876247659e-06, "loss": 0.9224, "step": 13966 }, { "epoch": 0.26, "learning_rate": 4.318535052111317e-06, "loss": 0.9174, "step": 13967 }, { "epoch": 0.26, "learning_rate": 4.318430221184622e-06, "loss": 0.9366, "step": 13968 }, { "epoch": 0.26, "learning_rate": 4.318325383467964e-06, "loss": 1.1122, "step": 13969 }, { "epoch": 0.26, "learning_rate": 4.318220538961735e-06, "loss": 0.8679, "step": 13970 }, { "epoch": 0.26, "learning_rate": 4.318115687666325e-06, "loss": 0.8134, "step": 13971 }, { "epoch": 0.26, "learning_rate": 4.318010829582129e-06, "loss": 0.7189, "step": 13972 }, { "epoch": 0.26, "learning_rate": 4.317905964709535e-06, "loss": 0.7725, "step": 13973 }, { "epoch": 0.26, "learning_rate": 4.317801093048936e-06, "loss": 0.9735, "step": 13974 }, { "epoch": 0.26, "learning_rate": 4.317696214600723e-06, "loss": 1.1859, "step": 13975 }, { "epoch": 0.26, "learning_rate": 4.317591329365288e-06, "loss": 0.8911, "step": 13976 }, { "epoch": 0.26, "learning_rate": 4.317486437343023e-06, "loss": 0.9902, "step": 13977 }, { "epoch": 0.26, "learning_rate": 4.3173815385343195e-06, "loss": 1.0652, "step": 13978 }, { "epoch": 0.26, "learning_rate": 4.317276632939569e-06, "loss": 0.8752, "step": 13979 }, { "epoch": 0.26, "learning_rate": 4.3171717205591636e-06, "loss": 0.8108, "step": 13980 }, { "epoch": 0.26, "learning_rate": 4.317066801393495e-06, "loss": 0.9469, "step": 13981 }, { "epoch": 0.26, "learning_rate": 4.3169618754429536e-06, "loss": 0.9257, "step": 13982 }, { "epoch": 0.26, "learning_rate": 4.316856942707932e-06, "loss": 0.976, "step": 13983 }, { "epoch": 0.26, "learning_rate": 4.3167520031888235e-06, "loss": 0.8058, "step": 13984 }, { "epoch": 0.26, "learning_rate": 4.316647056886018e-06, "loss": 0.7338, "step": 13985 }, { "epoch": 0.26, "learning_rate": 4.316542103799909e-06, "loss": 0.8468, "step": 13986 }, { "epoch": 0.26, "learning_rate": 4.316437143930886e-06, "loss": 1.0356, "step": 13987 }, { "epoch": 0.26, "learning_rate": 4.316332177279344e-06, "loss": 0.9791, "step": 13988 }, { "epoch": 0.26, "learning_rate": 4.316227203845672e-06, "loss": 0.7699, "step": 13989 }, { "epoch": 0.26, "learning_rate": 4.316122223630264e-06, "loss": 1.019, "step": 13990 }, { "epoch": 0.26, "learning_rate": 4.316017236633511e-06, "loss": 0.9214, "step": 13991 }, { "epoch": 0.26, "learning_rate": 4.315912242855806e-06, "loss": 0.8018, "step": 13992 }, { "epoch": 0.26, "learning_rate": 4.31580724229754e-06, "loss": 1.1679, "step": 13993 }, { "epoch": 0.26, "learning_rate": 4.315702234959105e-06, "loss": 1.1459, "step": 13994 }, { "epoch": 0.26, "learning_rate": 4.315597220840894e-06, "loss": 0.9842, "step": 13995 }, { "epoch": 0.26, "learning_rate": 4.315492199943299e-06, "loss": 0.9577, "step": 13996 }, { "epoch": 0.26, "learning_rate": 4.315387172266711e-06, "loss": 0.9724, "step": 13997 }, { "epoch": 0.26, "learning_rate": 4.315282137811523e-06, "loss": 0.8156, "step": 13998 }, { "epoch": 0.26, "learning_rate": 4.315177096578127e-06, "loss": 1.0341, "step": 13999 }, { "epoch": 0.26, "learning_rate": 4.315072048566916e-06, "loss": 1.135, "step": 14000 }, { "epoch": 0.26, "learning_rate": 4.314966993778281e-06, "loss": 0.7978, "step": 14001 }, { "epoch": 0.26, "learning_rate": 4.314861932212616e-06, "loss": 1.0862, "step": 14002 }, { "epoch": 0.26, "learning_rate": 4.314756863870311e-06, "loss": 1.027, "step": 14003 }, { "epoch": 0.26, "learning_rate": 4.31465178875176e-06, "loss": 0.7593, "step": 14004 }, { "epoch": 0.26, "learning_rate": 4.314546706857355e-06, "loss": 0.8555, "step": 14005 }, { "epoch": 0.26, "learning_rate": 4.314441618187488e-06, "loss": 1.0517, "step": 14006 }, { "epoch": 0.26, "learning_rate": 4.314336522742552e-06, "loss": 0.94, "step": 14007 }, { "epoch": 0.26, "learning_rate": 4.314231420522939e-06, "loss": 0.8038, "step": 14008 }, { "epoch": 0.26, "learning_rate": 4.314126311529041e-06, "loss": 1.1943, "step": 14009 }, { "epoch": 0.26, "learning_rate": 4.314021195761251e-06, "loss": 0.9218, "step": 14010 }, { "epoch": 0.26, "learning_rate": 4.313916073219961e-06, "loss": 0.9237, "step": 14011 }, { "epoch": 0.26, "learning_rate": 4.313810943905565e-06, "loss": 1.1003, "step": 14012 }, { "epoch": 0.26, "learning_rate": 4.313705807818454e-06, "loss": 0.8306, "step": 14013 }, { "epoch": 0.26, "learning_rate": 4.313600664959022e-06, "loss": 0.7289, "step": 14014 }, { "epoch": 0.26, "learning_rate": 4.31349551532766e-06, "loss": 1.0061, "step": 14015 }, { "epoch": 0.26, "learning_rate": 4.313390358924761e-06, "loss": 0.9985, "step": 14016 }, { "epoch": 0.26, "learning_rate": 4.313285195750718e-06, "loss": 0.9351, "step": 14017 }, { "epoch": 0.26, "learning_rate": 4.313180025805924e-06, "loss": 0.8556, "step": 14018 }, { "epoch": 0.26, "learning_rate": 4.313074849090772e-06, "loss": 1.1736, "step": 14019 }, { "epoch": 0.26, "learning_rate": 4.312969665605654e-06, "loss": 0.8037, "step": 14020 }, { "epoch": 0.26, "learning_rate": 4.312864475350962e-06, "loss": 0.8574, "step": 14021 }, { "epoch": 0.26, "learning_rate": 4.31275927832709e-06, "loss": 0.946, "step": 14022 }, { "epoch": 0.26, "learning_rate": 4.312654074534431e-06, "loss": 0.8918, "step": 14023 }, { "epoch": 0.26, "learning_rate": 4.312548863973376e-06, "loss": 0.9651, "step": 14024 }, { "epoch": 0.26, "learning_rate": 4.31244364664432e-06, "loss": 0.958, "step": 14025 }, { "epoch": 0.26, "learning_rate": 4.312338422547655e-06, "loss": 0.8378, "step": 14026 }, { "epoch": 0.26, "learning_rate": 4.312233191683774e-06, "loss": 1.0549, "step": 14027 }, { "epoch": 0.26, "learning_rate": 4.312127954053069e-06, "loss": 0.7718, "step": 14028 }, { "epoch": 0.26, "learning_rate": 4.312022709655935e-06, "loss": 0.877, "step": 14029 }, { "epoch": 0.26, "learning_rate": 4.311917458492763e-06, "loss": 1.0253, "step": 14030 }, { "epoch": 0.26, "learning_rate": 4.311812200563947e-06, "loss": 1.1107, "step": 14031 }, { "epoch": 0.26, "learning_rate": 4.311706935869879e-06, "loss": 1.0596, "step": 14032 }, { "epoch": 0.26, "learning_rate": 4.311601664410955e-06, "loss": 0.9538, "step": 14033 }, { "epoch": 0.26, "learning_rate": 4.311496386187564e-06, "loss": 0.8667, "step": 14034 }, { "epoch": 0.26, "learning_rate": 4.311391101200101e-06, "loss": 0.8866, "step": 14035 }, { "epoch": 0.26, "learning_rate": 4.31128580944896e-06, "loss": 0.8273, "step": 14036 }, { "epoch": 0.26, "learning_rate": 4.3111805109345324e-06, "loss": 1.0629, "step": 14037 }, { "epoch": 0.26, "learning_rate": 4.3110752056572136e-06, "loss": 1.0213, "step": 14038 }, { "epoch": 0.26, "learning_rate": 4.3109698936173945e-06, "loss": 0.8923, "step": 14039 }, { "epoch": 0.26, "learning_rate": 4.31086457481547e-06, "loss": 0.7998, "step": 14040 }, { "epoch": 0.26, "learning_rate": 4.310759249251832e-06, "loss": 0.9154, "step": 14041 }, { "epoch": 0.26, "learning_rate": 4.3106539169268745e-06, "loss": 0.8338, "step": 14042 }, { "epoch": 0.26, "learning_rate": 4.310548577840992e-06, "loss": 1.0522, "step": 14043 }, { "epoch": 0.26, "learning_rate": 4.310443231994575e-06, "loss": 1.0347, "step": 14044 }, { "epoch": 0.26, "learning_rate": 4.31033787938802e-06, "loss": 0.9595, "step": 14045 }, { "epoch": 0.27, "learning_rate": 4.310232520021718e-06, "loss": 0.8876, "step": 14046 }, { "epoch": 0.27, "learning_rate": 4.310127153896063e-06, "loss": 0.777, "step": 14047 }, { "epoch": 0.27, "learning_rate": 4.31002178101145e-06, "loss": 1.0406, "step": 14048 }, { "epoch": 0.27, "learning_rate": 4.309916401368269e-06, "loss": 1.1343, "step": 14049 }, { "epoch": 0.27, "learning_rate": 4.309811014966917e-06, "loss": 1.36, "step": 14050 }, { "epoch": 0.27, "learning_rate": 4.309705621807787e-06, "loss": 0.9911, "step": 14051 }, { "epoch": 0.27, "learning_rate": 4.30960022189127e-06, "loss": 0.941, "step": 14052 }, { "epoch": 0.27, "learning_rate": 4.3094948152177615e-06, "loss": 0.9076, "step": 14053 }, { "epoch": 0.27, "learning_rate": 4.309389401787656e-06, "loss": 0.9568, "step": 14054 }, { "epoch": 0.27, "learning_rate": 4.309283981601346e-06, "loss": 0.9153, "step": 14055 }, { "epoch": 0.27, "learning_rate": 4.309178554659224e-06, "loss": 1.1447, "step": 14056 }, { "epoch": 0.27, "learning_rate": 4.309073120961685e-06, "loss": 1.0538, "step": 14057 }, { "epoch": 0.27, "learning_rate": 4.308967680509122e-06, "loss": 0.8094, "step": 14058 }, { "epoch": 0.27, "learning_rate": 4.30886223330193e-06, "loss": 0.8116, "step": 14059 }, { "epoch": 0.27, "learning_rate": 4.3087567793405015e-06, "loss": 0.819, "step": 14060 }, { "epoch": 0.27, "learning_rate": 4.308651318625231e-06, "loss": 0.9618, "step": 14061 }, { "epoch": 0.27, "learning_rate": 4.308545851156511e-06, "loss": 1.1376, "step": 14062 }, { "epoch": 0.27, "learning_rate": 4.308440376934737e-06, "loss": 1.0173, "step": 14063 }, { "epoch": 0.27, "learning_rate": 4.308334895960302e-06, "loss": 0.9241, "step": 14064 }, { "epoch": 0.27, "learning_rate": 4.3082294082336e-06, "loss": 0.7995, "step": 14065 }, { "epoch": 0.27, "learning_rate": 4.308123913755026e-06, "loss": 1.0386, "step": 14066 }, { "epoch": 0.27, "learning_rate": 4.308018412524971e-06, "loss": 0.8203, "step": 14067 }, { "epoch": 0.27, "learning_rate": 4.307912904543831e-06, "loss": 0.913, "step": 14068 }, { "epoch": 0.27, "learning_rate": 4.307807389812e-06, "loss": 1.1351, "step": 14069 }, { "epoch": 0.27, "learning_rate": 4.307701868329871e-06, "loss": 0.8535, "step": 14070 }, { "epoch": 0.27, "learning_rate": 4.307596340097839e-06, "loss": 0.8097, "step": 14071 }, { "epoch": 0.27, "learning_rate": 4.307490805116299e-06, "loss": 0.931, "step": 14072 }, { "epoch": 0.27, "learning_rate": 4.3073852633856414e-06, "loss": 0.784, "step": 14073 }, { "epoch": 0.27, "learning_rate": 4.3072797149062636e-06, "loss": 1.1838, "step": 14074 }, { "epoch": 0.27, "learning_rate": 4.30717415967856e-06, "loss": 1.0006, "step": 14075 }, { "epoch": 0.27, "learning_rate": 4.307068597702922e-06, "loss": 0.8878, "step": 14076 }, { "epoch": 0.27, "learning_rate": 4.306963028979746e-06, "loss": 0.9122, "step": 14077 }, { "epoch": 0.27, "learning_rate": 4.306857453509425e-06, "loss": 0.7978, "step": 14078 }, { "epoch": 0.27, "learning_rate": 4.306751871292354e-06, "loss": 0.82, "step": 14079 }, { "epoch": 0.27, "learning_rate": 4.306646282328927e-06, "loss": 0.8782, "step": 14080 }, { "epoch": 0.27, "learning_rate": 4.3065406866195374e-06, "loss": 0.9476, "step": 14081 }, { "epoch": 0.27, "learning_rate": 4.306435084164581e-06, "loss": 1.032, "step": 14082 }, { "epoch": 0.27, "learning_rate": 4.306329474964451e-06, "loss": 1.0003, "step": 14083 }, { "epoch": 0.27, "learning_rate": 4.3062238590195425e-06, "loss": 0.8055, "step": 14084 }, { "epoch": 0.27, "learning_rate": 4.306118236330249e-06, "loss": 0.8947, "step": 14085 }, { "epoch": 0.27, "learning_rate": 4.306012606896966e-06, "loss": 0.9228, "step": 14086 }, { "epoch": 0.27, "learning_rate": 4.3059069707200875e-06, "loss": 1.2203, "step": 14087 }, { "epoch": 0.27, "learning_rate": 4.305801327800006e-06, "loss": 0.9695, "step": 14088 }, { "epoch": 0.27, "learning_rate": 4.305695678137119e-06, "loss": 0.82, "step": 14089 }, { "epoch": 0.27, "learning_rate": 4.30559002173182e-06, "loss": 0.9125, "step": 14090 }, { "epoch": 0.27, "learning_rate": 4.305484358584503e-06, "loss": 0.92, "step": 14091 }, { "epoch": 0.27, "learning_rate": 4.305378688695563e-06, "loss": 0.8867, "step": 14092 }, { "epoch": 0.27, "learning_rate": 4.3052730120653935e-06, "loss": 0.9862, "step": 14093 }, { "epoch": 0.27, "learning_rate": 4.305167328694391e-06, "loss": 1.0828, "step": 14094 }, { "epoch": 0.27, "learning_rate": 4.305061638582948e-06, "loss": 0.9311, "step": 14095 }, { "epoch": 0.27, "learning_rate": 4.30495594173146e-06, "loss": 0.8031, "step": 14096 }, { "epoch": 0.27, "learning_rate": 4.304850238140323e-06, "loss": 0.8637, "step": 14097 }, { "epoch": 0.27, "learning_rate": 4.304744527809929e-06, "loss": 0.9431, "step": 14098 }, { "epoch": 0.27, "learning_rate": 4.304638810740676e-06, "loss": 1.0825, "step": 14099 }, { "epoch": 0.27, "learning_rate": 4.304533086932957e-06, "loss": 1.1619, "step": 14100 }, { "epoch": 0.27, "learning_rate": 4.304427356387166e-06, "loss": 0.8828, "step": 14101 }, { "epoch": 0.27, "learning_rate": 4.304321619103698e-06, "loss": 0.9456, "step": 14102 }, { "epoch": 0.27, "learning_rate": 4.3042158750829486e-06, "loss": 0.9362, "step": 14103 }, { "epoch": 0.27, "learning_rate": 4.304110124325314e-06, "loss": 0.7919, "step": 14104 }, { "epoch": 0.27, "learning_rate": 4.3040043668311856e-06, "loss": 0.871, "step": 14105 }, { "epoch": 0.27, "learning_rate": 4.303898602600961e-06, "loss": 0.9149, "step": 14106 }, { "epoch": 0.27, "learning_rate": 4.303792831635034e-06, "loss": 0.7247, "step": 14107 }, { "epoch": 0.27, "learning_rate": 4.303687053933801e-06, "loss": 0.9066, "step": 14108 }, { "epoch": 0.27, "learning_rate": 4.303581269497655e-06, "loss": 0.8786, "step": 14109 }, { "epoch": 0.27, "learning_rate": 4.303475478326992e-06, "loss": 0.9939, "step": 14110 }, { "epoch": 0.27, "learning_rate": 4.303369680422206e-06, "loss": 0.6838, "step": 14111 }, { "epoch": 0.27, "learning_rate": 4.303263875783694e-06, "loss": 1.1074, "step": 14112 }, { "epoch": 0.27, "learning_rate": 4.3031580644118495e-06, "loss": 1.0927, "step": 14113 }, { "epoch": 0.27, "learning_rate": 4.303052246307068e-06, "loss": 0.9241, "step": 14114 }, { "epoch": 0.27, "learning_rate": 4.3029464214697455e-06, "loss": 0.944, "step": 14115 }, { "epoch": 0.27, "learning_rate": 4.302840589900275e-06, "loss": 0.8434, "step": 14116 }, { "epoch": 0.27, "learning_rate": 4.302734751599054e-06, "loss": 0.8333, "step": 14117 }, { "epoch": 0.27, "learning_rate": 4.302628906566476e-06, "loss": 1.1709, "step": 14118 }, { "epoch": 0.27, "learning_rate": 4.302523054802938e-06, "loss": 1.0133, "step": 14119 }, { "epoch": 0.27, "learning_rate": 4.302417196308833e-06, "loss": 0.8701, "step": 14120 }, { "epoch": 0.27, "learning_rate": 4.3023113310845585e-06, "loss": 0.9071, "step": 14121 }, { "epoch": 0.27, "learning_rate": 4.302205459130509e-06, "loss": 0.8289, "step": 14122 }, { "epoch": 0.27, "learning_rate": 4.302099580447078e-06, "loss": 0.79, "step": 14123 }, { "epoch": 0.27, "learning_rate": 4.301993695034663e-06, "loss": 0.9341, "step": 14124 }, { "epoch": 0.27, "learning_rate": 4.301887802893659e-06, "loss": 1.1536, "step": 14125 }, { "epoch": 0.27, "learning_rate": 4.301781904024461e-06, "loss": 0.9607, "step": 14126 }, { "epoch": 0.27, "learning_rate": 4.3016759984274656e-06, "loss": 0.9607, "step": 14127 }, { "epoch": 0.27, "learning_rate": 4.301570086103066e-06, "loss": 0.898, "step": 14128 }, { "epoch": 0.27, "learning_rate": 4.30146416705166e-06, "loss": 0.7353, "step": 14129 }, { "epoch": 0.27, "learning_rate": 4.301358241273641e-06, "loss": 0.9105, "step": 14130 }, { "epoch": 0.27, "learning_rate": 4.301252308769407e-06, "loss": 1.2449, "step": 14131 }, { "epoch": 0.27, "learning_rate": 4.301146369539351e-06, "loss": 0.7256, "step": 14132 }, { "epoch": 0.27, "learning_rate": 4.301040423583869e-06, "loss": 1.0142, "step": 14133 }, { "epoch": 0.27, "learning_rate": 4.300934470903359e-06, "loss": 0.9091, "step": 14134 }, { "epoch": 0.27, "learning_rate": 4.300828511498213e-06, "loss": 0.859, "step": 14135 }, { "epoch": 0.27, "learning_rate": 4.3007225453688304e-06, "loss": 0.9119, "step": 14136 }, { "epoch": 0.27, "learning_rate": 4.300616572515604e-06, "loss": 1.0503, "step": 14137 }, { "epoch": 0.27, "learning_rate": 4.30051059293893e-06, "loss": 1.0742, "step": 14138 }, { "epoch": 0.27, "learning_rate": 4.300404606639206e-06, "loss": 0.8145, "step": 14139 }, { "epoch": 0.27, "learning_rate": 4.3002986136168256e-06, "loss": 0.9915, "step": 14140 }, { "epoch": 0.27, "learning_rate": 4.300192613872185e-06, "loss": 0.7353, "step": 14141 }, { "epoch": 0.27, "learning_rate": 4.300086607405681e-06, "loss": 0.983, "step": 14142 }, { "epoch": 0.27, "learning_rate": 4.299980594217709e-06, "loss": 1.0468, "step": 14143 }, { "epoch": 0.27, "learning_rate": 4.299874574308664e-06, "loss": 0.9993, "step": 14144 }, { "epoch": 0.27, "learning_rate": 4.299768547678943e-06, "loss": 0.992, "step": 14145 }, { "epoch": 0.27, "learning_rate": 4.299662514328942e-06, "loss": 0.8752, "step": 14146 }, { "epoch": 0.27, "learning_rate": 4.2995564742590555e-06, "loss": 0.9535, "step": 14147 }, { "epoch": 0.27, "learning_rate": 4.2994504274696806e-06, "loss": 0.8709, "step": 14148 }, { "epoch": 0.27, "learning_rate": 4.2993443739612126e-06, "loss": 1.0852, "step": 14149 }, { "epoch": 0.27, "learning_rate": 4.299238313734048e-06, "loss": 0.9625, "step": 14150 }, { "epoch": 0.27, "learning_rate": 4.299132246788583e-06, "loss": 0.9846, "step": 14151 }, { "epoch": 0.27, "learning_rate": 4.299026173125213e-06, "loss": 0.7135, "step": 14152 }, { "epoch": 0.27, "learning_rate": 4.2989200927443345e-06, "loss": 0.7252, "step": 14153 }, { "epoch": 0.27, "learning_rate": 4.298814005646344e-06, "loss": 0.8163, "step": 14154 }, { "epoch": 0.27, "learning_rate": 4.298707911831637e-06, "loss": 1.0164, "step": 14155 }, { "epoch": 0.27, "learning_rate": 4.298601811300609e-06, "loss": 1.0806, "step": 14156 }, { "epoch": 0.27, "learning_rate": 4.298495704053658e-06, "loss": 1.0546, "step": 14157 }, { "epoch": 0.27, "learning_rate": 4.298389590091179e-06, "loss": 0.9192, "step": 14158 }, { "epoch": 0.27, "learning_rate": 4.298283469413568e-06, "loss": 0.9955, "step": 14159 }, { "epoch": 0.27, "learning_rate": 4.2981773420212215e-06, "loss": 1.0076, "step": 14160 }, { "epoch": 0.27, "learning_rate": 4.298071207914536e-06, "loss": 0.9806, "step": 14161 }, { "epoch": 0.27, "learning_rate": 4.297965067093909e-06, "loss": 1.0634, "step": 14162 }, { "epoch": 0.27, "learning_rate": 4.297858919559734e-06, "loss": 0.8757, "step": 14163 }, { "epoch": 0.27, "learning_rate": 4.29775276531241e-06, "loss": 0.6659, "step": 14164 }, { "epoch": 0.27, "learning_rate": 4.297646604352331e-06, "loss": 0.8928, "step": 14165 }, { "epoch": 0.27, "learning_rate": 4.297540436679895e-06, "loss": 0.8517, "step": 14166 }, { "epoch": 0.27, "learning_rate": 4.2974342622955e-06, "loss": 0.9396, "step": 14167 }, { "epoch": 0.27, "learning_rate": 4.297328081199538e-06, "loss": 1.2373, "step": 14168 }, { "epoch": 0.27, "learning_rate": 4.29722189339241e-06, "loss": 0.8664, "step": 14169 }, { "epoch": 0.27, "learning_rate": 4.29711569887451e-06, "loss": 0.827, "step": 14170 }, { "epoch": 0.27, "learning_rate": 4.297009497646234e-06, "loss": 0.8824, "step": 14171 }, { "epoch": 0.27, "learning_rate": 4.296903289707981e-06, "loss": 0.9277, "step": 14172 }, { "epoch": 0.27, "learning_rate": 4.296797075060146e-06, "loss": 0.8025, "step": 14173 }, { "epoch": 0.27, "learning_rate": 4.296690853703125e-06, "loss": 0.973, "step": 14174 }, { "epoch": 0.27, "learning_rate": 4.296584625637316e-06, "loss": 1.1422, "step": 14175 }, { "epoch": 0.27, "learning_rate": 4.296478390863116e-06, "loss": 0.9326, "step": 14176 }, { "epoch": 0.27, "learning_rate": 4.296372149380919e-06, "loss": 0.7999, "step": 14177 }, { "epoch": 0.27, "learning_rate": 4.296265901191124e-06, "loss": 0.8062, "step": 14178 }, { "epoch": 0.27, "learning_rate": 4.296159646294128e-06, "loss": 0.9715, "step": 14179 }, { "epoch": 0.27, "learning_rate": 4.2960533846903265e-06, "loss": 1.0675, "step": 14180 }, { "epoch": 0.27, "learning_rate": 4.295947116380116e-06, "loss": 0.9489, "step": 14181 }, { "epoch": 0.27, "learning_rate": 4.295840841363895e-06, "loss": 0.9154, "step": 14182 }, { "epoch": 0.27, "learning_rate": 4.295734559642059e-06, "loss": 0.8064, "step": 14183 }, { "epoch": 0.27, "learning_rate": 4.2956282712150055e-06, "loss": 0.9425, "step": 14184 }, { "epoch": 0.27, "learning_rate": 4.295521976083131e-06, "loss": 0.9171, "step": 14185 }, { "epoch": 0.27, "learning_rate": 4.2954156742468325e-06, "loss": 1.0014, "step": 14186 }, { "epoch": 0.27, "learning_rate": 4.295309365706506e-06, "loss": 0.9718, "step": 14187 }, { "epoch": 0.27, "learning_rate": 4.295203050462551e-06, "loss": 0.9684, "step": 14188 }, { "epoch": 0.27, "learning_rate": 4.2950967285153625e-06, "loss": 0.7875, "step": 14189 }, { "epoch": 0.27, "learning_rate": 4.2949903998653364e-06, "loss": 0.8437, "step": 14190 }, { "epoch": 0.27, "learning_rate": 4.2948840645128725e-06, "loss": 1.1003, "step": 14191 }, { "epoch": 0.27, "learning_rate": 4.294777722458366e-06, "loss": 1.0062, "step": 14192 }, { "epoch": 0.27, "learning_rate": 4.294671373702215e-06, "loss": 0.9449, "step": 14193 }, { "epoch": 0.27, "learning_rate": 4.294565018244816e-06, "loss": 1.0118, "step": 14194 }, { "epoch": 0.27, "learning_rate": 4.294458656086565e-06, "loss": 0.9226, "step": 14195 }, { "epoch": 0.27, "learning_rate": 4.294352287227862e-06, "loss": 0.923, "step": 14196 }, { "epoch": 0.27, "learning_rate": 4.294245911669102e-06, "loss": 0.8682, "step": 14197 }, { "epoch": 0.27, "learning_rate": 4.294139529410684e-06, "loss": 0.804, "step": 14198 }, { "epoch": 0.27, "learning_rate": 4.294033140453002e-06, "loss": 1.0738, "step": 14199 }, { "epoch": 0.27, "learning_rate": 4.293926744796456e-06, "loss": 1.1135, "step": 14200 }, { "epoch": 0.27, "learning_rate": 4.293820342441443e-06, "loss": 1.0982, "step": 14201 }, { "epoch": 0.27, "learning_rate": 4.293713933388359e-06, "loss": 0.8942, "step": 14202 }, { "epoch": 0.27, "learning_rate": 4.293607517637602e-06, "loss": 0.9849, "step": 14203 }, { "epoch": 0.27, "learning_rate": 4.293501095189571e-06, "loss": 0.9614, "step": 14204 }, { "epoch": 0.27, "learning_rate": 4.293394666044661e-06, "loss": 1.136, "step": 14205 }, { "epoch": 0.27, "learning_rate": 4.29328823020327e-06, "loss": 0.9551, "step": 14206 }, { "epoch": 0.27, "learning_rate": 4.293181787665797e-06, "loss": 0.9937, "step": 14207 }, { "epoch": 0.27, "learning_rate": 4.293075338432636e-06, "loss": 0.886, "step": 14208 }, { "epoch": 0.27, "learning_rate": 4.2929688825041885e-06, "loss": 0.8911, "step": 14209 }, { "epoch": 0.27, "learning_rate": 4.29286241988085e-06, "loss": 0.8099, "step": 14210 }, { "epoch": 0.27, "learning_rate": 4.292755950563018e-06, "loss": 0.9425, "step": 14211 }, { "epoch": 0.27, "learning_rate": 4.29264947455109e-06, "loss": 1.0624, "step": 14212 }, { "epoch": 0.27, "learning_rate": 4.292542991845463e-06, "loss": 0.9644, "step": 14213 }, { "epoch": 0.27, "learning_rate": 4.2924365024465365e-06, "loss": 0.8891, "step": 14214 }, { "epoch": 0.27, "learning_rate": 4.292330006354707e-06, "loss": 1.0422, "step": 14215 }, { "epoch": 0.27, "learning_rate": 4.292223503570372e-06, "loss": 0.9512, "step": 14216 }, { "epoch": 0.27, "learning_rate": 4.29211699409393e-06, "loss": 0.9853, "step": 14217 }, { "epoch": 0.27, "learning_rate": 4.292010477925777e-06, "loss": 0.9954, "step": 14218 }, { "epoch": 0.27, "learning_rate": 4.291903955066313e-06, "loss": 1.1904, "step": 14219 }, { "epoch": 0.27, "learning_rate": 4.291797425515933e-06, "loss": 0.7244, "step": 14220 }, { "epoch": 0.27, "learning_rate": 4.291690889275038e-06, "loss": 0.7767, "step": 14221 }, { "epoch": 0.27, "learning_rate": 4.291584346344024e-06, "loss": 0.9451, "step": 14222 }, { "epoch": 0.27, "learning_rate": 4.291477796723288e-06, "loss": 0.9332, "step": 14223 }, { "epoch": 0.27, "learning_rate": 4.291371240413229e-06, "loss": 0.8973, "step": 14224 }, { "epoch": 0.27, "learning_rate": 4.291264677414245e-06, "loss": 1.1554, "step": 14225 }, { "epoch": 0.27, "learning_rate": 4.291158107726734e-06, "loss": 0.886, "step": 14226 }, { "epoch": 0.27, "learning_rate": 4.2910515313510925e-06, "loss": 0.8631, "step": 14227 }, { "epoch": 0.27, "learning_rate": 4.29094494828772e-06, "loss": 1.0281, "step": 14228 }, { "epoch": 0.27, "learning_rate": 4.290838358537015e-06, "loss": 0.7931, "step": 14229 }, { "epoch": 0.27, "learning_rate": 4.290731762099372e-06, "loss": 0.945, "step": 14230 }, { "epoch": 0.27, "learning_rate": 4.290625158975194e-06, "loss": 1.1579, "step": 14231 }, { "epoch": 0.27, "learning_rate": 4.290518549164876e-06, "loss": 0.8934, "step": 14232 }, { "epoch": 0.27, "learning_rate": 4.2904119326688165e-06, "loss": 0.9216, "step": 14233 }, { "epoch": 0.27, "learning_rate": 4.290305309487413e-06, "loss": 1.1003, "step": 14234 }, { "epoch": 0.27, "learning_rate": 4.290198679621065e-06, "loss": 0.9019, "step": 14235 }, { "epoch": 0.27, "learning_rate": 4.29009204307017e-06, "loss": 1.0178, "step": 14236 }, { "epoch": 0.27, "learning_rate": 4.289985399835126e-06, "loss": 1.1586, "step": 14237 }, { "epoch": 0.27, "learning_rate": 4.289878749916331e-06, "loss": 1.0486, "step": 14238 }, { "epoch": 0.27, "learning_rate": 4.289772093314184e-06, "loss": 0.7238, "step": 14239 }, { "epoch": 0.27, "learning_rate": 4.289665430029084e-06, "loss": 0.8649, "step": 14240 }, { "epoch": 0.27, "learning_rate": 4.289558760061427e-06, "loss": 1.092, "step": 14241 }, { "epoch": 0.27, "learning_rate": 4.289452083411612e-06, "loss": 0.7551, "step": 14242 }, { "epoch": 0.27, "learning_rate": 4.289345400080039e-06, "loss": 0.9479, "step": 14243 }, { "epoch": 0.27, "learning_rate": 4.289238710067104e-06, "loss": 0.9402, "step": 14244 }, { "epoch": 0.27, "learning_rate": 4.289132013373207e-06, "loss": 0.9245, "step": 14245 }, { "epoch": 0.27, "learning_rate": 4.289025309998747e-06, "loss": 0.9426, "step": 14246 }, { "epoch": 0.27, "learning_rate": 4.28891859994412e-06, "loss": 0.8691, "step": 14247 }, { "epoch": 0.27, "learning_rate": 4.288811883209726e-06, "loss": 0.8658, "step": 14248 }, { "epoch": 0.27, "learning_rate": 4.2887051597959635e-06, "loss": 0.9109, "step": 14249 }, { "epoch": 0.27, "learning_rate": 4.2885984297032305e-06, "loss": 1.0212, "step": 14250 }, { "epoch": 0.27, "learning_rate": 4.2884916929319264e-06, "loss": 0.9513, "step": 14251 }, { "epoch": 0.27, "learning_rate": 4.288384949482448e-06, "loss": 0.9521, "step": 14252 }, { "epoch": 0.27, "learning_rate": 4.288278199355196e-06, "loss": 0.7971, "step": 14253 }, { "epoch": 0.27, "learning_rate": 4.288171442550568e-06, "loss": 0.843, "step": 14254 }, { "epoch": 0.27, "learning_rate": 4.288064679068962e-06, "loss": 1.0549, "step": 14255 }, { "epoch": 0.27, "learning_rate": 4.287957908910778e-06, "loss": 0.8191, "step": 14256 }, { "epoch": 0.27, "learning_rate": 4.287851132076414e-06, "loss": 1.1558, "step": 14257 }, { "epoch": 0.27, "learning_rate": 4.287744348566269e-06, "loss": 0.9207, "step": 14258 }, { "epoch": 0.27, "learning_rate": 4.287637558380741e-06, "loss": 0.9842, "step": 14259 }, { "epoch": 0.27, "learning_rate": 4.287530761520228e-06, "loss": 0.9368, "step": 14260 }, { "epoch": 0.27, "learning_rate": 4.287423957985131e-06, "loss": 0.8652, "step": 14261 }, { "epoch": 0.27, "learning_rate": 4.287317147775848e-06, "loss": 1.0863, "step": 14262 }, { "epoch": 0.27, "learning_rate": 4.287210330892777e-06, "loss": 1.1378, "step": 14263 }, { "epoch": 0.27, "learning_rate": 4.287103507336318e-06, "loss": 0.9207, "step": 14264 }, { "epoch": 0.27, "learning_rate": 4.28699667710687e-06, "loss": 0.9819, "step": 14265 }, { "epoch": 0.27, "learning_rate": 4.2868898402048295e-06, "loss": 0.9882, "step": 14266 }, { "epoch": 0.27, "learning_rate": 4.286782996630597e-06, "loss": 0.8777, "step": 14267 }, { "epoch": 0.27, "learning_rate": 4.286676146384573e-06, "loss": 0.9756, "step": 14268 }, { "epoch": 0.27, "learning_rate": 4.286569289467154e-06, "loss": 0.8376, "step": 14269 }, { "epoch": 0.27, "learning_rate": 4.2864624258787415e-06, "loss": 0.941, "step": 14270 }, { "epoch": 0.27, "learning_rate": 4.286355555619732e-06, "loss": 0.7512, "step": 14271 }, { "epoch": 0.27, "learning_rate": 4.286248678690525e-06, "loss": 0.9212, "step": 14272 }, { "epoch": 0.27, "learning_rate": 4.286141795091521e-06, "loss": 0.9374, "step": 14273 }, { "epoch": 0.27, "learning_rate": 4.286034904823118e-06, "loss": 1.0642, "step": 14274 }, { "epoch": 0.27, "learning_rate": 4.285928007885716e-06, "loss": 1.0081, "step": 14275 }, { "epoch": 0.27, "learning_rate": 4.285821104279713e-06, "loss": 1.0552, "step": 14276 }, { "epoch": 0.27, "learning_rate": 4.285714194005509e-06, "loss": 0.8337, "step": 14277 }, { "epoch": 0.27, "learning_rate": 4.285607277063503e-06, "loss": 0.9968, "step": 14278 }, { "epoch": 0.27, "learning_rate": 4.285500353454094e-06, "loss": 0.9956, "step": 14279 }, { "epoch": 0.27, "learning_rate": 4.285393423177681e-06, "loss": 0.9483, "step": 14280 }, { "epoch": 0.27, "learning_rate": 4.285286486234665e-06, "loss": 0.9188, "step": 14281 }, { "epoch": 0.27, "learning_rate": 4.285179542625443e-06, "loss": 1.1216, "step": 14282 }, { "epoch": 0.27, "learning_rate": 4.285072592350415e-06, "loss": 0.9716, "step": 14283 }, { "epoch": 0.27, "learning_rate": 4.284965635409982e-06, "loss": 0.7675, "step": 14284 }, { "epoch": 0.27, "learning_rate": 4.2848586718045415e-06, "loss": 0.8084, "step": 14285 }, { "epoch": 0.27, "learning_rate": 4.284751701534493e-06, "loss": 0.8849, "step": 14286 }, { "epoch": 0.27, "learning_rate": 4.284644724600237e-06, "loss": 1.2704, "step": 14287 }, { "epoch": 0.27, "learning_rate": 4.284537741002172e-06, "loss": 1.0191, "step": 14288 }, { "epoch": 0.27, "learning_rate": 4.284430750740696e-06, "loss": 0.9373, "step": 14289 }, { "epoch": 0.27, "learning_rate": 4.284323753816213e-06, "loss": 0.8138, "step": 14290 }, { "epoch": 0.27, "learning_rate": 4.284216750229119e-06, "loss": 1.0043, "step": 14291 }, { "epoch": 0.27, "learning_rate": 4.284109739979814e-06, "loss": 0.7351, "step": 14292 }, { "epoch": 0.27, "learning_rate": 4.2840027230686976e-06, "loss": 1.0009, "step": 14293 }, { "epoch": 0.27, "learning_rate": 4.28389569949617e-06, "loss": 1.1844, "step": 14294 }, { "epoch": 0.27, "learning_rate": 4.283788669262632e-06, "loss": 1.0022, "step": 14295 }, { "epoch": 0.27, "learning_rate": 4.28368163236848e-06, "loss": 0.7852, "step": 14296 }, { "epoch": 0.27, "learning_rate": 4.283574588814115e-06, "loss": 0.9728, "step": 14297 }, { "epoch": 0.27, "learning_rate": 4.283467538599939e-06, "loss": 0.8925, "step": 14298 }, { "epoch": 0.27, "learning_rate": 4.28336048172635e-06, "loss": 1.0322, "step": 14299 }, { "epoch": 0.27, "learning_rate": 4.283253418193746e-06, "loss": 1.1502, "step": 14300 }, { "epoch": 0.27, "learning_rate": 4.283146348002529e-06, "loss": 0.9996, "step": 14301 }, { "epoch": 0.27, "learning_rate": 4.283039271153099e-06, "loss": 1.1017, "step": 14302 }, { "epoch": 0.27, "learning_rate": 4.282932187645854e-06, "loss": 1.017, "step": 14303 }, { "epoch": 0.27, "learning_rate": 4.282825097481195e-06, "loss": 0.9487, "step": 14304 }, { "epoch": 0.27, "learning_rate": 4.2827180006595225e-06, "loss": 1.0928, "step": 14305 }, { "epoch": 0.27, "learning_rate": 4.282610897181235e-06, "loss": 1.0605, "step": 14306 }, { "epoch": 0.27, "learning_rate": 4.282503787046733e-06, "loss": 0.9706, "step": 14307 }, { "epoch": 0.27, "learning_rate": 4.282396670256417e-06, "loss": 0.8518, "step": 14308 }, { "epoch": 0.27, "learning_rate": 4.282289546810686e-06, "loss": 0.9694, "step": 14309 }, { "epoch": 0.27, "learning_rate": 4.28218241670994e-06, "loss": 0.946, "step": 14310 }, { "epoch": 0.27, "learning_rate": 4.2820752799545806e-06, "loss": 1.0175, "step": 14311 }, { "epoch": 0.27, "learning_rate": 4.281968136545007e-06, "loss": 1.0637, "step": 14312 }, { "epoch": 0.27, "learning_rate": 4.281860986481618e-06, "loss": 0.9843, "step": 14313 }, { "epoch": 0.27, "learning_rate": 4.281753829764815e-06, "loss": 0.8699, "step": 14314 }, { "epoch": 0.27, "learning_rate": 4.281646666394998e-06, "loss": 0.8467, "step": 14315 }, { "epoch": 0.27, "learning_rate": 4.281539496372566e-06, "loss": 0.8818, "step": 14316 }, { "epoch": 0.27, "learning_rate": 4.2814323196979215e-06, "loss": 0.9109, "step": 14317 }, { "epoch": 0.27, "learning_rate": 4.2813251363714634e-06, "loss": 1.0363, "step": 14318 }, { "epoch": 0.27, "learning_rate": 4.281217946393591e-06, "loss": 1.1909, "step": 14319 }, { "epoch": 0.27, "learning_rate": 4.281110749764706e-06, "loss": 0.9781, "step": 14320 }, { "epoch": 0.27, "learning_rate": 4.281003546485208e-06, "loss": 1.0652, "step": 14321 }, { "epoch": 0.27, "learning_rate": 4.280896336555497e-06, "loss": 0.8673, "step": 14322 }, { "epoch": 0.27, "learning_rate": 4.280789119975973e-06, "loss": 0.7772, "step": 14323 }, { "epoch": 0.27, "learning_rate": 4.280681896747039e-06, "loss": 1.0182, "step": 14324 }, { "epoch": 0.27, "learning_rate": 4.280574666869092e-06, "loss": 1.2074, "step": 14325 }, { "epoch": 0.27, "learning_rate": 4.280467430342534e-06, "loss": 0.9009, "step": 14326 }, { "epoch": 0.27, "learning_rate": 4.2803601871677644e-06, "loss": 0.8339, "step": 14327 }, { "epoch": 0.27, "learning_rate": 4.280252937345186e-06, "loss": 0.9156, "step": 14328 }, { "epoch": 0.27, "learning_rate": 4.280145680875196e-06, "loss": 0.9609, "step": 14329 }, { "epoch": 0.27, "learning_rate": 4.280038417758198e-06, "loss": 0.8885, "step": 14330 }, { "epoch": 0.27, "learning_rate": 4.279931147994591e-06, "loss": 1.1589, "step": 14331 }, { "epoch": 0.27, "learning_rate": 4.279823871584775e-06, "loss": 1.0524, "step": 14332 }, { "epoch": 0.27, "learning_rate": 4.279716588529152e-06, "loss": 0.8191, "step": 14333 }, { "epoch": 0.27, "learning_rate": 4.279609298828121e-06, "loss": 0.8044, "step": 14334 }, { "epoch": 0.27, "learning_rate": 4.279502002482084e-06, "loss": 0.8599, "step": 14335 }, { "epoch": 0.27, "learning_rate": 4.279394699491441e-06, "loss": 0.8273, "step": 14336 }, { "epoch": 0.27, "learning_rate": 4.279287389856593e-06, "loss": 1.0107, "step": 14337 }, { "epoch": 0.27, "learning_rate": 4.27918007357794e-06, "loss": 0.9815, "step": 14338 }, { "epoch": 0.27, "learning_rate": 4.279072750655884e-06, "loss": 0.8318, "step": 14339 }, { "epoch": 0.27, "learning_rate": 4.278965421090824e-06, "loss": 0.8386, "step": 14340 }, { "epoch": 0.27, "learning_rate": 4.278858084883162e-06, "loss": 0.9417, "step": 14341 }, { "epoch": 0.27, "learning_rate": 4.278750742033298e-06, "loss": 0.8486, "step": 14342 }, { "epoch": 0.27, "learning_rate": 4.278643392541633e-06, "loss": 1.0038, "step": 14343 }, { "epoch": 0.27, "learning_rate": 4.278536036408569e-06, "loss": 1.062, "step": 14344 }, { "epoch": 0.27, "learning_rate": 4.278428673634506e-06, "loss": 0.8393, "step": 14345 }, { "epoch": 0.27, "learning_rate": 4.278321304219844e-06, "loss": 1.2432, "step": 14346 }, { "epoch": 0.27, "learning_rate": 4.278213928164986e-06, "loss": 0.7607, "step": 14347 }, { "epoch": 0.27, "learning_rate": 4.27810654547033e-06, "loss": 0.664, "step": 14348 }, { "epoch": 0.27, "learning_rate": 4.277999156136281e-06, "loss": 1.0084, "step": 14349 }, { "epoch": 0.27, "learning_rate": 4.277891760163237e-06, "loss": 1.2361, "step": 14350 }, { "epoch": 0.27, "learning_rate": 4.277784357551598e-06, "loss": 0.8842, "step": 14351 }, { "epoch": 0.27, "learning_rate": 4.277676948301768e-06, "loss": 0.8614, "step": 14352 }, { "epoch": 0.27, "learning_rate": 4.277569532414146e-06, "loss": 0.9819, "step": 14353 }, { "epoch": 0.27, "learning_rate": 4.277462109889135e-06, "loss": 0.7334, "step": 14354 }, { "epoch": 0.27, "learning_rate": 4.277354680727135e-06, "loss": 1.0704, "step": 14355 }, { "epoch": 0.27, "learning_rate": 4.2772472449285465e-06, "loss": 1.0637, "step": 14356 }, { "epoch": 0.27, "learning_rate": 4.2771398024937705e-06, "loss": 1.0542, "step": 14357 }, { "epoch": 0.27, "learning_rate": 4.27703235342321e-06, "loss": 0.9119, "step": 14358 }, { "epoch": 0.27, "learning_rate": 4.2769248977172655e-06, "loss": 0.9234, "step": 14359 }, { "epoch": 0.27, "learning_rate": 4.276817435376337e-06, "loss": 1.0124, "step": 14360 }, { "epoch": 0.27, "learning_rate": 4.276709966400827e-06, "loss": 0.8591, "step": 14361 }, { "epoch": 0.27, "learning_rate": 4.276602490791137e-06, "loss": 1.2091, "step": 14362 }, { "epoch": 0.27, "learning_rate": 4.276495008547666e-06, "loss": 0.7949, "step": 14363 }, { "epoch": 0.27, "learning_rate": 4.276387519670819e-06, "loss": 0.8176, "step": 14364 }, { "epoch": 0.27, "learning_rate": 4.276280024160995e-06, "loss": 0.8512, "step": 14365 }, { "epoch": 0.27, "learning_rate": 4.276172522018596e-06, "loss": 1.0203, "step": 14366 }, { "epoch": 0.27, "learning_rate": 4.276065013244022e-06, "loss": 1.1268, "step": 14367 }, { "epoch": 0.27, "learning_rate": 4.275957497837677e-06, "loss": 1.1231, "step": 14368 }, { "epoch": 0.27, "learning_rate": 4.27584997579996e-06, "loss": 0.9993, "step": 14369 }, { "epoch": 0.27, "learning_rate": 4.275742447131276e-06, "loss": 1.1239, "step": 14370 }, { "epoch": 0.27, "learning_rate": 4.275634911832022e-06, "loss": 0.8846, "step": 14371 }, { "epoch": 0.27, "learning_rate": 4.275527369902602e-06, "loss": 0.9835, "step": 14372 }, { "epoch": 0.27, "learning_rate": 4.275419821343417e-06, "loss": 0.9282, "step": 14373 }, { "epoch": 0.27, "learning_rate": 4.27531226615487e-06, "loss": 0.9722, "step": 14374 }, { "epoch": 0.27, "learning_rate": 4.275204704337362e-06, "loss": 0.8212, "step": 14375 }, { "epoch": 0.27, "learning_rate": 4.2750971358912915e-06, "loss": 0.934, "step": 14376 }, { "epoch": 0.27, "learning_rate": 4.274989560817064e-06, "loss": 0.7603, "step": 14377 }, { "epoch": 0.27, "learning_rate": 4.27488197911508e-06, "loss": 0.903, "step": 14378 }, { "epoch": 0.27, "learning_rate": 4.2747743907857406e-06, "loss": 0.8258, "step": 14379 }, { "epoch": 0.27, "learning_rate": 4.274666795829449e-06, "loss": 1.0396, "step": 14380 }, { "epoch": 0.27, "learning_rate": 4.274559194246606e-06, "loss": 1.0741, "step": 14381 }, { "epoch": 0.27, "learning_rate": 4.274451586037612e-06, "loss": 0.9749, "step": 14382 }, { "epoch": 0.27, "learning_rate": 4.274343971202871e-06, "loss": 0.8829, "step": 14383 }, { "epoch": 0.27, "learning_rate": 4.2742363497427845e-06, "loss": 0.8143, "step": 14384 }, { "epoch": 0.27, "learning_rate": 4.274128721657753e-06, "loss": 0.9011, "step": 14385 }, { "epoch": 0.27, "learning_rate": 4.27402108694818e-06, "loss": 1.0347, "step": 14386 }, { "epoch": 0.27, "learning_rate": 4.273913445614467e-06, "loss": 1.0406, "step": 14387 }, { "epoch": 0.27, "learning_rate": 4.273805797657015e-06, "loss": 0.8399, "step": 14388 }, { "epoch": 0.27, "learning_rate": 4.273698143076226e-06, "loss": 1.1246, "step": 14389 }, { "epoch": 0.27, "learning_rate": 4.273590481872503e-06, "loss": 0.9109, "step": 14390 }, { "epoch": 0.27, "learning_rate": 4.273482814046247e-06, "loss": 1.1033, "step": 14391 }, { "epoch": 0.27, "learning_rate": 4.2733751395978614e-06, "loss": 1.0487, "step": 14392 }, { "epoch": 0.27, "learning_rate": 4.273267458527747e-06, "loss": 0.9404, "step": 14393 }, { "epoch": 0.27, "learning_rate": 4.273159770836306e-06, "loss": 0.8816, "step": 14394 }, { "epoch": 0.27, "learning_rate": 4.2730520765239416e-06, "loss": 1.0515, "step": 14395 }, { "epoch": 0.27, "learning_rate": 4.272944375591055e-06, "loss": 0.9057, "step": 14396 }, { "epoch": 0.27, "learning_rate": 4.2728366680380475e-06, "loss": 0.5542, "step": 14397 }, { "epoch": 0.27, "learning_rate": 4.272728953865323e-06, "loss": 0.8894, "step": 14398 }, { "epoch": 0.27, "learning_rate": 4.272621233073283e-06, "loss": 1.0806, "step": 14399 }, { "epoch": 0.27, "learning_rate": 4.272513505662329e-06, "loss": 1.2352, "step": 14400 }, { "epoch": 0.27, "learning_rate": 4.272405771632864e-06, "loss": 1.0655, "step": 14401 }, { "epoch": 0.27, "learning_rate": 4.272298030985291e-06, "loss": 0.8831, "step": 14402 }, { "epoch": 0.27, "learning_rate": 4.272190283720011e-06, "loss": 0.8793, "step": 14403 }, { "epoch": 0.27, "learning_rate": 4.2720825298374265e-06, "loss": 0.8041, "step": 14404 }, { "epoch": 0.27, "learning_rate": 4.271974769337941e-06, "loss": 1.0605, "step": 14405 }, { "epoch": 0.27, "learning_rate": 4.271867002221956e-06, "loss": 1.2061, "step": 14406 }, { "epoch": 0.27, "learning_rate": 4.271759228489873e-06, "loss": 1.1714, "step": 14407 }, { "epoch": 0.27, "learning_rate": 4.271651448142096e-06, "loss": 0.9059, "step": 14408 }, { "epoch": 0.27, "learning_rate": 4.271543661179026e-06, "loss": 0.8224, "step": 14409 }, { "epoch": 0.27, "learning_rate": 4.271435867601067e-06, "loss": 0.7249, "step": 14410 }, { "epoch": 0.27, "learning_rate": 4.271328067408621e-06, "loss": 0.8167, "step": 14411 }, { "epoch": 0.27, "learning_rate": 4.271220260602091e-06, "loss": 1.0453, "step": 14412 }, { "epoch": 0.27, "learning_rate": 4.271112447181877e-06, "loss": 1.0527, "step": 14413 }, { "epoch": 0.27, "learning_rate": 4.271004627148384e-06, "loss": 0.925, "step": 14414 }, { "epoch": 0.27, "learning_rate": 4.270896800502015e-06, "loss": 0.7669, "step": 14415 }, { "epoch": 0.27, "learning_rate": 4.270788967243171e-06, "loss": 0.8486, "step": 14416 }, { "epoch": 0.27, "learning_rate": 4.270681127372255e-06, "loss": 0.9582, "step": 14417 }, { "epoch": 0.27, "learning_rate": 4.270573280889671e-06, "loss": 0.9565, "step": 14418 }, { "epoch": 0.27, "learning_rate": 4.270465427795819e-06, "loss": 1.2072, "step": 14419 }, { "epoch": 0.27, "learning_rate": 4.270357568091104e-06, "loss": 0.9402, "step": 14420 }, { "epoch": 0.27, "learning_rate": 4.27024970177593e-06, "loss": 0.9409, "step": 14421 }, { "epoch": 0.27, "learning_rate": 4.270141828850694e-06, "loss": 0.8865, "step": 14422 }, { "epoch": 0.27, "learning_rate": 4.270033949315806e-06, "loss": 0.7924, "step": 14423 }, { "epoch": 0.27, "learning_rate": 4.2699260631716645e-06, "loss": 1.0763, "step": 14424 }, { "epoch": 0.27, "learning_rate": 4.269818170418674e-06, "loss": 1.0549, "step": 14425 }, { "epoch": 0.27, "learning_rate": 4.269710271057235e-06, "loss": 1.1214, "step": 14426 }, { "epoch": 0.27, "learning_rate": 4.269602365087754e-06, "loss": 1.0352, "step": 14427 }, { "epoch": 0.27, "learning_rate": 4.269494452510631e-06, "loss": 0.9726, "step": 14428 }, { "epoch": 0.27, "learning_rate": 4.26938653332627e-06, "loss": 0.7724, "step": 14429 }, { "epoch": 0.27, "learning_rate": 4.269278607535074e-06, "loss": 0.9595, "step": 14430 }, { "epoch": 0.27, "learning_rate": 4.2691706751374465e-06, "loss": 1.1385, "step": 14431 }, { "epoch": 0.27, "learning_rate": 4.269062736133789e-06, "loss": 1.0469, "step": 14432 }, { "epoch": 0.27, "learning_rate": 4.2689547905245055e-06, "loss": 0.8317, "step": 14433 }, { "epoch": 0.27, "learning_rate": 4.268846838309999e-06, "loss": 0.8863, "step": 14434 }, { "epoch": 0.27, "learning_rate": 4.268738879490674e-06, "loss": 0.7346, "step": 14435 }, { "epoch": 0.27, "learning_rate": 4.268630914066931e-06, "loss": 1.0455, "step": 14436 }, { "epoch": 0.27, "learning_rate": 4.268522942039175e-06, "loss": 0.9671, "step": 14437 }, { "epoch": 0.27, "learning_rate": 4.268414963407809e-06, "loss": 1.0453, "step": 14438 }, { "epoch": 0.27, "learning_rate": 4.268306978173234e-06, "loss": 0.8202, "step": 14439 }, { "epoch": 0.27, "learning_rate": 4.268198986335857e-06, "loss": 0.8889, "step": 14440 }, { "epoch": 0.27, "learning_rate": 4.268090987896077e-06, "loss": 0.8534, "step": 14441 }, { "epoch": 0.27, "learning_rate": 4.267982982854302e-06, "loss": 0.8134, "step": 14442 }, { "epoch": 0.27, "learning_rate": 4.26787497121093e-06, "loss": 0.8851, "step": 14443 }, { "epoch": 0.27, "learning_rate": 4.267766952966369e-06, "loss": 1.057, "step": 14444 }, { "epoch": 0.27, "learning_rate": 4.26765892812102e-06, "loss": 0.9613, "step": 14445 }, { "epoch": 0.27, "learning_rate": 4.267550896675286e-06, "loss": 0.8289, "step": 14446 }, { "epoch": 0.27, "learning_rate": 4.267442858629573e-06, "loss": 0.9217, "step": 14447 }, { "epoch": 0.27, "learning_rate": 4.267334813984281e-06, "loss": 0.9871, "step": 14448 }, { "epoch": 0.27, "learning_rate": 4.267226762739815e-06, "loss": 1.0467, "step": 14449 }, { "epoch": 0.27, "learning_rate": 4.267118704896579e-06, "loss": 1.1945, "step": 14450 }, { "epoch": 0.27, "learning_rate": 4.267010640454976e-06, "loss": 0.895, "step": 14451 }, { "epoch": 0.27, "learning_rate": 4.26690256941541e-06, "loss": 0.9284, "step": 14452 }, { "epoch": 0.27, "learning_rate": 4.266794491778282e-06, "loss": 0.8983, "step": 14453 }, { "epoch": 0.27, "learning_rate": 4.266686407543998e-06, "loss": 0.8068, "step": 14454 }, { "epoch": 0.27, "learning_rate": 4.2665783167129625e-06, "loss": 0.9567, "step": 14455 }, { "epoch": 0.27, "learning_rate": 4.266470219285578e-06, "loss": 1.0708, "step": 14456 }, { "epoch": 0.27, "learning_rate": 4.266362115262246e-06, "loss": 0.9542, "step": 14457 }, { "epoch": 0.27, "learning_rate": 4.266254004643373e-06, "loss": 0.7849, "step": 14458 }, { "epoch": 0.27, "learning_rate": 4.266145887429362e-06, "loss": 0.8955, "step": 14459 }, { "epoch": 0.27, "learning_rate": 4.266037763620616e-06, "loss": 0.7843, "step": 14460 }, { "epoch": 0.27, "learning_rate": 4.26592963321754e-06, "loss": 0.8553, "step": 14461 }, { "epoch": 0.27, "learning_rate": 4.265821496220535e-06, "loss": 1.0789, "step": 14462 }, { "epoch": 0.27, "learning_rate": 4.265713352630008e-06, "loss": 1.2314, "step": 14463 }, { "epoch": 0.27, "learning_rate": 4.265605202446361e-06, "loss": 0.9736, "step": 14464 }, { "epoch": 0.27, "learning_rate": 4.265497045669998e-06, "loss": 0.8623, "step": 14465 }, { "epoch": 0.27, "learning_rate": 4.265388882301324e-06, "loss": 0.8948, "step": 14466 }, { "epoch": 0.27, "learning_rate": 4.265280712340743e-06, "loss": 0.9415, "step": 14467 }, { "epoch": 0.27, "learning_rate": 4.265172535788656e-06, "loss": 1.1721, "step": 14468 }, { "epoch": 0.27, "learning_rate": 4.265064352645469e-06, "loss": 1.163, "step": 14469 }, { "epoch": 0.27, "learning_rate": 4.264956162911587e-06, "loss": 0.9067, "step": 14470 }, { "epoch": 0.27, "learning_rate": 4.264847966587412e-06, "loss": 0.9001, "step": 14471 }, { "epoch": 0.27, "learning_rate": 4.264739763673349e-06, "loss": 0.8764, "step": 14472 }, { "epoch": 0.27, "learning_rate": 4.264631554169803e-06, "loss": 1.0604, "step": 14473 }, { "epoch": 0.27, "learning_rate": 4.264523338077174e-06, "loss": 0.8588, "step": 14474 }, { "epoch": 0.27, "learning_rate": 4.264415115395871e-06, "loss": 1.1052, "step": 14475 }, { "epoch": 0.27, "learning_rate": 4.264306886126296e-06, "loss": 0.8895, "step": 14476 }, { "epoch": 0.27, "learning_rate": 4.264198650268852e-06, "loss": 0.7905, "step": 14477 }, { "epoch": 0.27, "learning_rate": 4.264090407823946e-06, "loss": 0.9121, "step": 14478 }, { "epoch": 0.27, "learning_rate": 4.26398215879198e-06, "loss": 0.7346, "step": 14479 }, { "epoch": 0.27, "learning_rate": 4.263873903173359e-06, "loss": 0.9441, "step": 14480 }, { "epoch": 0.27, "learning_rate": 4.263765640968486e-06, "loss": 1.1429, "step": 14481 }, { "epoch": 0.27, "learning_rate": 4.263657372177766e-06, "loss": 0.8967, "step": 14482 }, { "epoch": 0.27, "learning_rate": 4.263549096801605e-06, "loss": 1.0582, "step": 14483 }, { "epoch": 0.27, "learning_rate": 4.263440814840404e-06, "loss": 0.793, "step": 14484 }, { "epoch": 0.27, "learning_rate": 4.26333252629457e-06, "loss": 0.9644, "step": 14485 }, { "epoch": 0.27, "learning_rate": 4.263224231164506e-06, "loss": 0.8409, "step": 14486 }, { "epoch": 0.27, "learning_rate": 4.263115929450617e-06, "loss": 1.0303, "step": 14487 }, { "epoch": 0.27, "learning_rate": 4.263007621153307e-06, "loss": 1.1508, "step": 14488 }, { "epoch": 0.27, "learning_rate": 4.262899306272981e-06, "loss": 0.7425, "step": 14489 }, { "epoch": 0.27, "learning_rate": 4.262790984810043e-06, "loss": 0.8651, "step": 14490 }, { "epoch": 0.27, "learning_rate": 4.2626826567648975e-06, "loss": 0.9379, "step": 14491 }, { "epoch": 0.27, "learning_rate": 4.262574322137948e-06, "loss": 0.8569, "step": 14492 }, { "epoch": 0.27, "learning_rate": 4.262465980929601e-06, "loss": 0.967, "step": 14493 }, { "epoch": 0.27, "learning_rate": 4.26235763314026e-06, "loss": 1.1162, "step": 14494 }, { "epoch": 0.27, "learning_rate": 4.26224927877033e-06, "loss": 0.7717, "step": 14495 }, { "epoch": 0.27, "learning_rate": 4.2621409178202145e-06, "loss": 0.7356, "step": 14496 }, { "epoch": 0.27, "learning_rate": 4.262032550290319e-06, "loss": 0.8192, "step": 14497 }, { "epoch": 0.27, "learning_rate": 4.2619241761810485e-06, "loss": 0.9921, "step": 14498 }, { "epoch": 0.27, "learning_rate": 4.2618157954928065e-06, "loss": 0.9717, "step": 14499 }, { "epoch": 0.27, "learning_rate": 4.261707408225999e-06, "loss": 1.0911, "step": 14500 }, { "epoch": 0.27, "learning_rate": 4.261599014381029e-06, "loss": 0.9215, "step": 14501 }, { "epoch": 0.27, "learning_rate": 4.261490613958304e-06, "loss": 1.0865, "step": 14502 }, { "epoch": 0.27, "learning_rate": 4.261382206958226e-06, "loss": 1.072, "step": 14503 }, { "epoch": 0.27, "learning_rate": 4.2612737933812e-06, "loss": 0.7443, "step": 14504 }, { "epoch": 0.27, "learning_rate": 4.261165373227633e-06, "loss": 0.9901, "step": 14505 }, { "epoch": 0.27, "learning_rate": 4.2610569464979275e-06, "loss": 1.0698, "step": 14506 }, { "epoch": 0.27, "learning_rate": 4.26094851319249e-06, "loss": 1.0471, "step": 14507 }, { "epoch": 0.27, "learning_rate": 4.260840073311725e-06, "loss": 0.9268, "step": 14508 }, { "epoch": 0.27, "learning_rate": 4.260731626856036e-06, "loss": 0.9698, "step": 14509 }, { "epoch": 0.27, "learning_rate": 4.26062317382583e-06, "loss": 0.9176, "step": 14510 }, { "epoch": 0.27, "learning_rate": 4.260514714221511e-06, "loss": 1.0989, "step": 14511 }, { "epoch": 0.27, "learning_rate": 4.260406248043484e-06, "loss": 1.062, "step": 14512 }, { "epoch": 0.27, "learning_rate": 4.260297775292154e-06, "loss": 0.9402, "step": 14513 }, { "epoch": 0.27, "learning_rate": 4.260189295967926e-06, "loss": 0.8457, "step": 14514 }, { "epoch": 0.27, "learning_rate": 4.2600808100712055e-06, "loss": 0.8405, "step": 14515 }, { "epoch": 0.27, "learning_rate": 4.259972317602396e-06, "loss": 1.0399, "step": 14516 }, { "epoch": 0.27, "learning_rate": 4.259863818561906e-06, "loss": 1.0052, "step": 14517 }, { "epoch": 0.27, "learning_rate": 4.259755312950137e-06, "loss": 1.3326, "step": 14518 }, { "epoch": 0.27, "learning_rate": 4.259646800767495e-06, "loss": 1.1394, "step": 14519 }, { "epoch": 0.27, "learning_rate": 4.259538282014387e-06, "loss": 0.9763, "step": 14520 }, { "epoch": 0.27, "learning_rate": 4.259429756691217e-06, "loss": 0.8739, "step": 14521 }, { "epoch": 0.27, "learning_rate": 4.2593212247983895e-06, "loss": 0.8929, "step": 14522 }, { "epoch": 0.27, "learning_rate": 4.2592126863363105e-06, "loss": 0.7859, "step": 14523 }, { "epoch": 0.27, "learning_rate": 4.259104141305386e-06, "loss": 1.1297, "step": 14524 }, { "epoch": 0.27, "learning_rate": 4.25899558970602e-06, "loss": 1.1414, "step": 14525 }, { "epoch": 0.27, "learning_rate": 4.258887031538619e-06, "loss": 0.9339, "step": 14526 }, { "epoch": 0.27, "learning_rate": 4.258778466803587e-06, "loss": 0.9573, "step": 14527 }, { "epoch": 0.27, "learning_rate": 4.258669895501331e-06, "loss": 0.83, "step": 14528 }, { "epoch": 0.27, "learning_rate": 4.2585613176322546e-06, "loss": 0.9521, "step": 14529 }, { "epoch": 0.27, "learning_rate": 4.258452733196764e-06, "loss": 1.0289, "step": 14530 }, { "epoch": 0.27, "learning_rate": 4.2583441421952654e-06, "loss": 1.0618, "step": 14531 }, { "epoch": 0.27, "learning_rate": 4.258235544628164e-06, "loss": 0.885, "step": 14532 }, { "epoch": 0.27, "learning_rate": 4.258126940495865e-06, "loss": 0.9186, "step": 14533 }, { "epoch": 0.27, "learning_rate": 4.258018329798773e-06, "loss": 0.8788, "step": 14534 }, { "epoch": 0.27, "learning_rate": 4.257909712537295e-06, "loss": 0.9595, "step": 14535 }, { "epoch": 0.27, "learning_rate": 4.257801088711836e-06, "loss": 0.7623, "step": 14536 }, { "epoch": 0.27, "learning_rate": 4.257692458322802e-06, "loss": 1.2093, "step": 14537 }, { "epoch": 0.27, "learning_rate": 4.2575838213705974e-06, "loss": 1.0055, "step": 14538 }, { "epoch": 0.27, "learning_rate": 4.25747517785563e-06, "loss": 1.0467, "step": 14539 }, { "epoch": 0.27, "learning_rate": 4.2573665277783025e-06, "loss": 0.9505, "step": 14540 }, { "epoch": 0.27, "learning_rate": 4.2572578711390236e-06, "loss": 0.9062, "step": 14541 }, { "epoch": 0.27, "learning_rate": 4.257149207938197e-06, "loss": 0.7752, "step": 14542 }, { "epoch": 0.27, "learning_rate": 4.257040538176229e-06, "loss": 1.1378, "step": 14543 }, { "epoch": 0.27, "learning_rate": 4.2569318618535264e-06, "loss": 0.8582, "step": 14544 }, { "epoch": 0.27, "learning_rate": 4.2568231789704936e-06, "loss": 0.9866, "step": 14545 }, { "epoch": 0.27, "learning_rate": 4.256714489527537e-06, "loss": 0.8536, "step": 14546 }, { "epoch": 0.27, "learning_rate": 4.256605793525062e-06, "loss": 0.8077, "step": 14547 }, { "epoch": 0.27, "learning_rate": 4.2564970909634755e-06, "loss": 0.8163, "step": 14548 }, { "epoch": 0.27, "learning_rate": 4.256388381843182e-06, "loss": 0.9068, "step": 14549 }, { "epoch": 0.27, "learning_rate": 4.256279666164589e-06, "loss": 1.2614, "step": 14550 }, { "epoch": 0.27, "learning_rate": 4.2561709439281e-06, "loss": 1.1559, "step": 14551 }, { "epoch": 0.27, "learning_rate": 4.256062215134124e-06, "loss": 1.0477, "step": 14552 }, { "epoch": 0.27, "learning_rate": 4.255953479783065e-06, "loss": 0.9751, "step": 14553 }, { "epoch": 0.27, "learning_rate": 4.255844737875329e-06, "loss": 0.8496, "step": 14554 }, { "epoch": 0.27, "learning_rate": 4.255735989411324e-06, "loss": 1.0067, "step": 14555 }, { "epoch": 0.27, "learning_rate": 4.255627234391454e-06, "loss": 0.9587, "step": 14556 }, { "epoch": 0.27, "learning_rate": 4.255518472816125e-06, "loss": 1.0258, "step": 14557 }, { "epoch": 0.27, "learning_rate": 4.255409704685745e-06, "loss": 0.9908, "step": 14558 }, { "epoch": 0.27, "learning_rate": 4.255300930000718e-06, "loss": 0.7231, "step": 14559 }, { "epoch": 0.27, "learning_rate": 4.2551921487614515e-06, "loss": 0.9643, "step": 14560 }, { "epoch": 0.27, "learning_rate": 4.255083360968352e-06, "loss": 0.9136, "step": 14561 }, { "epoch": 0.27, "learning_rate": 4.254974566621824e-06, "loss": 1.0872, "step": 14562 }, { "epoch": 0.27, "learning_rate": 4.254865765722275e-06, "loss": 0.9658, "step": 14563 }, { "epoch": 0.27, "learning_rate": 4.254756958270111e-06, "loss": 0.8809, "step": 14564 }, { "epoch": 0.27, "learning_rate": 4.254648144265739e-06, "loss": 0.8707, "step": 14565 }, { "epoch": 0.27, "learning_rate": 4.254539323709564e-06, "loss": 0.8557, "step": 14566 }, { "epoch": 0.27, "learning_rate": 4.254430496601993e-06, "loss": 1.0074, "step": 14567 }, { "epoch": 0.27, "learning_rate": 4.254321662943432e-06, "loss": 1.5758, "step": 14568 }, { "epoch": 0.27, "learning_rate": 4.254212822734289e-06, "loss": 1.1064, "step": 14569 }, { "epoch": 0.27, "learning_rate": 4.254103975974968e-06, "loss": 0.9897, "step": 14570 }, { "epoch": 0.27, "learning_rate": 4.253995122665877e-06, "loss": 0.953, "step": 14571 }, { "epoch": 0.27, "learning_rate": 4.253886262807422e-06, "loss": 0.9537, "step": 14572 }, { "epoch": 0.27, "learning_rate": 4.253777396400008e-06, "loss": 0.7292, "step": 14573 }, { "epoch": 0.27, "learning_rate": 4.253668523444046e-06, "loss": 0.8331, "step": 14574 }, { "epoch": 0.27, "learning_rate": 4.253559643939937e-06, "loss": 1.1323, "step": 14575 }, { "epoch": 0.28, "learning_rate": 4.25345075788809e-06, "loss": 1.134, "step": 14576 }, { "epoch": 0.28, "learning_rate": 4.253341865288914e-06, "loss": 0.828, "step": 14577 }, { "epoch": 0.28, "learning_rate": 4.25323296614281e-06, "loss": 0.834, "step": 14578 }, { "epoch": 0.28, "learning_rate": 4.25312406045019e-06, "loss": 0.7666, "step": 14579 }, { "epoch": 0.28, "learning_rate": 4.2530151482114585e-06, "loss": 0.9133, "step": 14580 }, { "epoch": 0.28, "learning_rate": 4.2529062294270215e-06, "loss": 1.1995, "step": 14581 }, { "epoch": 0.28, "learning_rate": 4.252797304097287e-06, "loss": 1.1752, "step": 14582 }, { "epoch": 0.28, "learning_rate": 4.252688372222661e-06, "loss": 0.915, "step": 14583 }, { "epoch": 0.28, "learning_rate": 4.25257943380355e-06, "loss": 0.8971, "step": 14584 }, { "epoch": 0.28, "learning_rate": 4.252470488840361e-06, "loss": 0.8539, "step": 14585 }, { "epoch": 0.28, "learning_rate": 4.252361537333501e-06, "loss": 1.0081, "step": 14586 }, { "epoch": 0.28, "learning_rate": 4.2522525792833765e-06, "loss": 1.0171, "step": 14587 }, { "epoch": 0.28, "learning_rate": 4.252143614690395e-06, "loss": 0.9798, "step": 14588 }, { "epoch": 0.28, "learning_rate": 4.252034643554963e-06, "loss": 0.8936, "step": 14589 }, { "epoch": 0.28, "learning_rate": 4.251925665877487e-06, "loss": 0.9293, "step": 14590 }, { "epoch": 0.28, "learning_rate": 4.251816681658375e-06, "loss": 0.7558, "step": 14591 }, { "epoch": 0.28, "learning_rate": 4.251707690898033e-06, "loss": 1.1196, "step": 14592 }, { "epoch": 0.28, "learning_rate": 4.251598693596868e-06, "loss": 0.8598, "step": 14593 }, { "epoch": 0.28, "learning_rate": 4.2514896897552875e-06, "loss": 1.0375, "step": 14594 }, { "epoch": 0.28, "learning_rate": 4.251380679373698e-06, "loss": 0.8521, "step": 14595 }, { "epoch": 0.28, "learning_rate": 4.2512716624525055e-06, "loss": 1.1075, "step": 14596 }, { "epoch": 0.28, "learning_rate": 4.25116263899212e-06, "loss": 0.8553, "step": 14597 }, { "epoch": 0.28, "learning_rate": 4.251053608992946e-06, "loss": 0.9538, "step": 14598 }, { "epoch": 0.28, "learning_rate": 4.250944572455392e-06, "loss": 1.0543, "step": 14599 }, { "epoch": 0.28, "learning_rate": 4.250835529379864e-06, "loss": 1.0464, "step": 14600 }, { "epoch": 0.28, "learning_rate": 4.2507264797667705e-06, "loss": 0.8451, "step": 14601 }, { "epoch": 0.28, "learning_rate": 4.250617423616518e-06, "loss": 0.7545, "step": 14602 }, { "epoch": 0.28, "learning_rate": 4.250508360929514e-06, "loss": 0.9988, "step": 14603 }, { "epoch": 0.28, "learning_rate": 4.250399291706165e-06, "loss": 0.8836, "step": 14604 }, { "epoch": 0.28, "learning_rate": 4.250290215946878e-06, "loss": 0.95, "step": 14605 }, { "epoch": 0.28, "learning_rate": 4.250181133652062e-06, "loss": 1.0141, "step": 14606 }, { "epoch": 0.28, "learning_rate": 4.2500720448221226e-06, "loss": 0.8599, "step": 14607 }, { "epoch": 0.28, "learning_rate": 4.249962949457468e-06, "loss": 0.8969, "step": 14608 }, { "epoch": 0.28, "learning_rate": 4.249853847558506e-06, "loss": 1.0556, "step": 14609 }, { "epoch": 0.28, "learning_rate": 4.249744739125643e-06, "loss": 1.0656, "step": 14610 }, { "epoch": 0.28, "learning_rate": 4.249635624159287e-06, "loss": 1.0278, "step": 14611 }, { "epoch": 0.28, "learning_rate": 4.249526502659845e-06, "loss": 1.0136, "step": 14612 }, { "epoch": 0.28, "learning_rate": 4.249417374627724e-06, "loss": 0.8596, "step": 14613 }, { "epoch": 0.28, "learning_rate": 4.249308240063333e-06, "loss": 0.8398, "step": 14614 }, { "epoch": 0.28, "learning_rate": 4.249199098967079e-06, "loss": 0.9679, "step": 14615 }, { "epoch": 0.28, "learning_rate": 4.249089951339369e-06, "loss": 0.9045, "step": 14616 }, { "epoch": 0.28, "learning_rate": 4.24898079718061e-06, "loss": 0.9857, "step": 14617 }, { "epoch": 0.28, "learning_rate": 4.248871636491211e-06, "loss": 1.0304, "step": 14618 }, { "epoch": 0.28, "learning_rate": 4.248762469271579e-06, "loss": 0.8188, "step": 14619 }, { "epoch": 0.28, "learning_rate": 4.2486532955221214e-06, "loss": 0.9513, "step": 14620 }, { "epoch": 0.28, "learning_rate": 4.248544115243246e-06, "loss": 1.0437, "step": 14621 }, { "epoch": 0.28, "learning_rate": 4.24843492843536e-06, "loss": 0.9481, "step": 14622 }, { "epoch": 0.28, "learning_rate": 4.248325735098872e-06, "loss": 0.8025, "step": 14623 }, { "epoch": 0.28, "learning_rate": 4.24821653523419e-06, "loss": 1.1428, "step": 14624 }, { "epoch": 0.28, "learning_rate": 4.24810732884172e-06, "loss": 1.0836, "step": 14625 }, { "epoch": 0.28, "learning_rate": 4.247998115921871e-06, "loss": 0.9544, "step": 14626 }, { "epoch": 0.28, "learning_rate": 4.247888896475051e-06, "loss": 0.9384, "step": 14627 }, { "epoch": 0.28, "learning_rate": 4.2477796705016675e-06, "loss": 1.1758, "step": 14628 }, { "epoch": 0.28, "learning_rate": 4.2476704380021275e-06, "loss": 1.0264, "step": 14629 }, { "epoch": 0.28, "learning_rate": 4.247561198976841e-06, "loss": 0.9407, "step": 14630 }, { "epoch": 0.28, "learning_rate": 4.2474519534262135e-06, "loss": 1.0552, "step": 14631 }, { "epoch": 0.28, "learning_rate": 4.2473427013506545e-06, "loss": 0.9712, "step": 14632 }, { "epoch": 0.28, "learning_rate": 4.247233442750571e-06, "loss": 0.9297, "step": 14633 }, { "epoch": 0.28, "learning_rate": 4.247124177626371e-06, "loss": 0.983, "step": 14634 }, { "epoch": 0.28, "learning_rate": 4.247014905978464e-06, "loss": 0.8828, "step": 14635 }, { "epoch": 0.28, "learning_rate": 4.246905627807256e-06, "loss": 0.9362, "step": 14636 }, { "epoch": 0.28, "learning_rate": 4.2467963431131565e-06, "loss": 1.1887, "step": 14637 }, { "epoch": 0.28, "learning_rate": 4.2466870518965734e-06, "loss": 0.9412, "step": 14638 }, { "epoch": 0.28, "learning_rate": 4.246577754157914e-06, "loss": 0.9224, "step": 14639 }, { "epoch": 0.28, "learning_rate": 4.246468449897586e-06, "loss": 0.9692, "step": 14640 }, { "epoch": 0.28, "learning_rate": 4.2463591391159984e-06, "loss": 0.8904, "step": 14641 }, { "epoch": 0.28, "learning_rate": 4.24624982181356e-06, "loss": 0.8068, "step": 14642 }, { "epoch": 0.28, "learning_rate": 4.246140497990679e-06, "loss": 1.0247, "step": 14643 }, { "epoch": 0.28, "learning_rate": 4.246031167647761e-06, "loss": 1.1146, "step": 14644 }, { "epoch": 0.28, "learning_rate": 4.245921830785218e-06, "loss": 1.0889, "step": 14645 }, { "epoch": 0.28, "learning_rate": 4.245812487403456e-06, "loss": 0.9576, "step": 14646 }, { "epoch": 0.28, "learning_rate": 4.245703137502883e-06, "loss": 0.8387, "step": 14647 }, { "epoch": 0.28, "learning_rate": 4.245593781083909e-06, "loss": 0.7472, "step": 14648 }, { "epoch": 0.28, "learning_rate": 4.245484418146941e-06, "loss": 0.8362, "step": 14649 }, { "epoch": 0.28, "learning_rate": 4.245375048692387e-06, "loss": 1.0783, "step": 14650 }, { "epoch": 0.28, "learning_rate": 4.245265672720657e-06, "loss": 0.9449, "step": 14651 }, { "epoch": 0.28, "learning_rate": 4.245156290232158e-06, "loss": 0.6328, "step": 14652 }, { "epoch": 0.28, "learning_rate": 4.2450469012272985e-06, "loss": 0.8658, "step": 14653 }, { "epoch": 0.28, "learning_rate": 4.244937505706489e-06, "loss": 0.9218, "step": 14654 }, { "epoch": 0.28, "learning_rate": 4.244828103670135e-06, "loss": 1.0219, "step": 14655 }, { "epoch": 0.28, "learning_rate": 4.2447186951186455e-06, "loss": 0.9411, "step": 14656 }, { "epoch": 0.28, "learning_rate": 4.244609280052432e-06, "loss": 0.91, "step": 14657 }, { "epoch": 0.28, "learning_rate": 4.2444998584719e-06, "loss": 0.8141, "step": 14658 }, { "epoch": 0.28, "learning_rate": 4.244390430377459e-06, "loss": 0.7103, "step": 14659 }, { "epoch": 0.28, "learning_rate": 4.2442809957695175e-06, "loss": 0.8936, "step": 14660 }, { "epoch": 0.28, "learning_rate": 4.244171554648484e-06, "loss": 0.8684, "step": 14661 }, { "epoch": 0.28, "learning_rate": 4.244062107014767e-06, "loss": 1.001, "step": 14662 }, { "epoch": 0.28, "learning_rate": 4.243952652868777e-06, "loss": 0.7484, "step": 14663 }, { "epoch": 0.28, "learning_rate": 4.24384319221092e-06, "loss": 0.8326, "step": 14664 }, { "epoch": 0.28, "learning_rate": 4.243733725041606e-06, "loss": 1.101, "step": 14665 }, { "epoch": 0.28, "learning_rate": 4.243624251361245e-06, "loss": 0.8616, "step": 14666 }, { "epoch": 0.28, "learning_rate": 4.243514771170244e-06, "loss": 0.9508, "step": 14667 }, { "epoch": 0.28, "learning_rate": 4.2434052844690115e-06, "loss": 0.987, "step": 14668 }, { "epoch": 0.28, "learning_rate": 4.243295791257957e-06, "loss": 1.0282, "step": 14669 }, { "epoch": 0.28, "learning_rate": 4.243186291537491e-06, "loss": 0.9292, "step": 14670 }, { "epoch": 0.28, "learning_rate": 4.24307678530802e-06, "loss": 0.9277, "step": 14671 }, { "epoch": 0.28, "learning_rate": 4.242967272569953e-06, "loss": 0.8401, "step": 14672 }, { "epoch": 0.28, "learning_rate": 4.242857753323701e-06, "loss": 0.7094, "step": 14673 }, { "epoch": 0.28, "learning_rate": 4.242748227569671e-06, "loss": 1.0561, "step": 14674 }, { "epoch": 0.28, "learning_rate": 4.242638695308272e-06, "loss": 0.998, "step": 14675 }, { "epoch": 0.28, "learning_rate": 4.242529156539914e-06, "loss": 1.0753, "step": 14676 }, { "epoch": 0.28, "learning_rate": 4.242419611265006e-06, "loss": 0.7511, "step": 14677 }, { "epoch": 0.28, "learning_rate": 4.242310059483956e-06, "loss": 0.7751, "step": 14678 }, { "epoch": 0.28, "learning_rate": 4.242200501197173e-06, "loss": 0.8323, "step": 14679 }, { "epoch": 0.28, "learning_rate": 4.242090936405069e-06, "loss": 0.8252, "step": 14680 }, { "epoch": 0.28, "learning_rate": 4.241981365108049e-06, "loss": 0.8758, "step": 14681 }, { "epoch": 0.28, "learning_rate": 4.241871787306524e-06, "loss": 0.818, "step": 14682 }, { "epoch": 0.28, "learning_rate": 4.241762203000904e-06, "loss": 0.8137, "step": 14683 }, { "epoch": 0.28, "learning_rate": 4.241652612191597e-06, "loss": 0.96, "step": 14684 }, { "epoch": 0.28, "learning_rate": 4.241543014879013e-06, "loss": 0.8688, "step": 14685 }, { "epoch": 0.28, "learning_rate": 4.241433411063559e-06, "loss": 0.8328, "step": 14686 }, { "epoch": 0.28, "learning_rate": 4.2413238007456485e-06, "loss": 1.0206, "step": 14687 }, { "epoch": 0.28, "learning_rate": 4.241214183925686e-06, "loss": 1.0557, "step": 14688 }, { "epoch": 0.28, "learning_rate": 4.241104560604085e-06, "loss": 0.8853, "step": 14689 }, { "epoch": 0.28, "learning_rate": 4.240994930781251e-06, "loss": 0.8799, "step": 14690 }, { "epoch": 0.28, "learning_rate": 4.240885294457597e-06, "loss": 0.9166, "step": 14691 }, { "epoch": 0.28, "learning_rate": 4.24077565163353e-06, "loss": 0.8352, "step": 14692 }, { "epoch": 0.28, "learning_rate": 4.24066600230946e-06, "loss": 1.1644, "step": 14693 }, { "epoch": 0.28, "learning_rate": 4.2405563464857975e-06, "loss": 0.9736, "step": 14694 }, { "epoch": 0.28, "learning_rate": 4.24044668416295e-06, "loss": 1.2045, "step": 14695 }, { "epoch": 0.28, "learning_rate": 4.240337015341328e-06, "loss": 0.9346, "step": 14696 }, { "epoch": 0.28, "learning_rate": 4.240227340021341e-06, "loss": 0.7979, "step": 14697 }, { "epoch": 0.28, "learning_rate": 4.240117658203399e-06, "loss": 0.8422, "step": 14698 }, { "epoch": 0.28, "learning_rate": 4.240007969887911e-06, "loss": 1.0279, "step": 14699 }, { "epoch": 0.28, "learning_rate": 4.239898275075286e-06, "loss": 1.0822, "step": 14700 }, { "epoch": 0.28, "learning_rate": 4.239788573765934e-06, "loss": 0.95, "step": 14701 }, { "epoch": 0.28, "learning_rate": 4.239678865960265e-06, "loss": 0.7544, "step": 14702 }, { "epoch": 0.28, "learning_rate": 4.239569151658689e-06, "loss": 0.7575, "step": 14703 }, { "epoch": 0.28, "learning_rate": 4.239459430861614e-06, "loss": 0.7765, "step": 14704 }, { "epoch": 0.28, "learning_rate": 4.239349703569452e-06, "loss": 0.8276, "step": 14705 }, { "epoch": 0.28, "learning_rate": 4.2392399697826115e-06, "loss": 0.9999, "step": 14706 }, { "epoch": 0.28, "learning_rate": 4.239130229501502e-06, "loss": 0.8106, "step": 14707 }, { "epoch": 0.28, "learning_rate": 4.239020482726533e-06, "loss": 1.0244, "step": 14708 }, { "epoch": 0.28, "learning_rate": 4.238910729458116e-06, "loss": 0.8266, "step": 14709 }, { "epoch": 0.28, "learning_rate": 4.238800969696659e-06, "loss": 0.7636, "step": 14710 }, { "epoch": 0.28, "learning_rate": 4.238691203442572e-06, "loss": 1.1082, "step": 14711 }, { "epoch": 0.28, "learning_rate": 4.2385814306962655e-06, "loss": 0.951, "step": 14712 }, { "epoch": 0.28, "learning_rate": 4.238471651458151e-06, "loss": 0.9716, "step": 14713 }, { "epoch": 0.28, "learning_rate": 4.238361865728634e-06, "loss": 0.9007, "step": 14714 }, { "epoch": 0.28, "learning_rate": 4.238252073508128e-06, "loss": 0.9135, "step": 14715 }, { "epoch": 0.28, "learning_rate": 4.238142274797043e-06, "loss": 0.7489, "step": 14716 }, { "epoch": 0.28, "learning_rate": 4.238032469595788e-06, "loss": 1.0149, "step": 14717 }, { "epoch": 0.28, "learning_rate": 4.237922657904772e-06, "loss": 1.2666, "step": 14718 }, { "epoch": 0.28, "learning_rate": 4.237812839724406e-06, "loss": 0.8998, "step": 14719 }, { "epoch": 0.28, "learning_rate": 4.237703015055101e-06, "loss": 0.8409, "step": 14720 }, { "epoch": 0.28, "learning_rate": 4.237593183897266e-06, "loss": 0.8272, "step": 14721 }, { "epoch": 0.28, "learning_rate": 4.237483346251311e-06, "loss": 0.8823, "step": 14722 }, { "epoch": 0.28, "learning_rate": 4.237373502117646e-06, "loss": 0.9636, "step": 14723 }, { "epoch": 0.28, "learning_rate": 4.237263651496683e-06, "loss": 1.0052, "step": 14724 }, { "epoch": 0.28, "learning_rate": 4.237153794388829e-06, "loss": 1.0833, "step": 14725 }, { "epoch": 0.28, "learning_rate": 4.237043930794498e-06, "loss": 0.7695, "step": 14726 }, { "epoch": 0.28, "learning_rate": 4.236934060714097e-06, "loss": 0.8127, "step": 14727 }, { "epoch": 0.28, "learning_rate": 4.236824184148038e-06, "loss": 0.7719, "step": 14728 }, { "epoch": 0.28, "learning_rate": 4.23671430109673e-06, "loss": 0.9382, "step": 14729 }, { "epoch": 0.28, "learning_rate": 4.236604411560585e-06, "loss": 0.8848, "step": 14730 }, { "epoch": 0.28, "learning_rate": 4.236494515540012e-06, "loss": 1.0496, "step": 14731 }, { "epoch": 0.28, "learning_rate": 4.236384613035421e-06, "loss": 0.9818, "step": 14732 }, { "epoch": 0.28, "learning_rate": 4.236274704047224e-06, "loss": 0.7692, "step": 14733 }, { "epoch": 0.28, "learning_rate": 4.236164788575831e-06, "loss": 0.9221, "step": 14734 }, { "epoch": 0.28, "learning_rate": 4.2360548666216506e-06, "loss": 1.1143, "step": 14735 }, { "epoch": 0.28, "learning_rate": 4.235944938185095e-06, "loss": 0.9518, "step": 14736 }, { "epoch": 0.28, "learning_rate": 4.235835003266575e-06, "loss": 1.1068, "step": 14737 }, { "epoch": 0.28, "learning_rate": 4.235725061866499e-06, "loss": 1.0676, "step": 14738 }, { "epoch": 0.28, "learning_rate": 4.2356151139852796e-06, "loss": 0.953, "step": 14739 }, { "epoch": 0.28, "learning_rate": 4.235505159623327e-06, "loss": 1.0287, "step": 14740 }, { "epoch": 0.28, "learning_rate": 4.235395198781051e-06, "loss": 0.9053, "step": 14741 }, { "epoch": 0.28, "learning_rate": 4.235285231458861e-06, "loss": 0.8643, "step": 14742 }, { "epoch": 0.28, "learning_rate": 4.235175257657171e-06, "loss": 0.813, "step": 14743 }, { "epoch": 0.28, "learning_rate": 4.23506527737639e-06, "loss": 1.1716, "step": 14744 }, { "epoch": 0.28, "learning_rate": 4.234955290616927e-06, "loss": 0.7924, "step": 14745 }, { "epoch": 0.28, "learning_rate": 4.2348452973791955e-06, "loss": 0.8305, "step": 14746 }, { "epoch": 0.28, "learning_rate": 4.234735297663604e-06, "loss": 0.9439, "step": 14747 }, { "epoch": 0.28, "learning_rate": 4.2346252914705645e-06, "loss": 0.8851, "step": 14748 }, { "epoch": 0.28, "learning_rate": 4.234515278800486e-06, "loss": 1.1228, "step": 14749 }, { "epoch": 0.28, "learning_rate": 4.234405259653782e-06, "loss": 1.2267, "step": 14750 }, { "epoch": 0.28, "learning_rate": 4.234295234030862e-06, "loss": 0.8985, "step": 14751 }, { "epoch": 0.28, "learning_rate": 4.234185201932137e-06, "loss": 0.9125, "step": 14752 }, { "epoch": 0.28, "learning_rate": 4.234075163358017e-06, "loss": 0.8969, "step": 14753 }, { "epoch": 0.28, "learning_rate": 4.233965118308913e-06, "loss": 0.8557, "step": 14754 }, { "epoch": 0.28, "learning_rate": 4.233855066785237e-06, "loss": 0.8655, "step": 14755 }, { "epoch": 0.28, "learning_rate": 4.2337450087874e-06, "loss": 1.1439, "step": 14756 }, { "epoch": 0.28, "learning_rate": 4.233634944315811e-06, "loss": 0.9164, "step": 14757 }, { "epoch": 0.28, "learning_rate": 4.233524873370884e-06, "loss": 0.9795, "step": 14758 }, { "epoch": 0.28, "learning_rate": 4.233414795953027e-06, "loss": 1.0526, "step": 14759 }, { "epoch": 0.28, "learning_rate": 4.2333047120626516e-06, "loss": 0.6907, "step": 14760 }, { "epoch": 0.28, "learning_rate": 4.233194621700171e-06, "loss": 0.807, "step": 14761 }, { "epoch": 0.28, "learning_rate": 4.233084524865995e-06, "loss": 1.1531, "step": 14762 }, { "epoch": 0.28, "learning_rate": 4.232974421560533e-06, "loss": 1.0813, "step": 14763 }, { "epoch": 0.28, "learning_rate": 4.232864311784198e-06, "loss": 0.9786, "step": 14764 }, { "epoch": 0.28, "learning_rate": 4.232754195537402e-06, "loss": 0.8264, "step": 14765 }, { "epoch": 0.28, "learning_rate": 4.232644072820554e-06, "loss": 1.0891, "step": 14766 }, { "epoch": 0.28, "learning_rate": 4.2325339436340665e-06, "loss": 0.9985, "step": 14767 }, { "epoch": 0.28, "learning_rate": 4.23242380797835e-06, "loss": 1.076, "step": 14768 }, { "epoch": 0.28, "learning_rate": 4.232313665853817e-06, "loss": 0.9924, "step": 14769 }, { "epoch": 0.28, "learning_rate": 4.232203517260877e-06, "loss": 1.0447, "step": 14770 }, { "epoch": 0.28, "learning_rate": 4.232093362199942e-06, "loss": 0.845, "step": 14771 }, { "epoch": 0.28, "learning_rate": 4.231983200671424e-06, "loss": 0.7095, "step": 14772 }, { "epoch": 0.28, "learning_rate": 4.231873032675734e-06, "loss": 0.7382, "step": 14773 }, { "epoch": 0.28, "learning_rate": 4.231762858213283e-06, "loss": 1.1491, "step": 14774 }, { "epoch": 0.28, "learning_rate": 4.231652677284483e-06, "loss": 1.1512, "step": 14775 }, { "epoch": 0.28, "learning_rate": 4.231542489889744e-06, "loss": 1.0399, "step": 14776 }, { "epoch": 0.28, "learning_rate": 4.2314322960294785e-06, "loss": 0.8579, "step": 14777 }, { "epoch": 0.28, "learning_rate": 4.2313220957040985e-06, "loss": 0.7818, "step": 14778 }, { "epoch": 0.28, "learning_rate": 4.231211888914016e-06, "loss": 0.8934, "step": 14779 }, { "epoch": 0.28, "learning_rate": 4.231101675659639e-06, "loss": 0.8828, "step": 14780 }, { "epoch": 0.28, "learning_rate": 4.230991455941382e-06, "loss": 0.9716, "step": 14781 }, { "epoch": 0.28, "learning_rate": 4.230881229759657e-06, "loss": 0.899, "step": 14782 }, { "epoch": 0.28, "learning_rate": 4.2307709971148745e-06, "loss": 0.9238, "step": 14783 }, { "epoch": 0.28, "learning_rate": 4.230660758007446e-06, "loss": 0.7734, "step": 14784 }, { "epoch": 0.28, "learning_rate": 4.230550512437782e-06, "loss": 0.9888, "step": 14785 }, { "epoch": 0.28, "learning_rate": 4.230440260406296e-06, "loss": 1.0804, "step": 14786 }, { "epoch": 0.28, "learning_rate": 4.230330001913401e-06, "loss": 0.9995, "step": 14787 }, { "epoch": 0.28, "learning_rate": 4.230219736959505e-06, "loss": 1.1197, "step": 14788 }, { "epoch": 0.28, "learning_rate": 4.230109465545022e-06, "loss": 0.9997, "step": 14789 }, { "epoch": 0.28, "learning_rate": 4.229999187670363e-06, "loss": 0.8929, "step": 14790 }, { "epoch": 0.28, "learning_rate": 4.22988890333594e-06, "loss": 1.0892, "step": 14791 }, { "epoch": 0.28, "learning_rate": 4.229778612542166e-06, "loss": 0.8726, "step": 14792 }, { "epoch": 0.28, "learning_rate": 4.2296683152894505e-06, "loss": 1.2556, "step": 14793 }, { "epoch": 0.28, "learning_rate": 4.229558011578208e-06, "loss": 0.8661, "step": 14794 }, { "epoch": 0.28, "learning_rate": 4.229447701408847e-06, "loss": 0.8682, "step": 14795 }, { "epoch": 0.28, "learning_rate": 4.229337384781782e-06, "loss": 1.1055, "step": 14796 }, { "epoch": 0.28, "learning_rate": 4.229227061697425e-06, "loss": 1.0093, "step": 14797 }, { "epoch": 0.28, "learning_rate": 4.229116732156186e-06, "loss": 0.8716, "step": 14798 }, { "epoch": 0.28, "learning_rate": 4.229006396158479e-06, "loss": 1.1277, "step": 14799 }, { "epoch": 0.28, "learning_rate": 4.228896053704716e-06, "loss": 1.0524, "step": 14800 }, { "epoch": 0.28, "learning_rate": 4.228785704795305e-06, "loss": 0.978, "step": 14801 }, { "epoch": 0.28, "learning_rate": 4.228675349430664e-06, "loss": 0.7117, "step": 14802 }, { "epoch": 0.28, "learning_rate": 4.228564987611202e-06, "loss": 0.8335, "step": 14803 }, { "epoch": 0.28, "learning_rate": 4.22845461933733e-06, "loss": 0.9159, "step": 14804 }, { "epoch": 0.28, "learning_rate": 4.228344244609463e-06, "loss": 0.8931, "step": 14805 }, { "epoch": 0.28, "learning_rate": 4.228233863428011e-06, "loss": 1.1254, "step": 14806 }, { "epoch": 0.28, "learning_rate": 4.228123475793386e-06, "loss": 1.1653, "step": 14807 }, { "epoch": 0.28, "learning_rate": 4.2280130817060015e-06, "loss": 1.0909, "step": 14808 }, { "epoch": 0.28, "learning_rate": 4.227902681166269e-06, "loss": 0.9042, "step": 14809 }, { "epoch": 0.28, "learning_rate": 4.227792274174601e-06, "loss": 0.8521, "step": 14810 }, { "epoch": 0.28, "learning_rate": 4.22768186073141e-06, "loss": 0.9091, "step": 14811 }, { "epoch": 0.28, "learning_rate": 4.227571440837107e-06, "loss": 1.099, "step": 14812 }, { "epoch": 0.28, "learning_rate": 4.227461014492106e-06, "loss": 1.0254, "step": 14813 }, { "epoch": 0.28, "learning_rate": 4.227350581696817e-06, "loss": 0.7212, "step": 14814 }, { "epoch": 0.28, "learning_rate": 4.227240142451656e-06, "loss": 0.9587, "step": 14815 }, { "epoch": 0.28, "learning_rate": 4.227129696757032e-06, "loss": 0.9539, "step": 14816 }, { "epoch": 0.28, "learning_rate": 4.22701924461336e-06, "loss": 0.8713, "step": 14817 }, { "epoch": 0.28, "learning_rate": 4.226908786021049e-06, "loss": 1.0305, "step": 14818 }, { "epoch": 0.28, "learning_rate": 4.226798320980515e-06, "loss": 1.1721, "step": 14819 }, { "epoch": 0.28, "learning_rate": 4.226687849492169e-06, "loss": 0.9785, "step": 14820 }, { "epoch": 0.28, "learning_rate": 4.226577371556423e-06, "loss": 0.943, "step": 14821 }, { "epoch": 0.28, "learning_rate": 4.22646688717369e-06, "loss": 0.8806, "step": 14822 }, { "epoch": 0.28, "learning_rate": 4.226356396344383e-06, "loss": 0.9053, "step": 14823 }, { "epoch": 0.28, "learning_rate": 4.226245899068915e-06, "loss": 1.2712, "step": 14824 }, { "epoch": 0.28, "learning_rate": 4.226135395347696e-06, "loss": 0.9774, "step": 14825 }, { "epoch": 0.28, "learning_rate": 4.226024885181141e-06, "loss": 0.9919, "step": 14826 }, { "epoch": 0.28, "learning_rate": 4.225914368569663e-06, "loss": 0.8094, "step": 14827 }, { "epoch": 0.28, "learning_rate": 4.225803845513672e-06, "loss": 0.9877, "step": 14828 }, { "epoch": 0.28, "learning_rate": 4.225693316013583e-06, "loss": 0.8581, "step": 14829 }, { "epoch": 0.28, "learning_rate": 4.225582780069808e-06, "loss": 1.1552, "step": 14830 }, { "epoch": 0.28, "learning_rate": 4.225472237682761e-06, "loss": 0.986, "step": 14831 }, { "epoch": 0.28, "learning_rate": 4.225361688852851e-06, "loss": 1.0132, "step": 14832 }, { "epoch": 0.28, "learning_rate": 4.225251133580496e-06, "loss": 1.0262, "step": 14833 }, { "epoch": 0.28, "learning_rate": 4.225140571866105e-06, "loss": 0.905, "step": 14834 }, { "epoch": 0.28, "learning_rate": 4.225030003710091e-06, "loss": 0.9094, "step": 14835 }, { "epoch": 0.28, "learning_rate": 4.22491942911287e-06, "loss": 0.9721, "step": 14836 }, { "epoch": 0.28, "learning_rate": 4.224808848074852e-06, "loss": 1.1481, "step": 14837 }, { "epoch": 0.28, "learning_rate": 4.22469826059645e-06, "loss": 1.0352, "step": 14838 }, { "epoch": 0.28, "learning_rate": 4.224587666678077e-06, "loss": 0.9974, "step": 14839 }, { "epoch": 0.28, "learning_rate": 4.2244770663201475e-06, "loss": 0.9534, "step": 14840 }, { "epoch": 0.28, "learning_rate": 4.2243664595230735e-06, "loss": 0.9681, "step": 14841 }, { "epoch": 0.28, "learning_rate": 4.224255846287268e-06, "loss": 0.9355, "step": 14842 }, { "epoch": 0.28, "learning_rate": 4.2241452266131446e-06, "loss": 0.9486, "step": 14843 }, { "epoch": 0.28, "learning_rate": 4.224034600501115e-06, "loss": 1.207, "step": 14844 }, { "epoch": 0.28, "learning_rate": 4.223923967951593e-06, "loss": 0.9683, "step": 14845 }, { "epoch": 0.28, "learning_rate": 4.223813328964992e-06, "loss": 0.8647, "step": 14846 }, { "epoch": 0.28, "learning_rate": 4.2237026835417246e-06, "loss": 0.9686, "step": 14847 }, { "epoch": 0.28, "learning_rate": 4.223592031682205e-06, "loss": 0.7492, "step": 14848 }, { "epoch": 0.28, "learning_rate": 4.223481373386845e-06, "loss": 0.9753, "step": 14849 }, { "epoch": 0.28, "learning_rate": 4.2233707086560585e-06, "loss": 1.0434, "step": 14850 }, { "epoch": 0.28, "learning_rate": 4.223260037490259e-06, "loss": 1.0572, "step": 14851 }, { "epoch": 0.28, "learning_rate": 4.223149359889858e-06, "loss": 0.9906, "step": 14852 }, { "epoch": 0.28, "learning_rate": 4.223038675855272e-06, "loss": 0.8984, "step": 14853 }, { "epoch": 0.28, "learning_rate": 4.222927985386911e-06, "loss": 0.807, "step": 14854 }, { "epoch": 0.28, "learning_rate": 4.22281728848519e-06, "loss": 0.9717, "step": 14855 }, { "epoch": 0.28, "learning_rate": 4.222706585150522e-06, "loss": 0.9187, "step": 14856 }, { "epoch": 0.28, "learning_rate": 4.222595875383321e-06, "loss": 0.9567, "step": 14857 }, { "epoch": 0.28, "learning_rate": 4.222485159184e-06, "loss": 0.9226, "step": 14858 }, { "epoch": 0.28, "learning_rate": 4.2223744365529715e-06, "loss": 0.9816, "step": 14859 }, { "epoch": 0.28, "learning_rate": 4.2222637074906506e-06, "loss": 0.9155, "step": 14860 }, { "epoch": 0.28, "learning_rate": 4.222152971997449e-06, "loss": 0.8328, "step": 14861 }, { "epoch": 0.28, "learning_rate": 4.2220422300737804e-06, "loss": 1.1105, "step": 14862 }, { "epoch": 0.28, "learning_rate": 4.2219314817200605e-06, "loss": 0.9105, "step": 14863 }, { "epoch": 0.28, "learning_rate": 4.2218207269367e-06, "loss": 0.9698, "step": 14864 }, { "epoch": 0.28, "learning_rate": 4.221709965724114e-06, "loss": 0.9754, "step": 14865 }, { "epoch": 0.28, "learning_rate": 4.2215991980827155e-06, "loss": 0.9108, "step": 14866 }, { "epoch": 0.28, "learning_rate": 4.2214884240129195e-06, "loss": 0.9043, "step": 14867 }, { "epoch": 0.28, "learning_rate": 4.221377643515138e-06, "loss": 0.9294, "step": 14868 }, { "epoch": 0.28, "learning_rate": 4.221266856589784e-06, "loss": 1.0907, "step": 14869 }, { "epoch": 0.28, "learning_rate": 4.221156063237274e-06, "loss": 0.8757, "step": 14870 }, { "epoch": 0.28, "learning_rate": 4.221045263458019e-06, "loss": 0.8685, "step": 14871 }, { "epoch": 0.28, "learning_rate": 4.220934457252433e-06, "loss": 0.8647, "step": 14872 }, { "epoch": 0.28, "learning_rate": 4.220823644620933e-06, "loss": 0.8599, "step": 14873 }, { "epoch": 0.28, "learning_rate": 4.220712825563929e-06, "loss": 0.9871, "step": 14874 }, { "epoch": 0.28, "learning_rate": 4.220602000081835e-06, "loss": 1.0157, "step": 14875 }, { "epoch": 0.28, "learning_rate": 4.220491168175067e-06, "loss": 0.9792, "step": 14876 }, { "epoch": 0.28, "learning_rate": 4.220380329844037e-06, "loss": 0.9229, "step": 14877 }, { "epoch": 0.28, "learning_rate": 4.22026948508916e-06, "loss": 0.9329, "step": 14878 }, { "epoch": 0.28, "learning_rate": 4.22015863391085e-06, "loss": 0.9549, "step": 14879 }, { "epoch": 0.28, "learning_rate": 4.22004777630952e-06, "loss": 0.8719, "step": 14880 }, { "epoch": 0.28, "learning_rate": 4.219936912285584e-06, "loss": 1.0333, "step": 14881 }, { "epoch": 0.28, "learning_rate": 4.219826041839457e-06, "loss": 0.9874, "step": 14882 }, { "epoch": 0.28, "learning_rate": 4.219715164971552e-06, "loss": 0.9012, "step": 14883 }, { "epoch": 0.28, "learning_rate": 4.219604281682283e-06, "loss": 0.8431, "step": 14884 }, { "epoch": 0.28, "learning_rate": 4.219493391972065e-06, "loss": 0.8136, "step": 14885 }, { "epoch": 0.28, "learning_rate": 4.219382495841311e-06, "loss": 1.1475, "step": 14886 }, { "epoch": 0.28, "learning_rate": 4.219271593290435e-06, "loss": 1.1081, "step": 14887 }, { "epoch": 0.28, "learning_rate": 4.219160684319852e-06, "loss": 1.0428, "step": 14888 }, { "epoch": 0.28, "learning_rate": 4.219049768929976e-06, "loss": 0.9729, "step": 14889 }, { "epoch": 0.28, "learning_rate": 4.218938847121221e-06, "loss": 0.8601, "step": 14890 }, { "epoch": 0.28, "learning_rate": 4.218827918894e-06, "loss": 1.173, "step": 14891 }, { "epoch": 0.28, "learning_rate": 4.218716984248729e-06, "loss": 0.7342, "step": 14892 }, { "epoch": 0.28, "learning_rate": 4.218606043185821e-06, "loss": 0.8633, "step": 14893 }, { "epoch": 0.28, "learning_rate": 4.218495095705691e-06, "loss": 0.9977, "step": 14894 }, { "epoch": 0.28, "learning_rate": 4.218384141808753e-06, "loss": 0.9236, "step": 14895 }, { "epoch": 0.28, "learning_rate": 4.218273181495422e-06, "loss": 0.9064, "step": 14896 }, { "epoch": 0.28, "learning_rate": 4.218162214766111e-06, "loss": 0.9202, "step": 14897 }, { "epoch": 0.28, "learning_rate": 4.218051241621235e-06, "loss": 0.7603, "step": 14898 }, { "epoch": 0.28, "learning_rate": 4.217940262061209e-06, "loss": 1.0433, "step": 14899 }, { "epoch": 0.28, "learning_rate": 4.217829276086445e-06, "loss": 1.189, "step": 14900 }, { "epoch": 0.28, "learning_rate": 4.21771828369736e-06, "loss": 0.9783, "step": 14901 }, { "epoch": 0.28, "learning_rate": 4.217607284894368e-06, "loss": 0.8283, "step": 14902 }, { "epoch": 0.28, "learning_rate": 4.2174962796778834e-06, "loss": 0.7248, "step": 14903 }, { "epoch": 0.28, "learning_rate": 4.21738526804832e-06, "loss": 0.8137, "step": 14904 }, { "epoch": 0.28, "learning_rate": 4.2172742500060925e-06, "loss": 0.9264, "step": 14905 }, { "epoch": 0.28, "learning_rate": 4.217163225551616e-06, "loss": 1.2495, "step": 14906 }, { "epoch": 0.28, "learning_rate": 4.217052194685304e-06, "loss": 0.8422, "step": 14907 }, { "epoch": 0.28, "learning_rate": 4.216941157407572e-06, "loss": 0.7714, "step": 14908 }, { "epoch": 0.28, "learning_rate": 4.216830113718834e-06, "loss": 0.9676, "step": 14909 }, { "epoch": 0.28, "learning_rate": 4.2167190636195055e-06, "loss": 0.8795, "step": 14910 }, { "epoch": 0.28, "learning_rate": 4.216608007110001e-06, "loss": 0.9465, "step": 14911 }, { "epoch": 0.28, "learning_rate": 4.216496944190734e-06, "loss": 0.9307, "step": 14912 }, { "epoch": 0.28, "learning_rate": 4.2163858748621205e-06, "loss": 1.1714, "step": 14913 }, { "epoch": 0.28, "learning_rate": 4.216274799124574e-06, "loss": 0.8993, "step": 14914 }, { "epoch": 0.28, "learning_rate": 4.216163716978512e-06, "loss": 1.0477, "step": 14915 }, { "epoch": 0.28, "learning_rate": 4.2160526284243456e-06, "loss": 1.0568, "step": 14916 }, { "epoch": 0.28, "learning_rate": 4.215941533462491e-06, "loss": 0.8812, "step": 14917 }, { "epoch": 0.28, "learning_rate": 4.215830432093364e-06, "loss": 1.1858, "step": 14918 }, { "epoch": 0.28, "learning_rate": 4.215719324317379e-06, "loss": 0.9383, "step": 14919 }, { "epoch": 0.28, "learning_rate": 4.215608210134951e-06, "loss": 0.9793, "step": 14920 }, { "epoch": 0.28, "learning_rate": 4.2154970895464934e-06, "loss": 0.8397, "step": 14921 }, { "epoch": 0.28, "learning_rate": 4.215385962552423e-06, "loss": 0.9297, "step": 14922 }, { "epoch": 0.28, "learning_rate": 4.215274829153154e-06, "loss": 0.7961, "step": 14923 }, { "epoch": 0.28, "learning_rate": 4.215163689349101e-06, "loss": 0.9995, "step": 14924 }, { "epoch": 0.28, "learning_rate": 4.21505254314068e-06, "loss": 1.215, "step": 14925 }, { "epoch": 0.28, "learning_rate": 4.214941390528305e-06, "loss": 0.905, "step": 14926 }, { "epoch": 0.28, "learning_rate": 4.214830231512391e-06, "loss": 0.9577, "step": 14927 }, { "epoch": 0.28, "learning_rate": 4.214719066093355e-06, "loss": 0.9922, "step": 14928 }, { "epoch": 0.28, "learning_rate": 4.214607894271609e-06, "loss": 0.8938, "step": 14929 }, { "epoch": 0.28, "learning_rate": 4.21449671604757e-06, "loss": 0.8687, "step": 14930 }, { "epoch": 0.28, "learning_rate": 4.214385531421653e-06, "loss": 1.1072, "step": 14931 }, { "epoch": 0.28, "learning_rate": 4.214274340394273e-06, "loss": 0.9337, "step": 14932 }, { "epoch": 0.28, "learning_rate": 4.214163142965845e-06, "loss": 1.1456, "step": 14933 }, { "epoch": 0.28, "learning_rate": 4.214051939136785e-06, "loss": 0.9672, "step": 14934 }, { "epoch": 0.28, "learning_rate": 4.213940728907508e-06, "loss": 0.9069, "step": 14935 }, { "epoch": 0.28, "learning_rate": 4.213829512278427e-06, "loss": 0.8171, "step": 14936 }, { "epoch": 0.28, "learning_rate": 4.213718289249961e-06, "loss": 1.2197, "step": 14937 }, { "epoch": 0.28, "learning_rate": 4.2136070598225224e-06, "loss": 0.9974, "step": 14938 }, { "epoch": 0.28, "learning_rate": 4.213495823996528e-06, "loss": 0.9136, "step": 14939 }, { "epoch": 0.28, "learning_rate": 4.213384581772392e-06, "loss": 1.0405, "step": 14940 }, { "epoch": 0.28, "learning_rate": 4.213273333150531e-06, "loss": 0.9749, "step": 14941 }, { "epoch": 0.28, "learning_rate": 4.21316207813136e-06, "loss": 0.7716, "step": 14942 }, { "epoch": 0.28, "learning_rate": 4.213050816715295e-06, "loss": 1.1873, "step": 14943 }, { "epoch": 0.28, "learning_rate": 4.212939548902749e-06, "loss": 1.1335, "step": 14944 }, { "epoch": 0.28, "learning_rate": 4.2128282746941405e-06, "loss": 0.8018, "step": 14945 }, { "epoch": 0.28, "learning_rate": 4.212716994089884e-06, "loss": 0.968, "step": 14946 }, { "epoch": 0.28, "learning_rate": 4.212605707090394e-06, "loss": 0.8413, "step": 14947 }, { "epoch": 0.28, "learning_rate": 4.212494413696087e-06, "loss": 1.0488, "step": 14948 }, { "epoch": 0.28, "learning_rate": 4.212383113907379e-06, "loss": 1.1138, "step": 14949 }, { "epoch": 0.28, "learning_rate": 4.212271807724684e-06, "loss": 1.1798, "step": 14950 }, { "epoch": 0.28, "learning_rate": 4.212160495148419e-06, "loss": 0.9838, "step": 14951 }, { "epoch": 0.28, "learning_rate": 4.212049176178999e-06, "loss": 0.856, "step": 14952 }, { "epoch": 0.28, "learning_rate": 4.211937850816841e-06, "loss": 0.9093, "step": 14953 }, { "epoch": 0.28, "learning_rate": 4.211826519062359e-06, "loss": 0.8212, "step": 14954 }, { "epoch": 0.28, "learning_rate": 4.211715180915968e-06, "loss": 0.8864, "step": 14955 }, { "epoch": 0.28, "learning_rate": 4.211603836378086e-06, "loss": 1.129, "step": 14956 }, { "epoch": 0.28, "learning_rate": 4.211492485449128e-06, "loss": 1.0449, "step": 14957 }, { "epoch": 0.28, "learning_rate": 4.211381128129509e-06, "loss": 1.0053, "step": 14958 }, { "epoch": 0.28, "learning_rate": 4.211269764419645e-06, "loss": 0.9672, "step": 14959 }, { "epoch": 0.28, "learning_rate": 4.211158394319953e-06, "loss": 0.8254, "step": 14960 }, { "epoch": 0.28, "learning_rate": 4.2110470178308485e-06, "loss": 1.0942, "step": 14961 }, { "epoch": 0.28, "learning_rate": 4.210935634952745e-06, "loss": 0.8259, "step": 14962 }, { "epoch": 0.28, "learning_rate": 4.210824245686061e-06, "loss": 0.8897, "step": 14963 }, { "epoch": 0.28, "learning_rate": 4.210712850031213e-06, "loss": 0.7975, "step": 14964 }, { "epoch": 0.28, "learning_rate": 4.210601447988615e-06, "loss": 1.0626, "step": 14965 }, { "epoch": 0.28, "learning_rate": 4.210490039558683e-06, "loss": 0.8206, "step": 14966 }, { "epoch": 0.28, "learning_rate": 4.210378624741835e-06, "loss": 0.7847, "step": 14967 }, { "epoch": 0.28, "learning_rate": 4.210267203538484e-06, "loss": 0.9547, "step": 14968 }, { "epoch": 0.28, "learning_rate": 4.210155775949049e-06, "loss": 1.0789, "step": 14969 }, { "epoch": 0.28, "learning_rate": 4.210044341973944e-06, "loss": 0.7346, "step": 14970 }, { "epoch": 0.28, "learning_rate": 4.2099329016135855e-06, "loss": 0.7319, "step": 14971 }, { "epoch": 0.28, "learning_rate": 4.209821454868392e-06, "loss": 1.0175, "step": 14972 }, { "epoch": 0.28, "learning_rate": 4.209710001738775e-06, "loss": 0.7658, "step": 14973 }, { "epoch": 0.28, "learning_rate": 4.209598542225154e-06, "loss": 0.9448, "step": 14974 }, { "epoch": 0.28, "learning_rate": 4.209487076327945e-06, "loss": 0.9395, "step": 14975 }, { "epoch": 0.28, "learning_rate": 4.209375604047564e-06, "loss": 0.952, "step": 14976 }, { "epoch": 0.28, "learning_rate": 4.209264125384427e-06, "loss": 0.8966, "step": 14977 }, { "epoch": 0.28, "learning_rate": 4.209152640338949e-06, "loss": 0.8565, "step": 14978 }, { "epoch": 0.28, "learning_rate": 4.209041148911548e-06, "loss": 0.9073, "step": 14979 }, { "epoch": 0.28, "learning_rate": 4.20892965110264e-06, "loss": 1.0714, "step": 14980 }, { "epoch": 0.28, "learning_rate": 4.208818146912641e-06, "loss": 1.0666, "step": 14981 }, { "epoch": 0.28, "learning_rate": 4.2087066363419675e-06, "loss": 0.8996, "step": 14982 }, { "epoch": 0.28, "learning_rate": 4.208595119391036e-06, "loss": 0.9142, "step": 14983 }, { "epoch": 0.28, "learning_rate": 4.208483596060262e-06, "loss": 0.7858, "step": 14984 }, { "epoch": 0.28, "learning_rate": 4.208372066350063e-06, "loss": 0.7601, "step": 14985 }, { "epoch": 0.28, "learning_rate": 4.208260530260855e-06, "loss": 0.8807, "step": 14986 }, { "epoch": 0.28, "learning_rate": 4.2081489877930544e-06, "loss": 1.0911, "step": 14987 }, { "epoch": 0.28, "learning_rate": 4.2080374389470775e-06, "loss": 1.1459, "step": 14988 }, { "epoch": 0.28, "learning_rate": 4.207925883723342e-06, "loss": 0.9222, "step": 14989 }, { "epoch": 0.28, "learning_rate": 4.207814322122264e-06, "loss": 0.7769, "step": 14990 }, { "epoch": 0.28, "learning_rate": 4.207702754144259e-06, "loss": 1.0449, "step": 14991 }, { "epoch": 0.28, "learning_rate": 4.207591179789744e-06, "loss": 0.7997, "step": 14992 }, { "epoch": 0.28, "learning_rate": 4.207479599059137e-06, "loss": 0.8988, "step": 14993 }, { "epoch": 0.28, "learning_rate": 4.207368011952853e-06, "loss": 0.9805, "step": 14994 }, { "epoch": 0.28, "learning_rate": 4.207256418471308e-06, "loss": 1.0559, "step": 14995 }, { "epoch": 0.28, "learning_rate": 4.207144818614921e-06, "loss": 0.9336, "step": 14996 }, { "epoch": 0.28, "learning_rate": 4.207033212384108e-06, "loss": 0.7997, "step": 14997 }, { "epoch": 0.28, "learning_rate": 4.206921599779284e-06, "loss": 0.7988, "step": 14998 }, { "epoch": 0.28, "learning_rate": 4.206809980800867e-06, "loss": 1.0803, "step": 14999 }, { "epoch": 0.28, "learning_rate": 4.2066983554492756e-06, "loss": 0.8824, "step": 15000 }, { "epoch": 0.28, "learning_rate": 4.206586723724924e-06, "loss": 1.0793, "step": 15001 }, { "epoch": 0.28, "learning_rate": 4.2064750856282295e-06, "loss": 0.9258, "step": 15002 }, { "epoch": 0.28, "learning_rate": 4.20636344115961e-06, "loss": 0.9303, "step": 15003 }, { "epoch": 0.28, "learning_rate": 4.206251790319481e-06, "loss": 0.7136, "step": 15004 }, { "epoch": 0.28, "learning_rate": 4.206140133108261e-06, "loss": 1.0398, "step": 15005 }, { "epoch": 0.28, "learning_rate": 4.206028469526366e-06, "loss": 1.1201, "step": 15006 }, { "epoch": 0.28, "learning_rate": 4.205916799574212e-06, "loss": 1.0708, "step": 15007 }, { "epoch": 0.28, "learning_rate": 4.205805123252218e-06, "loss": 0.9774, "step": 15008 }, { "epoch": 0.28, "learning_rate": 4.2056934405607995e-06, "loss": 0.9825, "step": 15009 }, { "epoch": 0.28, "learning_rate": 4.205581751500374e-06, "loss": 0.8328, "step": 15010 }, { "epoch": 0.28, "learning_rate": 4.205470056071359e-06, "loss": 0.9133, "step": 15011 }, { "epoch": 0.28, "learning_rate": 4.20535835427417e-06, "loss": 0.9988, "step": 15012 }, { "epoch": 0.28, "learning_rate": 4.205246646109227e-06, "loss": 0.8923, "step": 15013 }, { "epoch": 0.28, "learning_rate": 4.205134931576943e-06, "loss": 1.0748, "step": 15014 }, { "epoch": 0.28, "learning_rate": 4.205023210677739e-06, "loss": 0.7761, "step": 15015 }, { "epoch": 0.28, "learning_rate": 4.20491148341203e-06, "loss": 1.0663, "step": 15016 }, { "epoch": 0.28, "learning_rate": 4.204799749780234e-06, "loss": 0.8846, "step": 15017 }, { "epoch": 0.28, "learning_rate": 4.204688009782768e-06, "loss": 1.0195, "step": 15018 }, { "epoch": 0.28, "learning_rate": 4.204576263420049e-06, "loss": 1.1453, "step": 15019 }, { "epoch": 0.28, "learning_rate": 4.2044645106924955e-06, "loss": 0.9734, "step": 15020 }, { "epoch": 0.28, "learning_rate": 4.204352751600523e-06, "loss": 0.9774, "step": 15021 }, { "epoch": 0.28, "learning_rate": 4.204240986144549e-06, "loss": 1.0217, "step": 15022 }, { "epoch": 0.28, "learning_rate": 4.2041292143249926e-06, "loss": 0.8892, "step": 15023 }, { "epoch": 0.28, "learning_rate": 4.204017436142269e-06, "loss": 1.0947, "step": 15024 }, { "epoch": 0.28, "learning_rate": 4.2039056515967965e-06, "loss": 1.0751, "step": 15025 }, { "epoch": 0.28, "learning_rate": 4.203793860688994e-06, "loss": 0.9657, "step": 15026 }, { "epoch": 0.28, "learning_rate": 4.203682063419276e-06, "loss": 0.9493, "step": 15027 }, { "epoch": 0.28, "learning_rate": 4.203570259788062e-06, "loss": 1.0808, "step": 15028 }, { "epoch": 0.28, "learning_rate": 4.203458449795769e-06, "loss": 0.7352, "step": 15029 }, { "epoch": 0.28, "learning_rate": 4.203346633442814e-06, "loss": 0.9194, "step": 15030 }, { "epoch": 0.28, "learning_rate": 4.203234810729615e-06, "loss": 1.0516, "step": 15031 }, { "epoch": 0.28, "learning_rate": 4.20312298165659e-06, "loss": 0.9073, "step": 15032 }, { "epoch": 0.28, "learning_rate": 4.203011146224155e-06, "loss": 0.8629, "step": 15033 }, { "epoch": 0.28, "learning_rate": 4.20289930443273e-06, "loss": 0.9559, "step": 15034 }, { "epoch": 0.28, "learning_rate": 4.2027874562827295e-06, "loss": 0.8929, "step": 15035 }, { "epoch": 0.28, "learning_rate": 4.202675601774574e-06, "loss": 0.8914, "step": 15036 }, { "epoch": 0.28, "learning_rate": 4.202563740908679e-06, "loss": 1.0792, "step": 15037 }, { "epoch": 0.28, "learning_rate": 4.202451873685463e-06, "loss": 1.1296, "step": 15038 }, { "epoch": 0.28, "learning_rate": 4.202340000105345e-06, "loss": 0.9627, "step": 15039 }, { "epoch": 0.28, "learning_rate": 4.202228120168742e-06, "loss": 0.9128, "step": 15040 }, { "epoch": 0.28, "learning_rate": 4.202116233876071e-06, "loss": 0.864, "step": 15041 }, { "epoch": 0.28, "learning_rate": 4.20200434122775e-06, "loss": 1.0498, "step": 15042 }, { "epoch": 0.28, "learning_rate": 4.201892442224196e-06, "loss": 1.2314, "step": 15043 }, { "epoch": 0.28, "learning_rate": 4.201780536865829e-06, "loss": 1.0862, "step": 15044 }, { "epoch": 0.28, "learning_rate": 4.2016686251530656e-06, "loss": 0.962, "step": 15045 }, { "epoch": 0.28, "learning_rate": 4.201556707086323e-06, "loss": 0.866, "step": 15046 }, { "epoch": 0.28, "learning_rate": 4.201444782666021e-06, "loss": 0.8222, "step": 15047 }, { "epoch": 0.28, "learning_rate": 4.201332851892576e-06, "loss": 0.9985, "step": 15048 }, { "epoch": 0.28, "learning_rate": 4.2012209147664055e-06, "loss": 0.8145, "step": 15049 }, { "epoch": 0.28, "learning_rate": 4.2011089712879285e-06, "loss": 0.9316, "step": 15050 }, { "epoch": 0.28, "learning_rate": 4.200997021457563e-06, "loss": 0.9832, "step": 15051 }, { "epoch": 0.28, "learning_rate": 4.200885065275726e-06, "loss": 0.972, "step": 15052 }, { "epoch": 0.28, "learning_rate": 4.2007731027428374e-06, "loss": 0.9393, "step": 15053 }, { "epoch": 0.28, "learning_rate": 4.200661133859314e-06, "loss": 0.7092, "step": 15054 }, { "epoch": 0.28, "learning_rate": 4.200549158625574e-06, "loss": 1.0453, "step": 15055 }, { "epoch": 0.28, "learning_rate": 4.200437177042036e-06, "loss": 1.1877, "step": 15056 }, { "epoch": 0.28, "learning_rate": 4.2003251891091165e-06, "loss": 0.9851, "step": 15057 }, { "epoch": 0.28, "learning_rate": 4.200213194827236e-06, "loss": 0.6554, "step": 15058 }, { "epoch": 0.28, "learning_rate": 4.200101194196811e-06, "loss": 0.7879, "step": 15059 }, { "epoch": 0.28, "learning_rate": 4.19998918721826e-06, "loss": 1.0743, "step": 15060 }, { "epoch": 0.28, "learning_rate": 4.199877173892002e-06, "loss": 0.8864, "step": 15061 }, { "epoch": 0.28, "learning_rate": 4.199765154218455e-06, "loss": 1.1125, "step": 15062 }, { "epoch": 0.28, "learning_rate": 4.199653128198037e-06, "loss": 0.9625, "step": 15063 }, { "epoch": 0.28, "learning_rate": 4.199541095831165e-06, "loss": 0.8193, "step": 15064 }, { "epoch": 0.28, "learning_rate": 4.199429057118261e-06, "loss": 0.8804, "step": 15065 }, { "epoch": 0.28, "learning_rate": 4.19931701205974e-06, "loss": 0.8649, "step": 15066 }, { "epoch": 0.28, "learning_rate": 4.19920496065602e-06, "loss": 0.8702, "step": 15067 }, { "epoch": 0.28, "learning_rate": 4.199092902907522e-06, "loss": 1.0616, "step": 15068 }, { "epoch": 0.28, "learning_rate": 4.198980838814663e-06, "loss": 1.0032, "step": 15069 }, { "epoch": 0.28, "learning_rate": 4.198868768377861e-06, "loss": 1.0364, "step": 15070 }, { "epoch": 0.28, "learning_rate": 4.198756691597537e-06, "loss": 0.678, "step": 15071 }, { "epoch": 0.28, "learning_rate": 4.198644608474106e-06, "loss": 0.7551, "step": 15072 }, { "epoch": 0.28, "learning_rate": 4.198532519007989e-06, "loss": 1.0229, "step": 15073 }, { "epoch": 0.28, "learning_rate": 4.198420423199603e-06, "loss": 1.1556, "step": 15074 }, { "epoch": 0.28, "learning_rate": 4.198308321049367e-06, "loss": 1.2008, "step": 15075 }, { "epoch": 0.28, "learning_rate": 4.1981962125577e-06, "loss": 0.8446, "step": 15076 }, { "epoch": 0.28, "learning_rate": 4.198084097725021e-06, "loss": 0.978, "step": 15077 }, { "epoch": 0.28, "learning_rate": 4.197971976551747e-06, "loss": 1.0056, "step": 15078 }, { "epoch": 0.28, "learning_rate": 4.197859849038299e-06, "loss": 0.9437, "step": 15079 }, { "epoch": 0.28, "learning_rate": 4.197747715185093e-06, "loss": 1.0175, "step": 15080 }, { "epoch": 0.28, "learning_rate": 4.19763557499255e-06, "loss": 0.9569, "step": 15081 }, { "epoch": 0.28, "learning_rate": 4.197523428461087e-06, "loss": 0.924, "step": 15082 }, { "epoch": 0.28, "learning_rate": 4.197411275591125e-06, "loss": 0.8121, "step": 15083 }, { "epoch": 0.28, "learning_rate": 4.197299116383081e-06, "loss": 1.0571, "step": 15084 }, { "epoch": 0.28, "learning_rate": 4.197186950837373e-06, "loss": 1.0427, "step": 15085 }, { "epoch": 0.28, "learning_rate": 4.197074778954422e-06, "loss": 1.0768, "step": 15086 }, { "epoch": 0.28, "learning_rate": 4.196962600734646e-06, "loss": 0.9454, "step": 15087 }, { "epoch": 0.28, "learning_rate": 4.196850416178463e-06, "loss": 1.0358, "step": 15088 }, { "epoch": 0.28, "learning_rate": 4.196738225286292e-06, "loss": 0.8447, "step": 15089 }, { "epoch": 0.28, "learning_rate": 4.1966260280585534e-06, "loss": 0.7538, "step": 15090 }, { "epoch": 0.28, "learning_rate": 4.196513824495665e-06, "loss": 0.8939, "step": 15091 }, { "epoch": 0.28, "learning_rate": 4.196401614598045e-06, "loss": 1.0178, "step": 15092 }, { "epoch": 0.28, "learning_rate": 4.196289398366115e-06, "loss": 1.0881, "step": 15093 }, { "epoch": 0.28, "learning_rate": 4.1961771758002925e-06, "loss": 1.0009, "step": 15094 }, { "epoch": 0.28, "learning_rate": 4.196064946900995e-06, "loss": 0.945, "step": 15095 }, { "epoch": 0.28, "learning_rate": 4.195952711668644e-06, "loss": 0.6648, "step": 15096 }, { "epoch": 0.28, "learning_rate": 4.195840470103657e-06, "loss": 0.9104, "step": 15097 }, { "epoch": 0.28, "learning_rate": 4.1957282222064545e-06, "loss": 1.0762, "step": 15098 }, { "epoch": 0.28, "learning_rate": 4.195615967977454e-06, "loss": 1.2263, "step": 15099 }, { "epoch": 0.28, "learning_rate": 4.1955037074170755e-06, "loss": 1.1504, "step": 15100 }, { "epoch": 0.28, "learning_rate": 4.195391440525738e-06, "loss": 0.9021, "step": 15101 }, { "epoch": 0.28, "learning_rate": 4.195279167303862e-06, "loss": 0.8163, "step": 15102 }, { "epoch": 0.28, "learning_rate": 4.1951668877518645e-06, "loss": 0.8548, "step": 15103 }, { "epoch": 0.28, "learning_rate": 4.195054601870166e-06, "loss": 0.7863, "step": 15104 }, { "epoch": 0.28, "learning_rate": 4.194942309659186e-06, "loss": 0.9595, "step": 15105 }, { "epoch": 0.29, "learning_rate": 4.194830011119343e-06, "loss": 1.2168, "step": 15106 }, { "epoch": 0.29, "learning_rate": 4.194717706251057e-06, "loss": 0.9859, "step": 15107 }, { "epoch": 0.29, "learning_rate": 4.194605395054746e-06, "loss": 0.8231, "step": 15108 }, { "epoch": 0.29, "learning_rate": 4.194493077530832e-06, "loss": 0.9547, "step": 15109 }, { "epoch": 0.29, "learning_rate": 4.194380753679731e-06, "loss": 0.8991, "step": 15110 }, { "epoch": 0.29, "learning_rate": 4.1942684235018655e-06, "loss": 0.982, "step": 15111 }, { "epoch": 0.29, "learning_rate": 4.194156086997654e-06, "loss": 0.9441, "step": 15112 }, { "epoch": 0.29, "learning_rate": 4.194043744167515e-06, "loss": 0.8418, "step": 15113 }, { "epoch": 0.29, "learning_rate": 4.193931395011868e-06, "loss": 1.2091, "step": 15114 }, { "epoch": 0.29, "learning_rate": 4.193819039531134e-06, "loss": 0.8063, "step": 15115 }, { "epoch": 0.29, "learning_rate": 4.193706677725732e-06, "loss": 0.9549, "step": 15116 }, { "epoch": 0.29, "learning_rate": 4.1935943095960795e-06, "loss": 0.864, "step": 15117 }, { "epoch": 0.29, "learning_rate": 4.1934819351426e-06, "loss": 0.9693, "step": 15118 }, { "epoch": 0.29, "learning_rate": 4.19336955436571e-06, "loss": 0.9965, "step": 15119 }, { "epoch": 0.29, "learning_rate": 4.193257167265828e-06, "loss": 0.7717, "step": 15120 }, { "epoch": 0.29, "learning_rate": 4.193144773843378e-06, "loss": 0.8845, "step": 15121 }, { "epoch": 0.29, "learning_rate": 4.193032374098777e-06, "loss": 0.8435, "step": 15122 }, { "epoch": 0.29, "learning_rate": 4.192919968032444e-06, "loss": 0.8614, "step": 15123 }, { "epoch": 0.29, "learning_rate": 4.192807555644801e-06, "loss": 1.1324, "step": 15124 }, { "epoch": 0.29, "learning_rate": 4.192695136936266e-06, "loss": 1.0713, "step": 15125 }, { "epoch": 0.29, "learning_rate": 4.1925827119072595e-06, "loss": 0.8638, "step": 15126 }, { "epoch": 0.29, "learning_rate": 4.1924702805582005e-06, "loss": 0.7918, "step": 15127 }, { "epoch": 0.29, "learning_rate": 4.192357842889509e-06, "loss": 0.8569, "step": 15128 }, { "epoch": 0.29, "learning_rate": 4.192245398901606e-06, "loss": 0.9633, "step": 15129 }, { "epoch": 0.29, "learning_rate": 4.192132948594911e-06, "loss": 0.8999, "step": 15130 }, { "epoch": 0.29, "learning_rate": 4.192020491969842e-06, "loss": 1.0612, "step": 15131 }, { "epoch": 0.29, "learning_rate": 4.191908029026822e-06, "loss": 0.8492, "step": 15132 }, { "epoch": 0.29, "learning_rate": 4.191795559766268e-06, "loss": 0.7607, "step": 15133 }, { "epoch": 0.29, "learning_rate": 4.191683084188602e-06, "loss": 0.9595, "step": 15134 }, { "epoch": 0.29, "learning_rate": 4.191570602294243e-06, "loss": 0.7708, "step": 15135 }, { "epoch": 0.29, "learning_rate": 4.191458114083611e-06, "loss": 0.8817, "step": 15136 }, { "epoch": 0.29, "learning_rate": 4.191345619557127e-06, "loss": 1.1151, "step": 15137 }, { "epoch": 0.29, "learning_rate": 4.191233118715209e-06, "loss": 1.1004, "step": 15138 }, { "epoch": 0.29, "learning_rate": 4.19112061155828e-06, "loss": 0.8864, "step": 15139 }, { "epoch": 0.29, "learning_rate": 4.191008098086757e-06, "loss": 0.9238, "step": 15140 }, { "epoch": 0.29, "learning_rate": 4.1908955783010624e-06, "loss": 0.9163, "step": 15141 }, { "epoch": 0.29, "learning_rate": 4.1907830522016155e-06, "loss": 0.9813, "step": 15142 }, { "epoch": 0.29, "learning_rate": 4.1906705197888365e-06, "loss": 1.015, "step": 15143 }, { "epoch": 0.29, "learning_rate": 4.1905579810631456e-06, "loss": 1.1536, "step": 15144 }, { "epoch": 0.29, "learning_rate": 4.190445436024963e-06, "loss": 0.9049, "step": 15145 }, { "epoch": 0.29, "learning_rate": 4.190332884674709e-06, "loss": 0.9037, "step": 15146 }, { "epoch": 0.29, "learning_rate": 4.190220327012804e-06, "loss": 1.0143, "step": 15147 }, { "epoch": 0.29, "learning_rate": 4.190107763039668e-06, "loss": 0.7996, "step": 15148 }, { "epoch": 0.29, "learning_rate": 4.189995192755721e-06, "loss": 1.2453, "step": 15149 }, { "epoch": 0.29, "learning_rate": 4.1898826161613834e-06, "loss": 1.1789, "step": 15150 }, { "epoch": 0.29, "learning_rate": 4.189770033257078e-06, "loss": 0.7557, "step": 15151 }, { "epoch": 0.29, "learning_rate": 4.189657444043222e-06, "loss": 1.0318, "step": 15152 }, { "epoch": 0.29, "learning_rate": 4.189544848520236e-06, "loss": 0.855, "step": 15153 }, { "epoch": 0.29, "learning_rate": 4.189432246688542e-06, "loss": 0.7982, "step": 15154 }, { "epoch": 0.29, "learning_rate": 4.18931963854856e-06, "loss": 0.8698, "step": 15155 }, { "epoch": 0.29, "learning_rate": 4.18920702410071e-06, "loss": 1.1577, "step": 15156 }, { "epoch": 0.29, "learning_rate": 4.189094403345413e-06, "loss": 1.1048, "step": 15157 }, { "epoch": 0.29, "learning_rate": 4.188981776283089e-06, "loss": 0.8437, "step": 15158 }, { "epoch": 0.29, "learning_rate": 4.1888691429141585e-06, "loss": 0.8983, "step": 15159 }, { "epoch": 0.29, "learning_rate": 4.188756503239043e-06, "loss": 0.8006, "step": 15160 }, { "epoch": 0.29, "learning_rate": 4.188643857258162e-06, "loss": 0.7634, "step": 15161 }, { "epoch": 0.29, "learning_rate": 4.188531204971937e-06, "loss": 1.1707, "step": 15162 }, { "epoch": 0.29, "learning_rate": 4.1884185463807885e-06, "loss": 1.0416, "step": 15163 }, { "epoch": 0.29, "learning_rate": 4.188305881485137e-06, "loss": 1.0522, "step": 15164 }, { "epoch": 0.29, "learning_rate": 4.188193210285402e-06, "loss": 0.8165, "step": 15165 }, { "epoch": 0.29, "learning_rate": 4.188080532782006e-06, "loss": 0.8431, "step": 15166 }, { "epoch": 0.29, "learning_rate": 4.187967848975369e-06, "loss": 0.735, "step": 15167 }, { "epoch": 0.29, "learning_rate": 4.187855158865912e-06, "loss": 0.9602, "step": 15168 }, { "epoch": 0.29, "learning_rate": 4.187742462454056e-06, "loss": 1.0615, "step": 15169 }, { "epoch": 0.29, "learning_rate": 4.187629759740221e-06, "loss": 0.8396, "step": 15170 }, { "epoch": 0.29, "learning_rate": 4.187517050724827e-06, "loss": 0.8535, "step": 15171 }, { "epoch": 0.29, "learning_rate": 4.187404335408298e-06, "loss": 1.0312, "step": 15172 }, { "epoch": 0.29, "learning_rate": 4.187291613791052e-06, "loss": 1.0054, "step": 15173 }, { "epoch": 0.29, "learning_rate": 4.187178885873511e-06, "loss": 1.0352, "step": 15174 }, { "epoch": 0.29, "learning_rate": 4.187066151656096e-06, "loss": 1.1063, "step": 15175 }, { "epoch": 0.29, "learning_rate": 4.186953411139227e-06, "loss": 1.0198, "step": 15176 }, { "epoch": 0.29, "learning_rate": 4.1868406643233265e-06, "loss": 0.944, "step": 15177 }, { "epoch": 0.29, "learning_rate": 4.186727911208814e-06, "loss": 1.0142, "step": 15178 }, { "epoch": 0.29, "learning_rate": 4.186615151796112e-06, "loss": 0.7513, "step": 15179 }, { "epoch": 0.29, "learning_rate": 4.1865023860856406e-06, "loss": 0.8478, "step": 15180 }, { "epoch": 0.29, "learning_rate": 4.18638961407782e-06, "loss": 0.8568, "step": 15181 }, { "epoch": 0.29, "learning_rate": 4.186276835773073e-06, "loss": 0.9755, "step": 15182 }, { "epoch": 0.29, "learning_rate": 4.186164051171821e-06, "loss": 0.9951, "step": 15183 }, { "epoch": 0.29, "learning_rate": 4.186051260274482e-06, "loss": 0.9155, "step": 15184 }, { "epoch": 0.29, "learning_rate": 4.185938463081481e-06, "loss": 0.9212, "step": 15185 }, { "epoch": 0.29, "learning_rate": 4.185825659593237e-06, "loss": 0.8683, "step": 15186 }, { "epoch": 0.29, "learning_rate": 4.185712849810171e-06, "loss": 1.1403, "step": 15187 }, { "epoch": 0.29, "learning_rate": 4.185600033732705e-06, "loss": 0.8871, "step": 15188 }, { "epoch": 0.29, "learning_rate": 4.185487211361261e-06, "loss": 1.0884, "step": 15189 }, { "epoch": 0.29, "learning_rate": 4.185374382696259e-06, "loss": 0.9836, "step": 15190 }, { "epoch": 0.29, "learning_rate": 4.1852615477381205e-06, "loss": 0.8549, "step": 15191 }, { "epoch": 0.29, "learning_rate": 4.185148706487268e-06, "loss": 0.7844, "step": 15192 }, { "epoch": 0.29, "learning_rate": 4.185035858944121e-06, "loss": 0.9739, "step": 15193 }, { "epoch": 0.29, "learning_rate": 4.184923005109102e-06, "loss": 1.1085, "step": 15194 }, { "epoch": 0.29, "learning_rate": 4.184810144982632e-06, "loss": 0.8853, "step": 15195 }, { "epoch": 0.29, "learning_rate": 4.184697278565132e-06, "loss": 0.8958, "step": 15196 }, { "epoch": 0.29, "learning_rate": 4.184584405857025e-06, "loss": 0.8707, "step": 15197 }, { "epoch": 0.29, "learning_rate": 4.184471526858731e-06, "loss": 0.8478, "step": 15198 }, { "epoch": 0.29, "learning_rate": 4.184358641570673e-06, "loss": 1.0071, "step": 15199 }, { "epoch": 0.29, "learning_rate": 4.18424574999327e-06, "loss": 1.0396, "step": 15200 }, { "epoch": 0.29, "learning_rate": 4.184132852126945e-06, "loss": 0.9968, "step": 15201 }, { "epoch": 0.29, "learning_rate": 4.184019947972121e-06, "loss": 0.9618, "step": 15202 }, { "epoch": 0.29, "learning_rate": 4.183907037529217e-06, "loss": 0.9221, "step": 15203 }, { "epoch": 0.29, "learning_rate": 4.183794120798657e-06, "loss": 0.8908, "step": 15204 }, { "epoch": 0.29, "learning_rate": 4.18368119778086e-06, "loss": 0.9145, "step": 15205 }, { "epoch": 0.29, "learning_rate": 4.183568268476249e-06, "loss": 1.2926, "step": 15206 }, { "epoch": 0.29, "learning_rate": 4.183455332885247e-06, "loss": 0.9918, "step": 15207 }, { "epoch": 0.29, "learning_rate": 4.1833423910082725e-06, "loss": 1.0103, "step": 15208 }, { "epoch": 0.29, "learning_rate": 4.183229442845751e-06, "loss": 0.8705, "step": 15209 }, { "epoch": 0.29, "learning_rate": 4.183116488398102e-06, "loss": 0.8898, "step": 15210 }, { "epoch": 0.29, "learning_rate": 4.183003527665747e-06, "loss": 0.8544, "step": 15211 }, { "epoch": 0.29, "learning_rate": 4.182890560649108e-06, "loss": 1.1436, "step": 15212 }, { "epoch": 0.29, "learning_rate": 4.182777587348608e-06, "loss": 1.032, "step": 15213 }, { "epoch": 0.29, "learning_rate": 4.182664607764668e-06, "loss": 0.8811, "step": 15214 }, { "epoch": 0.29, "learning_rate": 4.18255162189771e-06, "loss": 0.8712, "step": 15215 }, { "epoch": 0.29, "learning_rate": 4.1824386297481565e-06, "loss": 0.9234, "step": 15216 }, { "epoch": 0.29, "learning_rate": 4.182325631316427e-06, "loss": 0.9629, "step": 15217 }, { "epoch": 0.29, "learning_rate": 4.182212626602947e-06, "loss": 0.9821, "step": 15218 }, { "epoch": 0.29, "learning_rate": 4.182099615608136e-06, "loss": 1.1124, "step": 15219 }, { "epoch": 0.29, "learning_rate": 4.181986598332416e-06, "loss": 0.9588, "step": 15220 }, { "epoch": 0.29, "learning_rate": 4.18187357477621e-06, "loss": 0.7054, "step": 15221 }, { "epoch": 0.29, "learning_rate": 4.18176054493994e-06, "loss": 0.8895, "step": 15222 }, { "epoch": 0.29, "learning_rate": 4.181647508824027e-06, "loss": 0.8206, "step": 15223 }, { "epoch": 0.29, "learning_rate": 4.1815344664288934e-06, "loss": 1.0391, "step": 15224 }, { "epoch": 0.29, "learning_rate": 4.1814214177549626e-06, "loss": 1.1108, "step": 15225 }, { "epoch": 0.29, "learning_rate": 4.181308362802657e-06, "loss": 0.9607, "step": 15226 }, { "epoch": 0.29, "learning_rate": 4.181195301572395e-06, "loss": 0.9558, "step": 15227 }, { "epoch": 0.29, "learning_rate": 4.181082234064603e-06, "loss": 0.8793, "step": 15228 }, { "epoch": 0.29, "learning_rate": 4.180969160279701e-06, "loss": 0.7693, "step": 15229 }, { "epoch": 0.29, "learning_rate": 4.180856080218111e-06, "loss": 1.1328, "step": 15230 }, { "epoch": 0.29, "learning_rate": 4.180742993880257e-06, "loss": 1.1401, "step": 15231 }, { "epoch": 0.29, "learning_rate": 4.180629901266559e-06, "loss": 0.7732, "step": 15232 }, { "epoch": 0.29, "learning_rate": 4.180516802377441e-06, "loss": 0.8563, "step": 15233 }, { "epoch": 0.29, "learning_rate": 4.180403697213325e-06, "loss": 0.9822, "step": 15234 }, { "epoch": 0.29, "learning_rate": 4.180290585774633e-06, "loss": 0.8974, "step": 15235 }, { "epoch": 0.29, "learning_rate": 4.180177468061788e-06, "loss": 1.1069, "step": 15236 }, { "epoch": 0.29, "learning_rate": 4.180064344075212e-06, "loss": 1.2682, "step": 15237 }, { "epoch": 0.29, "learning_rate": 4.1799512138153265e-06, "loss": 0.9486, "step": 15238 }, { "epoch": 0.29, "learning_rate": 4.179838077282554e-06, "loss": 0.9224, "step": 15239 }, { "epoch": 0.29, "learning_rate": 4.179724934477319e-06, "loss": 0.8778, "step": 15240 }, { "epoch": 0.29, "learning_rate": 4.1796117854000414e-06, "loss": 0.9816, "step": 15241 }, { "epoch": 0.29, "learning_rate": 4.179498630051146e-06, "loss": 0.8954, "step": 15242 }, { "epoch": 0.29, "learning_rate": 4.179385468431054e-06, "loss": 1.0091, "step": 15243 }, { "epoch": 0.29, "learning_rate": 4.1792723005401875e-06, "loss": 1.045, "step": 15244 }, { "epoch": 0.29, "learning_rate": 4.17915912637897e-06, "loss": 0.9532, "step": 15245 }, { "epoch": 0.29, "learning_rate": 4.179045945947824e-06, "loss": 0.9028, "step": 15246 }, { "epoch": 0.29, "learning_rate": 4.178932759247172e-06, "loss": 1.0148, "step": 15247 }, { "epoch": 0.29, "learning_rate": 4.178819566277436e-06, "loss": 1.0753, "step": 15248 }, { "epoch": 0.29, "learning_rate": 4.17870636703904e-06, "loss": 1.1094, "step": 15249 }, { "epoch": 0.29, "learning_rate": 4.178593161532405e-06, "loss": 1.2535, "step": 15250 }, { "epoch": 0.29, "learning_rate": 4.1784799497579555e-06, "loss": 0.8288, "step": 15251 }, { "epoch": 0.29, "learning_rate": 4.178366731716113e-06, "loss": 1.1507, "step": 15252 }, { "epoch": 0.29, "learning_rate": 4.1782535074073e-06, "loss": 1.0005, "step": 15253 }, { "epoch": 0.29, "learning_rate": 4.17814027683194e-06, "loss": 0.8436, "step": 15254 }, { "epoch": 0.29, "learning_rate": 4.178027039990457e-06, "loss": 1.0132, "step": 15255 }, { "epoch": 0.29, "learning_rate": 4.1779137968832715e-06, "loss": 1.056, "step": 15256 }, { "epoch": 0.29, "learning_rate": 4.177800547510807e-06, "loss": 1.1308, "step": 15257 }, { "epoch": 0.29, "learning_rate": 4.177687291873487e-06, "loss": 0.8939, "step": 15258 }, { "epoch": 0.29, "learning_rate": 4.177574029971735e-06, "loss": 0.8449, "step": 15259 }, { "epoch": 0.29, "learning_rate": 4.177460761805972e-06, "loss": 0.7661, "step": 15260 }, { "epoch": 0.29, "learning_rate": 4.177347487376622e-06, "loss": 0.7249, "step": 15261 }, { "epoch": 0.29, "learning_rate": 4.177234206684107e-06, "loss": 1.014, "step": 15262 }, { "epoch": 0.29, "learning_rate": 4.177120919728853e-06, "loss": 0.9343, "step": 15263 }, { "epoch": 0.29, "learning_rate": 4.177007626511279e-06, "loss": 0.9377, "step": 15264 }, { "epoch": 0.29, "learning_rate": 4.17689432703181e-06, "loss": 0.8354, "step": 15265 }, { "epoch": 0.29, "learning_rate": 4.176781021290871e-06, "loss": 0.9315, "step": 15266 }, { "epoch": 0.29, "learning_rate": 4.176667709288882e-06, "loss": 0.8769, "step": 15267 }, { "epoch": 0.29, "learning_rate": 4.176554391026266e-06, "loss": 1.0226, "step": 15268 }, { "epoch": 0.29, "learning_rate": 4.1764410665034485e-06, "loss": 1.0757, "step": 15269 }, { "epoch": 0.29, "learning_rate": 4.176327735720852e-06, "loss": 0.8006, "step": 15270 }, { "epoch": 0.29, "learning_rate": 4.1762143986788985e-06, "loss": 1.0411, "step": 15271 }, { "epoch": 0.29, "learning_rate": 4.176101055378011e-06, "loss": 0.8926, "step": 15272 }, { "epoch": 0.29, "learning_rate": 4.175987705818615e-06, "loss": 0.8744, "step": 15273 }, { "epoch": 0.29, "learning_rate": 4.175874350001131e-06, "loss": 0.8198, "step": 15274 }, { "epoch": 0.29, "learning_rate": 4.175760987925984e-06, "loss": 1.1064, "step": 15275 }, { "epoch": 0.29, "learning_rate": 4.175647619593598e-06, "loss": 0.9335, "step": 15276 }, { "epoch": 0.29, "learning_rate": 4.175534245004393e-06, "loss": 1.0457, "step": 15277 }, { "epoch": 0.29, "learning_rate": 4.175420864158796e-06, "loss": 0.9569, "step": 15278 }, { "epoch": 0.29, "learning_rate": 4.1753074770572285e-06, "loss": 0.9468, "step": 15279 }, { "epoch": 0.29, "learning_rate": 4.175194083700115e-06, "loss": 1.2464, "step": 15280 }, { "epoch": 0.29, "learning_rate": 4.175080684087877e-06, "loss": 1.1325, "step": 15281 }, { "epoch": 0.29, "learning_rate": 4.174967278220939e-06, "loss": 0.7617, "step": 15282 }, { "epoch": 0.29, "learning_rate": 4.174853866099725e-06, "loss": 0.9163, "step": 15283 }, { "epoch": 0.29, "learning_rate": 4.174740447724659e-06, "loss": 0.9667, "step": 15284 }, { "epoch": 0.29, "learning_rate": 4.174627023096162e-06, "loss": 0.8085, "step": 15285 }, { "epoch": 0.29, "learning_rate": 4.17451359221466e-06, "loss": 0.8804, "step": 15286 }, { "epoch": 0.29, "learning_rate": 4.174400155080575e-06, "loss": 0.8374, "step": 15287 }, { "epoch": 0.29, "learning_rate": 4.1742867116943304e-06, "loss": 1.2533, "step": 15288 }, { "epoch": 0.29, "learning_rate": 4.174173262056353e-06, "loss": 0.8256, "step": 15289 }, { "epoch": 0.29, "learning_rate": 4.174059806167062e-06, "loss": 0.8919, "step": 15290 }, { "epoch": 0.29, "learning_rate": 4.1739463440268835e-06, "loss": 0.9134, "step": 15291 }, { "epoch": 0.29, "learning_rate": 4.17383287563624e-06, "loss": 0.7295, "step": 15292 }, { "epoch": 0.29, "learning_rate": 4.173719400995556e-06, "loss": 1.0752, "step": 15293 }, { "epoch": 0.29, "learning_rate": 4.173605920105257e-06, "loss": 1.0504, "step": 15294 }, { "epoch": 0.29, "learning_rate": 4.173492432965763e-06, "loss": 0.9229, "step": 15295 }, { "epoch": 0.29, "learning_rate": 4.1733789395775e-06, "loss": 0.8404, "step": 15296 }, { "epoch": 0.29, "learning_rate": 4.173265439940891e-06, "loss": 1.0514, "step": 15297 }, { "epoch": 0.29, "learning_rate": 4.173151934056361e-06, "loss": 0.8405, "step": 15298 }, { "epoch": 0.29, "learning_rate": 4.173038421924332e-06, "loss": 1.1119, "step": 15299 }, { "epoch": 0.29, "learning_rate": 4.17292490354523e-06, "loss": 1.0752, "step": 15300 }, { "epoch": 0.29, "learning_rate": 4.172811378919477e-06, "loss": 0.8262, "step": 15301 }, { "epoch": 0.29, "learning_rate": 4.172697848047497e-06, "loss": 1.0683, "step": 15302 }, { "epoch": 0.29, "learning_rate": 4.172584310929716e-06, "loss": 0.798, "step": 15303 }, { "epoch": 0.29, "learning_rate": 4.172470767566555e-06, "loss": 0.9323, "step": 15304 }, { "epoch": 0.29, "learning_rate": 4.17235721795844e-06, "loss": 1.059, "step": 15305 }, { "epoch": 0.29, "learning_rate": 4.172243662105794e-06, "loss": 1.1373, "step": 15306 }, { "epoch": 0.29, "learning_rate": 4.172130100009042e-06, "loss": 0.8582, "step": 15307 }, { "epoch": 0.29, "learning_rate": 4.172016531668607e-06, "loss": 1.0506, "step": 15308 }, { "epoch": 0.29, "learning_rate": 4.1719029570849145e-06, "loss": 0.8848, "step": 15309 }, { "epoch": 0.29, "learning_rate": 4.1717893762583866e-06, "loss": 0.7862, "step": 15310 }, { "epoch": 0.29, "learning_rate": 4.171675789189449e-06, "loss": 1.0258, "step": 15311 }, { "epoch": 0.29, "learning_rate": 4.171562195878525e-06, "loss": 0.9686, "step": 15312 }, { "epoch": 0.29, "learning_rate": 4.171448596326039e-06, "loss": 0.9852, "step": 15313 }, { "epoch": 0.29, "learning_rate": 4.1713349905324155e-06, "loss": 0.8612, "step": 15314 }, { "epoch": 0.29, "learning_rate": 4.1712213784980785e-06, "loss": 0.9822, "step": 15315 }, { "epoch": 0.29, "learning_rate": 4.1711077602234515e-06, "loss": 1.0608, "step": 15316 }, { "epoch": 0.29, "learning_rate": 4.17099413570896e-06, "loss": 0.8145, "step": 15317 }, { "epoch": 0.29, "learning_rate": 4.170880504955027e-06, "loss": 0.9995, "step": 15318 }, { "epoch": 0.29, "learning_rate": 4.170766867962078e-06, "loss": 1.0056, "step": 15319 }, { "epoch": 0.29, "learning_rate": 4.170653224730536e-06, "loss": 0.7398, "step": 15320 }, { "epoch": 0.29, "learning_rate": 4.170539575260827e-06, "loss": 0.9157, "step": 15321 }, { "epoch": 0.29, "learning_rate": 4.170425919553374e-06, "loss": 0.9686, "step": 15322 }, { "epoch": 0.29, "learning_rate": 4.170312257608602e-06, "loss": 0.8273, "step": 15323 }, { "epoch": 0.29, "learning_rate": 4.1701985894269344e-06, "loss": 0.9775, "step": 15324 }, { "epoch": 0.29, "learning_rate": 4.170084915008798e-06, "loss": 1.4551, "step": 15325 }, { "epoch": 0.29, "learning_rate": 4.169971234354614e-06, "loss": 0.8821, "step": 15326 }, { "epoch": 0.29, "learning_rate": 4.169857547464809e-06, "loss": 0.7667, "step": 15327 }, { "epoch": 0.29, "learning_rate": 4.1697438543398086e-06, "loss": 0.9166, "step": 15328 }, { "epoch": 0.29, "learning_rate": 4.169630154980035e-06, "loss": 0.9517, "step": 15329 }, { "epoch": 0.29, "learning_rate": 4.169516449385913e-06, "loss": 1.0181, "step": 15330 }, { "epoch": 0.29, "learning_rate": 4.169402737557868e-06, "loss": 1.1965, "step": 15331 }, { "epoch": 0.29, "learning_rate": 4.169289019496325e-06, "loss": 1.0507, "step": 15332 }, { "epoch": 0.29, "learning_rate": 4.169175295201707e-06, "loss": 0.8409, "step": 15333 }, { "epoch": 0.29, "learning_rate": 4.16906156467444e-06, "loss": 0.7693, "step": 15334 }, { "epoch": 0.29, "learning_rate": 4.168947827914949e-06, "loss": 0.8387, "step": 15335 }, { "epoch": 0.29, "learning_rate": 4.1688340849236574e-06, "loss": 0.7254, "step": 15336 }, { "epoch": 0.29, "learning_rate": 4.168720335700989e-06, "loss": 0.8741, "step": 15337 }, { "epoch": 0.29, "learning_rate": 4.168606580247373e-06, "loss": 0.93, "step": 15338 }, { "epoch": 0.29, "learning_rate": 4.16849281856323e-06, "loss": 0.9361, "step": 15339 }, { "epoch": 0.29, "learning_rate": 4.168379050648985e-06, "loss": 0.8673, "step": 15340 }, { "epoch": 0.29, "learning_rate": 4.168265276505065e-06, "loss": 1.0714, "step": 15341 }, { "epoch": 0.29, "learning_rate": 4.168151496131893e-06, "loss": 0.8436, "step": 15342 }, { "epoch": 0.29, "learning_rate": 4.1680377095298945e-06, "loss": 0.9372, "step": 15343 }, { "epoch": 0.29, "learning_rate": 4.1679239166994945e-06, "loss": 0.8485, "step": 15344 }, { "epoch": 0.29, "learning_rate": 4.167810117641118e-06, "loss": 0.9225, "step": 15345 }, { "epoch": 0.29, "learning_rate": 4.167696312355189e-06, "loss": 0.7748, "step": 15346 }, { "epoch": 0.29, "learning_rate": 4.167582500842133e-06, "loss": 0.9153, "step": 15347 }, { "epoch": 0.29, "learning_rate": 4.167468683102376e-06, "loss": 0.8056, "step": 15348 }, { "epoch": 0.29, "learning_rate": 4.167354859136341e-06, "loss": 0.9475, "step": 15349 }, { "epoch": 0.29, "learning_rate": 4.167241028944455e-06, "loss": 0.8867, "step": 15350 }, { "epoch": 0.29, "learning_rate": 4.1671271925271415e-06, "loss": 1.0036, "step": 15351 }, { "epoch": 0.29, "learning_rate": 4.167013349884827e-06, "loss": 0.8284, "step": 15352 }, { "epoch": 0.29, "learning_rate": 4.166899501017935e-06, "loss": 1.0062, "step": 15353 }, { "epoch": 0.29, "learning_rate": 4.166785645926891e-06, "loss": 1.1776, "step": 15354 }, { "epoch": 0.29, "learning_rate": 4.1666717846121215e-06, "loss": 1.0425, "step": 15355 }, { "epoch": 0.29, "learning_rate": 4.16655791707405e-06, "loss": 1.0931, "step": 15356 }, { "epoch": 0.29, "learning_rate": 4.166444043313103e-06, "loss": 1.0916, "step": 15357 }, { "epoch": 0.29, "learning_rate": 4.166330163329704e-06, "loss": 0.7746, "step": 15358 }, { "epoch": 0.29, "learning_rate": 4.166216277124281e-06, "loss": 0.8528, "step": 15359 }, { "epoch": 0.29, "learning_rate": 4.166102384697256e-06, "loss": 1.0834, "step": 15360 }, { "epoch": 0.29, "learning_rate": 4.1659884860490554e-06, "loss": 0.7285, "step": 15361 }, { "epoch": 0.29, "learning_rate": 4.165874581180106e-06, "loss": 0.9165, "step": 15362 }, { "epoch": 0.29, "learning_rate": 4.165760670090831e-06, "loss": 0.8992, "step": 15363 }, { "epoch": 0.29, "learning_rate": 4.165646752781658e-06, "loss": 1.0809, "step": 15364 }, { "epoch": 0.29, "learning_rate": 4.165532829253011e-06, "loss": 0.9821, "step": 15365 }, { "epoch": 0.29, "learning_rate": 4.1654188995053145e-06, "loss": 0.98, "step": 15366 }, { "epoch": 0.29, "learning_rate": 4.165304963538995e-06, "loss": 1.0989, "step": 15367 }, { "epoch": 0.29, "learning_rate": 4.165191021354478e-06, "loss": 0.8582, "step": 15368 }, { "epoch": 0.29, "learning_rate": 4.165077072952189e-06, "loss": 1.0892, "step": 15369 }, { "epoch": 0.29, "learning_rate": 4.164963118332553e-06, "loss": 1.0579, "step": 15370 }, { "epoch": 0.29, "learning_rate": 4.164849157495996e-06, "loss": 0.7134, "step": 15371 }, { "epoch": 0.29, "learning_rate": 4.164735190442943e-06, "loss": 1.2273, "step": 15372 }, { "epoch": 0.29, "learning_rate": 4.16462121717382e-06, "loss": 1.0255, "step": 15373 }, { "epoch": 0.29, "learning_rate": 4.164507237689052e-06, "loss": 0.7298, "step": 15374 }, { "epoch": 0.29, "learning_rate": 4.1643932519890665e-06, "loss": 1.2325, "step": 15375 }, { "epoch": 0.29, "learning_rate": 4.164279260074286e-06, "loss": 1.027, "step": 15376 }, { "epoch": 0.29, "learning_rate": 4.164165261945139e-06, "loss": 0.9246, "step": 15377 }, { "epoch": 0.29, "learning_rate": 4.164051257602048e-06, "loss": 0.9655, "step": 15378 }, { "epoch": 0.29, "learning_rate": 4.1639372470454435e-06, "loss": 0.9904, "step": 15379 }, { "epoch": 0.29, "learning_rate": 4.163823230275746e-06, "loss": 1.0383, "step": 15380 }, { "epoch": 0.29, "learning_rate": 4.163709207293385e-06, "loss": 1.0751, "step": 15381 }, { "epoch": 0.29, "learning_rate": 4.163595178098784e-06, "loss": 1.1537, "step": 15382 }, { "epoch": 0.29, "learning_rate": 4.163481142692369e-06, "loss": 0.9491, "step": 15383 }, { "epoch": 0.29, "learning_rate": 4.163367101074568e-06, "loss": 0.8798, "step": 15384 }, { "epoch": 0.29, "learning_rate": 4.163253053245804e-06, "loss": 0.8694, "step": 15385 }, { "epoch": 0.29, "learning_rate": 4.163138999206505e-06, "loss": 0.8417, "step": 15386 }, { "epoch": 0.29, "learning_rate": 4.163024938957095e-06, "loss": 1.202, "step": 15387 }, { "epoch": 0.29, "learning_rate": 4.162910872498002e-06, "loss": 0.8035, "step": 15388 }, { "epoch": 0.29, "learning_rate": 4.162796799829649e-06, "loss": 0.7427, "step": 15389 }, { "epoch": 0.29, "learning_rate": 4.162682720952466e-06, "loss": 0.9659, "step": 15390 }, { "epoch": 0.29, "learning_rate": 4.162568635866875e-06, "loss": 1.0668, "step": 15391 }, { "epoch": 0.29, "learning_rate": 4.162454544573305e-06, "loss": 0.8882, "step": 15392 }, { "epoch": 0.29, "learning_rate": 4.16234044707218e-06, "loss": 1.0651, "step": 15393 }, { "epoch": 0.29, "learning_rate": 4.162226343363926e-06, "loss": 1.0067, "step": 15394 }, { "epoch": 0.29, "learning_rate": 4.162112233448971e-06, "loss": 1.0457, "step": 15395 }, { "epoch": 0.29, "learning_rate": 4.161998117327739e-06, "loss": 0.9721, "step": 15396 }, { "epoch": 0.29, "learning_rate": 4.161883995000658e-06, "loss": 0.9001, "step": 15397 }, { "epoch": 0.29, "learning_rate": 4.161769866468153e-06, "loss": 0.7924, "step": 15398 }, { "epoch": 0.29, "learning_rate": 4.16165573173065e-06, "loss": 1.1002, "step": 15399 }, { "epoch": 0.29, "learning_rate": 4.1615415907885735e-06, "loss": 1.0595, "step": 15400 }, { "epoch": 0.29, "learning_rate": 4.1614274436423544e-06, "loss": 0.8161, "step": 15401 }, { "epoch": 0.29, "learning_rate": 4.161313290292414e-06, "loss": 0.9106, "step": 15402 }, { "epoch": 0.29, "learning_rate": 4.161199130739183e-06, "loss": 0.9283, "step": 15403 }, { "epoch": 0.29, "learning_rate": 4.161084964983084e-06, "loss": 0.9242, "step": 15404 }, { "epoch": 0.29, "learning_rate": 4.160970793024544e-06, "loss": 1.0099, "step": 15405 }, { "epoch": 0.29, "learning_rate": 4.160856614863992e-06, "loss": 1.2798, "step": 15406 }, { "epoch": 0.29, "learning_rate": 4.160742430501851e-06, "loss": 0.9147, "step": 15407 }, { "epoch": 0.29, "learning_rate": 4.160628239938549e-06, "loss": 0.8551, "step": 15408 }, { "epoch": 0.29, "learning_rate": 4.160514043174511e-06, "loss": 0.7296, "step": 15409 }, { "epoch": 0.29, "learning_rate": 4.160399840210166e-06, "loss": 0.9871, "step": 15410 }, { "epoch": 0.29, "learning_rate": 4.160285631045939e-06, "loss": 0.8953, "step": 15411 }, { "epoch": 0.29, "learning_rate": 4.160171415682255e-06, "loss": 0.9546, "step": 15412 }, { "epoch": 0.29, "learning_rate": 4.160057194119543e-06, "loss": 0.9558, "step": 15413 }, { "epoch": 0.29, "learning_rate": 4.159942966358228e-06, "loss": 0.9237, "step": 15414 }, { "epoch": 0.29, "learning_rate": 4.1598287323987365e-06, "loss": 1.0221, "step": 15415 }, { "epoch": 0.29, "learning_rate": 4.159714492241496e-06, "loss": 0.8787, "step": 15416 }, { "epoch": 0.29, "learning_rate": 4.1596002458869315e-06, "loss": 0.8463, "step": 15417 }, { "epoch": 0.29, "learning_rate": 4.159485993335472e-06, "loss": 0.8902, "step": 15418 }, { "epoch": 0.29, "learning_rate": 4.1593717345875415e-06, "loss": 0.8376, "step": 15419 }, { "epoch": 0.29, "learning_rate": 4.159257469643569e-06, "loss": 0.976, "step": 15420 }, { "epoch": 0.29, "learning_rate": 4.159143198503978e-06, "loss": 1.1987, "step": 15421 }, { "epoch": 0.29, "learning_rate": 4.159028921169199e-06, "loss": 0.817, "step": 15422 }, { "epoch": 0.29, "learning_rate": 4.158914637639656e-06, "loss": 0.8662, "step": 15423 }, { "epoch": 0.29, "learning_rate": 4.158800347915777e-06, "loss": 0.9845, "step": 15424 }, { "epoch": 0.29, "learning_rate": 4.158686051997988e-06, "loss": 1.1089, "step": 15425 }, { "epoch": 0.29, "learning_rate": 4.158571749886716e-06, "loss": 0.8047, "step": 15426 }, { "epoch": 0.29, "learning_rate": 4.158457441582389e-06, "loss": 0.9827, "step": 15427 }, { "epoch": 0.29, "learning_rate": 4.158343127085432e-06, "loss": 0.8419, "step": 15428 }, { "epoch": 0.29, "learning_rate": 4.158228806396272e-06, "loss": 0.8892, "step": 15429 }, { "epoch": 0.29, "learning_rate": 4.158114479515337e-06, "loss": 1.0188, "step": 15430 }, { "epoch": 0.29, "learning_rate": 4.1580001464430534e-06, "loss": 1.1816, "step": 15431 }, { "epoch": 0.29, "learning_rate": 4.157885807179848e-06, "loss": 0.958, "step": 15432 }, { "epoch": 0.29, "learning_rate": 4.157771461726149e-06, "loss": 0.9487, "step": 15433 }, { "epoch": 0.29, "learning_rate": 4.15765711008238e-06, "loss": 1.0081, "step": 15434 }, { "epoch": 0.29, "learning_rate": 4.157542752248972e-06, "loss": 0.9766, "step": 15435 }, { "epoch": 0.29, "learning_rate": 4.157428388226349e-06, "loss": 0.9603, "step": 15436 }, { "epoch": 0.29, "learning_rate": 4.157314018014941e-06, "loss": 0.9866, "step": 15437 }, { "epoch": 0.29, "learning_rate": 4.157199641615171e-06, "loss": 0.8457, "step": 15438 }, { "epoch": 0.29, "learning_rate": 4.1570852590274705e-06, "loss": 0.8764, "step": 15439 }, { "epoch": 0.29, "learning_rate": 4.156970870252262e-06, "loss": 0.9938, "step": 15440 }, { "epoch": 0.29, "learning_rate": 4.156856475289976e-06, "loss": 1.0275, "step": 15441 }, { "epoch": 0.29, "learning_rate": 4.156742074141041e-06, "loss": 0.9016, "step": 15442 }, { "epoch": 0.29, "learning_rate": 4.156627666805879e-06, "loss": 1.181, "step": 15443 }, { "epoch": 0.29, "learning_rate": 4.156513253284921e-06, "loss": 1.1791, "step": 15444 }, { "epoch": 0.29, "learning_rate": 4.156398833578594e-06, "loss": 0.817, "step": 15445 }, { "epoch": 0.29, "learning_rate": 4.156284407687323e-06, "loss": 0.8124, "step": 15446 }, { "epoch": 0.29, "learning_rate": 4.1561699756115385e-06, "loss": 0.8518, "step": 15447 }, { "epoch": 0.29, "learning_rate": 4.156055537351665e-06, "loss": 0.8834, "step": 15448 }, { "epoch": 0.29, "learning_rate": 4.155941092908131e-06, "loss": 1.1561, "step": 15449 }, { "epoch": 0.29, "learning_rate": 4.155826642281364e-06, "loss": 1.1235, "step": 15450 }, { "epoch": 0.29, "learning_rate": 4.155712185471791e-06, "loss": 0.8004, "step": 15451 }, { "epoch": 0.29, "learning_rate": 4.1555977224798396e-06, "loss": 0.7929, "step": 15452 }, { "epoch": 0.29, "learning_rate": 4.155483253305938e-06, "loss": 0.9048, "step": 15453 }, { "epoch": 0.29, "learning_rate": 4.155368777950511e-06, "loss": 0.884, "step": 15454 }, { "epoch": 0.29, "learning_rate": 4.155254296413988e-06, "loss": 0.8809, "step": 15455 }, { "epoch": 0.29, "learning_rate": 4.155139808696797e-06, "loss": 1.018, "step": 15456 }, { "epoch": 0.29, "learning_rate": 4.155025314799365e-06, "loss": 1.0053, "step": 15457 }, { "epoch": 0.29, "learning_rate": 4.154910814722119e-06, "loss": 0.8815, "step": 15458 }, { "epoch": 0.29, "learning_rate": 4.1547963084654854e-06, "loss": 1.0726, "step": 15459 }, { "epoch": 0.29, "learning_rate": 4.154681796029894e-06, "loss": 0.8845, "step": 15460 }, { "epoch": 0.29, "learning_rate": 4.154567277415771e-06, "loss": 1.1225, "step": 15461 }, { "epoch": 0.29, "learning_rate": 4.154452752623545e-06, "loss": 0.8454, "step": 15462 }, { "epoch": 0.29, "learning_rate": 4.154338221653644e-06, "loss": 0.936, "step": 15463 }, { "epoch": 0.29, "learning_rate": 4.1542236845064934e-06, "loss": 1.0172, "step": 15464 }, { "epoch": 0.29, "learning_rate": 4.154109141182523e-06, "loss": 0.8729, "step": 15465 }, { "epoch": 0.29, "learning_rate": 4.15399459168216e-06, "loss": 0.9107, "step": 15466 }, { "epoch": 0.29, "learning_rate": 4.153880036005832e-06, "loss": 0.8373, "step": 15467 }, { "epoch": 0.29, "learning_rate": 4.153765474153966e-06, "loss": 1.1161, "step": 15468 }, { "epoch": 0.29, "learning_rate": 4.153650906126991e-06, "loss": 1.1378, "step": 15469 }, { "epoch": 0.29, "learning_rate": 4.153536331925333e-06, "loss": 0.7018, "step": 15470 }, { "epoch": 0.29, "learning_rate": 4.153421751549422e-06, "loss": 1.11, "step": 15471 }, { "epoch": 0.29, "learning_rate": 4.153307164999685e-06, "loss": 0.7496, "step": 15472 }, { "epoch": 0.29, "learning_rate": 4.1531925722765495e-06, "loss": 0.8124, "step": 15473 }, { "epoch": 0.29, "learning_rate": 4.153077973380443e-06, "loss": 0.9335, "step": 15474 }, { "epoch": 0.29, "learning_rate": 4.152963368311795e-06, "loss": 0.9576, "step": 15475 }, { "epoch": 0.29, "learning_rate": 4.152848757071032e-06, "loss": 0.6422, "step": 15476 }, { "epoch": 0.29, "learning_rate": 4.152734139658583e-06, "loss": 1.0527, "step": 15477 }, { "epoch": 0.29, "learning_rate": 4.152619516074875e-06, "loss": 0.9509, "step": 15478 }, { "epoch": 0.29, "learning_rate": 4.152504886320337e-06, "loss": 1.04, "step": 15479 }, { "epoch": 0.29, "learning_rate": 4.152390250395395e-06, "loss": 0.9547, "step": 15480 }, { "epoch": 0.29, "learning_rate": 4.1522756083004795e-06, "loss": 1.1663, "step": 15481 }, { "epoch": 0.29, "learning_rate": 4.152160960036017e-06, "loss": 0.9159, "step": 15482 }, { "epoch": 0.29, "learning_rate": 4.152046305602436e-06, "loss": 1.0262, "step": 15483 }, { "epoch": 0.29, "learning_rate": 4.1519316450001655e-06, "loss": 0.9641, "step": 15484 }, { "epoch": 0.29, "learning_rate": 4.1518169782296325e-06, "loss": 0.9514, "step": 15485 }, { "epoch": 0.29, "learning_rate": 4.151702305291266e-06, "loss": 1.0534, "step": 15486 }, { "epoch": 0.29, "learning_rate": 4.1515876261854934e-06, "loss": 1.0595, "step": 15487 }, { "epoch": 0.29, "learning_rate": 4.151472940912743e-06, "loss": 0.9666, "step": 15488 }, { "epoch": 0.29, "learning_rate": 4.1513582494734425e-06, "loss": 0.966, "step": 15489 }, { "epoch": 0.29, "learning_rate": 4.151243551868023e-06, "loss": 0.9502, "step": 15490 }, { "epoch": 0.29, "learning_rate": 4.1511288480969094e-06, "loss": 0.762, "step": 15491 }, { "epoch": 0.29, "learning_rate": 4.151014138160531e-06, "loss": 0.8933, "step": 15492 }, { "epoch": 0.29, "learning_rate": 4.150899422059317e-06, "loss": 1.0276, "step": 15493 }, { "epoch": 0.29, "learning_rate": 4.150784699793695e-06, "loss": 1.2018, "step": 15494 }, { "epoch": 0.29, "learning_rate": 4.150669971364094e-06, "loss": 1.1484, "step": 15495 }, { "epoch": 0.29, "learning_rate": 4.150555236770942e-06, "loss": 0.8763, "step": 15496 }, { "epoch": 0.29, "learning_rate": 4.150440496014666e-06, "loss": 0.9254, "step": 15497 }, { "epoch": 0.29, "learning_rate": 4.150325749095697e-06, "loss": 0.9514, "step": 15498 }, { "epoch": 0.29, "learning_rate": 4.150210996014462e-06, "loss": 1.0591, "step": 15499 }, { "epoch": 0.29, "learning_rate": 4.15009623677139e-06, "loss": 1.0838, "step": 15500 }, { "epoch": 0.29, "learning_rate": 4.149981471366909e-06, "loss": 1.0159, "step": 15501 }, { "epoch": 0.29, "learning_rate": 4.1498666998014485e-06, "loss": 0.8122, "step": 15502 }, { "epoch": 0.29, "learning_rate": 4.1497519220754346e-06, "loss": 0.9431, "step": 15503 }, { "epoch": 0.29, "learning_rate": 4.149637138189298e-06, "loss": 0.9562, "step": 15504 }, { "epoch": 0.29, "learning_rate": 4.149522348143468e-06, "loss": 1.1399, "step": 15505 }, { "epoch": 0.29, "learning_rate": 4.1494075519383715e-06, "loss": 1.0959, "step": 15506 }, { "epoch": 0.29, "learning_rate": 4.1492927495744375e-06, "loss": 0.8937, "step": 15507 }, { "epoch": 0.29, "learning_rate": 4.149177941052096e-06, "loss": 0.932, "step": 15508 }, { "epoch": 0.29, "learning_rate": 4.149063126371774e-06, "loss": 0.9522, "step": 15509 }, { "epoch": 0.29, "learning_rate": 4.1489483055339005e-06, "loss": 0.9686, "step": 15510 }, { "epoch": 0.29, "learning_rate": 4.148833478538905e-06, "loss": 0.8798, "step": 15511 }, { "epoch": 0.29, "learning_rate": 4.1487186453872156e-06, "loss": 1.0735, "step": 15512 }, { "epoch": 0.29, "learning_rate": 4.148603806079261e-06, "loss": 1.0748, "step": 15513 }, { "epoch": 0.29, "learning_rate": 4.148488960615471e-06, "loss": 0.977, "step": 15514 }, { "epoch": 0.29, "learning_rate": 4.148374108996274e-06, "loss": 0.9733, "step": 15515 }, { "epoch": 0.29, "learning_rate": 4.148259251222097e-06, "loss": 0.9417, "step": 15516 }, { "epoch": 0.29, "learning_rate": 4.148144387293373e-06, "loss": 0.9619, "step": 15517 }, { "epoch": 0.29, "learning_rate": 4.148029517210527e-06, "loss": 1.0305, "step": 15518 }, { "epoch": 0.29, "learning_rate": 4.147914640973989e-06, "loss": 0.9462, "step": 15519 }, { "epoch": 0.29, "learning_rate": 4.147799758584189e-06, "loss": 0.9271, "step": 15520 }, { "epoch": 0.29, "learning_rate": 4.147684870041554e-06, "loss": 0.7935, "step": 15521 }, { "epoch": 0.29, "learning_rate": 4.147569975346515e-06, "loss": 1.0365, "step": 15522 }, { "epoch": 0.29, "learning_rate": 4.147455074499501e-06, "loss": 0.7689, "step": 15523 }, { "epoch": 0.29, "learning_rate": 4.147340167500939e-06, "loss": 1.0245, "step": 15524 }, { "epoch": 0.29, "learning_rate": 4.1472252543512605e-06, "loss": 1.2427, "step": 15525 }, { "epoch": 0.29, "learning_rate": 4.147110335050893e-06, "loss": 0.9406, "step": 15526 }, { "epoch": 0.29, "learning_rate": 4.146995409600265e-06, "loss": 0.8139, "step": 15527 }, { "epoch": 0.29, "learning_rate": 4.1468804779998075e-06, "loss": 1.0677, "step": 15528 }, { "epoch": 0.29, "learning_rate": 4.146765540249949e-06, "loss": 0.9556, "step": 15529 }, { "epoch": 0.29, "learning_rate": 4.1466505963511184e-06, "loss": 0.8561, "step": 15530 }, { "epoch": 0.29, "learning_rate": 4.146535646303744e-06, "loss": 1.0935, "step": 15531 }, { "epoch": 0.29, "learning_rate": 4.146420690108257e-06, "loss": 0.9214, "step": 15532 }, { "epoch": 0.29, "learning_rate": 4.146305727765086e-06, "loss": 0.9899, "step": 15533 }, { "epoch": 0.29, "learning_rate": 4.146190759274658e-06, "loss": 0.8487, "step": 15534 }, { "epoch": 0.29, "learning_rate": 4.146075784637407e-06, "loss": 0.8096, "step": 15535 }, { "epoch": 0.29, "learning_rate": 4.145960803853757e-06, "loss": 0.9155, "step": 15536 }, { "epoch": 0.29, "learning_rate": 4.145845816924141e-06, "loss": 1.1144, "step": 15537 }, { "epoch": 0.29, "learning_rate": 4.145730823848987e-06, "loss": 1.0116, "step": 15538 }, { "epoch": 0.29, "learning_rate": 4.145615824628724e-06, "loss": 0.8047, "step": 15539 }, { "epoch": 0.29, "learning_rate": 4.145500819263782e-06, "loss": 0.7569, "step": 15540 }, { "epoch": 0.29, "learning_rate": 4.145385807754592e-06, "loss": 0.8256, "step": 15541 }, { "epoch": 0.29, "learning_rate": 4.14527079010158e-06, "loss": 0.9299, "step": 15542 }, { "epoch": 0.29, "learning_rate": 4.145155766305178e-06, "loss": 1.1282, "step": 15543 }, { "epoch": 0.29, "learning_rate": 4.145040736365815e-06, "loss": 1.21, "step": 15544 }, { "epoch": 0.29, "learning_rate": 4.144925700283921e-06, "loss": 1.0196, "step": 15545 }, { "epoch": 0.29, "learning_rate": 4.1448106580599225e-06, "loss": 0.7706, "step": 15546 }, { "epoch": 0.29, "learning_rate": 4.1446956096942536e-06, "loss": 0.9034, "step": 15547 }, { "epoch": 0.29, "learning_rate": 4.144580555187341e-06, "loss": 0.9573, "step": 15548 }, { "epoch": 0.29, "learning_rate": 4.144465494539615e-06, "loss": 1.1888, "step": 15549 }, { "epoch": 0.29, "learning_rate": 4.144350427751506e-06, "loss": 1.0353, "step": 15550 }, { "epoch": 0.29, "learning_rate": 4.144235354823442e-06, "loss": 0.7461, "step": 15551 }, { "epoch": 0.29, "learning_rate": 4.144120275755854e-06, "loss": 0.6832, "step": 15552 }, { "epoch": 0.29, "learning_rate": 4.1440051905491705e-06, "loss": 0.7081, "step": 15553 }, { "epoch": 0.29, "learning_rate": 4.143890099203823e-06, "loss": 0.9102, "step": 15554 }, { "epoch": 0.29, "learning_rate": 4.14377500172024e-06, "loss": 0.9531, "step": 15555 }, { "epoch": 0.29, "learning_rate": 4.143659898098852e-06, "loss": 0.8641, "step": 15556 }, { "epoch": 0.29, "learning_rate": 4.143544788340087e-06, "loss": 1.0148, "step": 15557 }, { "epoch": 0.29, "learning_rate": 4.143429672444378e-06, "loss": 0.8996, "step": 15558 }, { "epoch": 0.29, "learning_rate": 4.143314550412151e-06, "loss": 1.1252, "step": 15559 }, { "epoch": 0.29, "learning_rate": 4.143199422243839e-06, "loss": 0.8552, "step": 15560 }, { "epoch": 0.29, "learning_rate": 4.143084287939871e-06, "loss": 0.8405, "step": 15561 }, { "epoch": 0.29, "learning_rate": 4.142969147500676e-06, "loss": 0.923, "step": 15562 }, { "epoch": 0.29, "learning_rate": 4.142854000926685e-06, "loss": 0.985, "step": 15563 }, { "epoch": 0.29, "learning_rate": 4.1427388482183275e-06, "loss": 0.7476, "step": 15564 }, { "epoch": 0.29, "learning_rate": 4.142623689376033e-06, "loss": 1.0641, "step": 15565 }, { "epoch": 0.29, "learning_rate": 4.142508524400232e-06, "loss": 0.8431, "step": 15566 }, { "epoch": 0.29, "learning_rate": 4.142393353291355e-06, "loss": 0.9023, "step": 15567 }, { "epoch": 0.29, "learning_rate": 4.142278176049832e-06, "loss": 1.0514, "step": 15568 }, { "epoch": 0.29, "learning_rate": 4.142162992676092e-06, "loss": 0.9954, "step": 15569 }, { "epoch": 0.29, "learning_rate": 4.1420478031705655e-06, "loss": 0.9668, "step": 15570 }, { "epoch": 0.29, "learning_rate": 4.141932607533683e-06, "loss": 0.8786, "step": 15571 }, { "epoch": 0.29, "learning_rate": 4.141817405765875e-06, "loss": 0.8263, "step": 15572 }, { "epoch": 0.29, "learning_rate": 4.141702197867571e-06, "loss": 0.858, "step": 15573 }, { "epoch": 0.29, "learning_rate": 4.141586983839201e-06, "loss": 1.0761, "step": 15574 }, { "epoch": 0.29, "learning_rate": 4.141471763681195e-06, "loss": 1.0161, "step": 15575 }, { "epoch": 0.29, "learning_rate": 4.141356537393985e-06, "loss": 0.7936, "step": 15576 }, { "epoch": 0.29, "learning_rate": 4.141241304978e-06, "loss": 0.9579, "step": 15577 }, { "epoch": 0.29, "learning_rate": 4.141126066433669e-06, "loss": 0.7974, "step": 15578 }, { "epoch": 0.29, "learning_rate": 4.141010821761425e-06, "loss": 0.8304, "step": 15579 }, { "epoch": 0.29, "learning_rate": 4.140895570961696e-06, "loss": 1.1064, "step": 15580 }, { "epoch": 0.29, "learning_rate": 4.140780314034914e-06, "loss": 1.0839, "step": 15581 }, { "epoch": 0.29, "learning_rate": 4.140665050981508e-06, "loss": 0.7639, "step": 15582 }, { "epoch": 0.29, "learning_rate": 4.140549781801909e-06, "loss": 0.9594, "step": 15583 }, { "epoch": 0.29, "learning_rate": 4.140434506496547e-06, "loss": 0.752, "step": 15584 }, { "epoch": 0.29, "learning_rate": 4.140319225065854e-06, "loss": 0.8917, "step": 15585 }, { "epoch": 0.29, "learning_rate": 4.1402039375102585e-06, "loss": 0.9788, "step": 15586 }, { "epoch": 0.29, "learning_rate": 4.140088643830191e-06, "loss": 1.032, "step": 15587 }, { "epoch": 0.29, "learning_rate": 4.139973344026084e-06, "loss": 1.0453, "step": 15588 }, { "epoch": 0.29, "learning_rate": 4.139858038098366e-06, "loss": 1.0004, "step": 15589 }, { "epoch": 0.29, "learning_rate": 4.13974272604747e-06, "loss": 0.7656, "step": 15590 }, { "epoch": 0.29, "learning_rate": 4.139627407873824e-06, "loss": 0.8609, "step": 15591 }, { "epoch": 0.29, "learning_rate": 4.139512083577859e-06, "loss": 0.7844, "step": 15592 }, { "epoch": 0.29, "learning_rate": 4.139396753160006e-06, "loss": 1.1655, "step": 15593 }, { "epoch": 0.29, "learning_rate": 4.139281416620697e-06, "loss": 1.0974, "step": 15594 }, { "epoch": 0.29, "learning_rate": 4.139166073960361e-06, "loss": 0.8144, "step": 15595 }, { "epoch": 0.29, "learning_rate": 4.1390507251794284e-06, "loss": 0.8217, "step": 15596 }, { "epoch": 0.29, "learning_rate": 4.138935370278332e-06, "loss": 0.9205, "step": 15597 }, { "epoch": 0.29, "learning_rate": 4.1388200092575e-06, "loss": 0.9033, "step": 15598 }, { "epoch": 0.29, "learning_rate": 4.1387046421173644e-06, "loss": 1.0305, "step": 15599 }, { "epoch": 0.29, "learning_rate": 4.138589268858356e-06, "loss": 0.8991, "step": 15600 }, { "epoch": 0.29, "learning_rate": 4.138473889480906e-06, "loss": 0.8978, "step": 15601 }, { "epoch": 0.29, "learning_rate": 4.138358503985445e-06, "loss": 0.9972, "step": 15602 }, { "epoch": 0.29, "learning_rate": 4.138243112372402e-06, "loss": 1.072, "step": 15603 }, { "epoch": 0.29, "learning_rate": 4.138127714642211e-06, "loss": 0.845, "step": 15604 }, { "epoch": 0.29, "learning_rate": 4.1380123107953e-06, "loss": 0.8642, "step": 15605 }, { "epoch": 0.29, "learning_rate": 4.137896900832103e-06, "loss": 0.889, "step": 15606 }, { "epoch": 0.29, "learning_rate": 4.1377814847530485e-06, "loss": 0.985, "step": 15607 }, { "epoch": 0.29, "learning_rate": 4.1376660625585675e-06, "loss": 1.0189, "step": 15608 }, { "epoch": 0.29, "learning_rate": 4.137550634249092e-06, "loss": 0.9382, "step": 15609 }, { "epoch": 0.29, "learning_rate": 4.137435199825053e-06, "loss": 0.9208, "step": 15610 }, { "epoch": 0.29, "learning_rate": 4.137319759286881e-06, "loss": 0.9942, "step": 15611 }, { "epoch": 0.29, "learning_rate": 4.137204312635007e-06, "loss": 1.3474, "step": 15612 }, { "epoch": 0.29, "learning_rate": 4.137088859869862e-06, "loss": 1.0873, "step": 15613 }, { "epoch": 0.29, "learning_rate": 4.136973400991878e-06, "loss": 0.894, "step": 15614 }, { "epoch": 0.29, "learning_rate": 4.136857936001485e-06, "loss": 0.6242, "step": 15615 }, { "epoch": 0.29, "learning_rate": 4.136742464899115e-06, "loss": 0.7197, "step": 15616 }, { "epoch": 0.29, "learning_rate": 4.136626987685198e-06, "loss": 1.0043, "step": 15617 }, { "epoch": 0.29, "learning_rate": 4.136511504360168e-06, "loss": 1.2844, "step": 15618 }, { "epoch": 0.29, "learning_rate": 4.136396014924453e-06, "loss": 1.1844, "step": 15619 }, { "epoch": 0.29, "learning_rate": 4.136280519378485e-06, "loss": 0.6918, "step": 15620 }, { "epoch": 0.29, "learning_rate": 4.136165017722696e-06, "loss": 0.8607, "step": 15621 }, { "epoch": 0.29, "learning_rate": 4.136049509957517e-06, "loss": 0.8788, "step": 15622 }, { "epoch": 0.29, "learning_rate": 4.135933996083379e-06, "loss": 0.8278, "step": 15623 }, { "epoch": 0.29, "learning_rate": 4.135818476100715e-06, "loss": 0.8737, "step": 15624 }, { "epoch": 0.29, "learning_rate": 4.1357029500099534e-06, "loss": 1.2911, "step": 15625 }, { "epoch": 0.29, "learning_rate": 4.135587417811527e-06, "loss": 1.1773, "step": 15626 }, { "epoch": 0.29, "learning_rate": 4.135471879505869e-06, "loss": 0.9359, "step": 15627 }, { "epoch": 0.29, "learning_rate": 4.135356335093408e-06, "loss": 0.9261, "step": 15628 }, { "epoch": 0.29, "learning_rate": 4.135240784574577e-06, "loss": 0.8553, "step": 15629 }, { "epoch": 0.29, "learning_rate": 4.1351252279498066e-06, "loss": 1.0437, "step": 15630 }, { "epoch": 0.29, "learning_rate": 4.135009665219529e-06, "loss": 1.1575, "step": 15631 }, { "epoch": 0.29, "learning_rate": 4.134894096384176e-06, "loss": 0.8599, "step": 15632 }, { "epoch": 0.29, "learning_rate": 4.134778521444177e-06, "loss": 0.8331, "step": 15633 }, { "epoch": 0.29, "learning_rate": 4.134662940399967e-06, "loss": 1.1763, "step": 15634 }, { "epoch": 0.29, "learning_rate": 4.134547353251975e-06, "loss": 0.8557, "step": 15635 }, { "epoch": 0.3, "learning_rate": 4.1344317600006325e-06, "loss": 0.8633, "step": 15636 }, { "epoch": 0.3, "learning_rate": 4.134316160646373e-06, "loss": 1.1733, "step": 15637 }, { "epoch": 0.3, "learning_rate": 4.134200555189626e-06, "loss": 1.0272, "step": 15638 }, { "epoch": 0.3, "learning_rate": 4.134084943630825e-06, "loss": 1.0529, "step": 15639 }, { "epoch": 0.3, "learning_rate": 4.133969325970401e-06, "loss": 0.9683, "step": 15640 }, { "epoch": 0.3, "learning_rate": 4.1338537022087855e-06, "loss": 0.8334, "step": 15641 }, { "epoch": 0.3, "learning_rate": 4.13373807234641e-06, "loss": 1.0402, "step": 15642 }, { "epoch": 0.3, "learning_rate": 4.133622436383707e-06, "loss": 1.0248, "step": 15643 }, { "epoch": 0.3, "learning_rate": 4.133506794321107e-06, "loss": 1.0381, "step": 15644 }, { "epoch": 0.3, "learning_rate": 4.133391146159044e-06, "loss": 0.9155, "step": 15645 }, { "epoch": 0.3, "learning_rate": 4.133275491897948e-06, "loss": 0.8482, "step": 15646 }, { "epoch": 0.3, "learning_rate": 4.1331598315382515e-06, "loss": 1.0233, "step": 15647 }, { "epoch": 0.3, "learning_rate": 4.133044165080387e-06, "loss": 0.868, "step": 15648 }, { "epoch": 0.3, "learning_rate": 4.132928492524785e-06, "loss": 1.0154, "step": 15649 }, { "epoch": 0.3, "learning_rate": 4.132812813871877e-06, "loss": 0.8868, "step": 15650 }, { "epoch": 0.3, "learning_rate": 4.132697129122098e-06, "loss": 0.9722, "step": 15651 }, { "epoch": 0.3, "learning_rate": 4.132581438275876e-06, "loss": 0.8431, "step": 15652 }, { "epoch": 0.3, "learning_rate": 4.132465741333646e-06, "loss": 0.9353, "step": 15653 }, { "epoch": 0.3, "learning_rate": 4.13235003829584e-06, "loss": 1.022, "step": 15654 }, { "epoch": 0.3, "learning_rate": 4.1322343291628865e-06, "loss": 1.0458, "step": 15655 }, { "epoch": 0.3, "learning_rate": 4.132118613935221e-06, "loss": 1.2672, "step": 15656 }, { "epoch": 0.3, "learning_rate": 4.132002892613276e-06, "loss": 1.0369, "step": 15657 }, { "epoch": 0.3, "learning_rate": 4.131887165197482e-06, "loss": 0.8992, "step": 15658 }, { "epoch": 0.3, "learning_rate": 4.1317714316882695e-06, "loss": 0.9787, "step": 15659 }, { "epoch": 0.3, "learning_rate": 4.131655692086074e-06, "loss": 0.8745, "step": 15660 }, { "epoch": 0.3, "learning_rate": 4.131539946391326e-06, "loss": 1.0101, "step": 15661 }, { "epoch": 0.3, "learning_rate": 4.131424194604457e-06, "loss": 1.2476, "step": 15662 }, { "epoch": 0.3, "learning_rate": 4.1313084367259016e-06, "loss": 1.0663, "step": 15663 }, { "epoch": 0.3, "learning_rate": 4.131192672756089e-06, "loss": 0.8302, "step": 15664 }, { "epoch": 0.3, "learning_rate": 4.131076902695454e-06, "loss": 0.8244, "step": 15665 }, { "epoch": 0.3, "learning_rate": 4.1309611265444285e-06, "loss": 0.8742, "step": 15666 }, { "epoch": 0.3, "learning_rate": 4.130845344303442e-06, "loss": 0.8173, "step": 15667 }, { "epoch": 0.3, "learning_rate": 4.130729555972931e-06, "loss": 1.2391, "step": 15668 }, { "epoch": 0.3, "learning_rate": 4.130613761553324e-06, "loss": 1.0389, "step": 15669 }, { "epoch": 0.3, "learning_rate": 4.1304979610450564e-06, "loss": 0.9195, "step": 15670 }, { "epoch": 0.3, "learning_rate": 4.13038215444856e-06, "loss": 0.8464, "step": 15671 }, { "epoch": 0.3, "learning_rate": 4.130266341764266e-06, "loss": 1.029, "step": 15672 }, { "epoch": 0.3, "learning_rate": 4.130150522992607e-06, "loss": 1.0859, "step": 15673 }, { "epoch": 0.3, "learning_rate": 4.130034698134016e-06, "loss": 0.9725, "step": 15674 }, { "epoch": 0.3, "learning_rate": 4.129918867188926e-06, "loss": 1.1694, "step": 15675 }, { "epoch": 0.3, "learning_rate": 4.129803030157768e-06, "loss": 0.9276, "step": 15676 }, { "epoch": 0.3, "learning_rate": 4.129687187040977e-06, "loss": 0.8568, "step": 15677 }, { "epoch": 0.3, "learning_rate": 4.129571337838983e-06, "loss": 0.8718, "step": 15678 }, { "epoch": 0.3, "learning_rate": 4.129455482552219e-06, "loss": 0.7694, "step": 15679 }, { "epoch": 0.3, "learning_rate": 4.129339621181119e-06, "loss": 1.0849, "step": 15680 }, { "epoch": 0.3, "learning_rate": 4.129223753726115e-06, "loss": 1.1465, "step": 15681 }, { "epoch": 0.3, "learning_rate": 4.129107880187639e-06, "loss": 1.0596, "step": 15682 }, { "epoch": 0.3, "learning_rate": 4.128992000566124e-06, "loss": 0.7683, "step": 15683 }, { "epoch": 0.3, "learning_rate": 4.128876114862003e-06, "loss": 0.8337, "step": 15684 }, { "epoch": 0.3, "learning_rate": 4.128760223075708e-06, "loss": 1.1002, "step": 15685 }, { "epoch": 0.3, "learning_rate": 4.128644325207673e-06, "loss": 1.0201, "step": 15686 }, { "epoch": 0.3, "learning_rate": 4.128528421258331e-06, "loss": 1.0017, "step": 15687 }, { "epoch": 0.3, "learning_rate": 4.128412511228112e-06, "loss": 0.9876, "step": 15688 }, { "epoch": 0.3, "learning_rate": 4.128296595117452e-06, "loss": 0.9678, "step": 15689 }, { "epoch": 0.3, "learning_rate": 4.128180672926782e-06, "loss": 0.886, "step": 15690 }, { "epoch": 0.3, "learning_rate": 4.128064744656534e-06, "loss": 1.0188, "step": 15691 }, { "epoch": 0.3, "learning_rate": 4.127948810307143e-06, "loss": 1.0132, "step": 15692 }, { "epoch": 0.3, "learning_rate": 4.127832869879042e-06, "loss": 0.9406, "step": 15693 }, { "epoch": 0.3, "learning_rate": 4.1277169233726614e-06, "loss": 1.1089, "step": 15694 }, { "epoch": 0.3, "learning_rate": 4.127600970788437e-06, "loss": 0.9341, "step": 15695 }, { "epoch": 0.3, "learning_rate": 4.127485012126799e-06, "loss": 1.0608, "step": 15696 }, { "epoch": 0.3, "learning_rate": 4.127369047388183e-06, "loss": 1.012, "step": 15697 }, { "epoch": 0.3, "learning_rate": 4.127253076573021e-06, "loss": 0.9703, "step": 15698 }, { "epoch": 0.3, "learning_rate": 4.127137099681746e-06, "loss": 1.0156, "step": 15699 }, { "epoch": 0.3, "learning_rate": 4.12702111671479e-06, "loss": 1.2258, "step": 15700 }, { "epoch": 0.3, "learning_rate": 4.126905127672589e-06, "loss": 0.9823, "step": 15701 }, { "epoch": 0.3, "learning_rate": 4.126789132555572e-06, "loss": 1.0138, "step": 15702 }, { "epoch": 0.3, "learning_rate": 4.126673131364175e-06, "loss": 0.9011, "step": 15703 }, { "epoch": 0.3, "learning_rate": 4.126557124098831e-06, "loss": 0.8135, "step": 15704 }, { "epoch": 0.3, "learning_rate": 4.126441110759972e-06, "loss": 0.9187, "step": 15705 }, { "epoch": 0.3, "learning_rate": 4.126325091348031e-06, "loss": 1.0699, "step": 15706 }, { "epoch": 0.3, "learning_rate": 4.126209065863443e-06, "loss": 0.8798, "step": 15707 }, { "epoch": 0.3, "learning_rate": 4.1260930343066404e-06, "loss": 0.8378, "step": 15708 }, { "epoch": 0.3, "learning_rate": 4.125976996678056e-06, "loss": 0.8004, "step": 15709 }, { "epoch": 0.3, "learning_rate": 4.125860952978123e-06, "loss": 0.7124, "step": 15710 }, { "epoch": 0.3, "learning_rate": 4.125744903207275e-06, "loss": 0.9239, "step": 15711 }, { "epoch": 0.3, "learning_rate": 4.125628847365945e-06, "loss": 0.9103, "step": 15712 }, { "epoch": 0.3, "learning_rate": 4.125512785454568e-06, "loss": 1.0035, "step": 15713 }, { "epoch": 0.3, "learning_rate": 4.1253967174735755e-06, "loss": 0.8049, "step": 15714 }, { "epoch": 0.3, "learning_rate": 4.125280643423401e-06, "loss": 1.0491, "step": 15715 }, { "epoch": 0.3, "learning_rate": 4.125164563304479e-06, "loss": 1.1094, "step": 15716 }, { "epoch": 0.3, "learning_rate": 4.125048477117242e-06, "loss": 0.9567, "step": 15717 }, { "epoch": 0.3, "learning_rate": 4.1249323848621235e-06, "loss": 1.1379, "step": 15718 }, { "epoch": 0.3, "learning_rate": 4.124816286539558e-06, "loss": 1.0382, "step": 15719 }, { "epoch": 0.3, "learning_rate": 4.124700182149979e-06, "loss": 0.9138, "step": 15720 }, { "epoch": 0.3, "learning_rate": 4.124584071693818e-06, "loss": 1.0175, "step": 15721 }, { "epoch": 0.3, "learning_rate": 4.124467955171511e-06, "loss": 0.7503, "step": 15722 }, { "epoch": 0.3, "learning_rate": 4.124351832583488e-06, "loss": 0.9412, "step": 15723 }, { "epoch": 0.3, "learning_rate": 4.124235703930187e-06, "loss": 1.2402, "step": 15724 }, { "epoch": 0.3, "learning_rate": 4.1241195692120405e-06, "loss": 1.1667, "step": 15725 }, { "epoch": 0.3, "learning_rate": 4.12400342842948e-06, "loss": 0.9692, "step": 15726 }, { "epoch": 0.3, "learning_rate": 4.12388728158294e-06, "loss": 0.9237, "step": 15727 }, { "epoch": 0.3, "learning_rate": 4.123771128672856e-06, "loss": 0.9827, "step": 15728 }, { "epoch": 0.3, "learning_rate": 4.123654969699661e-06, "loss": 0.9422, "step": 15729 }, { "epoch": 0.3, "learning_rate": 4.123538804663787e-06, "loss": 0.9783, "step": 15730 }, { "epoch": 0.3, "learning_rate": 4.123422633565668e-06, "loss": 0.9549, "step": 15731 }, { "epoch": 0.3, "learning_rate": 4.12330645640574e-06, "loss": 0.939, "step": 15732 }, { "epoch": 0.3, "learning_rate": 4.123190273184435e-06, "loss": 0.7479, "step": 15733 }, { "epoch": 0.3, "learning_rate": 4.123074083902187e-06, "loss": 0.8647, "step": 15734 }, { "epoch": 0.3, "learning_rate": 4.12295788855943e-06, "loss": 0.8458, "step": 15735 }, { "epoch": 0.3, "learning_rate": 4.122841687156599e-06, "loss": 0.7668, "step": 15736 }, { "epoch": 0.3, "learning_rate": 4.122725479694127e-06, "loss": 1.2371, "step": 15737 }, { "epoch": 0.3, "learning_rate": 4.122609266172446e-06, "loss": 1.103, "step": 15738 }, { "epoch": 0.3, "learning_rate": 4.122493046591993e-06, "loss": 0.9117, "step": 15739 }, { "epoch": 0.3, "learning_rate": 4.122376820953201e-06, "loss": 0.9654, "step": 15740 }, { "epoch": 0.3, "learning_rate": 4.122260589256504e-06, "loss": 0.7116, "step": 15741 }, { "epoch": 0.3, "learning_rate": 4.122144351502334e-06, "loss": 0.821, "step": 15742 }, { "epoch": 0.3, "learning_rate": 4.122028107691128e-06, "loss": 1.0897, "step": 15743 }, { "epoch": 0.3, "learning_rate": 4.121911857823319e-06, "loss": 1.0535, "step": 15744 }, { "epoch": 0.3, "learning_rate": 4.12179560189934e-06, "loss": 0.9246, "step": 15745 }, { "epoch": 0.3, "learning_rate": 4.121679339919627e-06, "loss": 0.8541, "step": 15746 }, { "epoch": 0.3, "learning_rate": 4.1215630718846124e-06, "loss": 0.9456, "step": 15747 }, { "epoch": 0.3, "learning_rate": 4.121446797794731e-06, "loss": 0.8466, "step": 15748 }, { "epoch": 0.3, "learning_rate": 4.121330517650417e-06, "loss": 1.0455, "step": 15749 }, { "epoch": 0.3, "learning_rate": 4.121214231452104e-06, "loss": 1.1003, "step": 15750 }, { "epoch": 0.3, "learning_rate": 4.121097939200227e-06, "loss": 1.1463, "step": 15751 }, { "epoch": 0.3, "learning_rate": 4.120981640895221e-06, "loss": 0.8159, "step": 15752 }, { "epoch": 0.3, "learning_rate": 4.120865336537518e-06, "loss": 0.9358, "step": 15753 }, { "epoch": 0.3, "learning_rate": 4.120749026127554e-06, "loss": 0.8876, "step": 15754 }, { "epoch": 0.3, "learning_rate": 4.120632709665763e-06, "loss": 0.8124, "step": 15755 }, { "epoch": 0.3, "learning_rate": 4.120516387152579e-06, "loss": 1.1833, "step": 15756 }, { "epoch": 0.3, "learning_rate": 4.120400058588436e-06, "loss": 1.0498, "step": 15757 }, { "epoch": 0.3, "learning_rate": 4.12028372397377e-06, "loss": 0.9203, "step": 15758 }, { "epoch": 0.3, "learning_rate": 4.120167383309014e-06, "loss": 0.9211, "step": 15759 }, { "epoch": 0.3, "learning_rate": 4.120051036594602e-06, "loss": 0.7594, "step": 15760 }, { "epoch": 0.3, "learning_rate": 4.11993468383097e-06, "loss": 1.0276, "step": 15761 }, { "epoch": 0.3, "learning_rate": 4.11981832501855e-06, "loss": 0.9099, "step": 15762 }, { "epoch": 0.3, "learning_rate": 4.119701960157779e-06, "loss": 0.9977, "step": 15763 }, { "epoch": 0.3, "learning_rate": 4.119585589249091e-06, "loss": 1.0182, "step": 15764 }, { "epoch": 0.3, "learning_rate": 4.11946921229292e-06, "loss": 0.8067, "step": 15765 }, { "epoch": 0.3, "learning_rate": 4.1193528292897e-06, "loss": 0.9264, "step": 15766 }, { "epoch": 0.3, "learning_rate": 4.1192364402398665e-06, "loss": 0.8478, "step": 15767 }, { "epoch": 0.3, "learning_rate": 4.119120045143854e-06, "loss": 0.899, "step": 15768 }, { "epoch": 0.3, "learning_rate": 4.119003644002096e-06, "loss": 1.045, "step": 15769 }, { "epoch": 0.3, "learning_rate": 4.118887236815029e-06, "loss": 1.0362, "step": 15770 }, { "epoch": 0.3, "learning_rate": 4.1187708235830865e-06, "loss": 0.8779, "step": 15771 }, { "epoch": 0.3, "learning_rate": 4.118654404306703e-06, "loss": 0.9214, "step": 15772 }, { "epoch": 0.3, "learning_rate": 4.118537978986314e-06, "loss": 1.0638, "step": 15773 }, { "epoch": 0.3, "learning_rate": 4.118421547622353e-06, "loss": 1.054, "step": 15774 }, { "epoch": 0.3, "learning_rate": 4.118305110215257e-06, "loss": 1.09, "step": 15775 }, { "epoch": 0.3, "learning_rate": 4.118188666765458e-06, "loss": 1.1278, "step": 15776 }, { "epoch": 0.3, "learning_rate": 4.1180722172733925e-06, "loss": 0.7788, "step": 15777 }, { "epoch": 0.3, "learning_rate": 4.117955761739495e-06, "loss": 0.8383, "step": 15778 }, { "epoch": 0.3, "learning_rate": 4.117839300164201e-06, "loss": 0.8654, "step": 15779 }, { "epoch": 0.3, "learning_rate": 4.117722832547943e-06, "loss": 0.7825, "step": 15780 }, { "epoch": 0.3, "learning_rate": 4.11760635889116e-06, "loss": 1.019, "step": 15781 }, { "epoch": 0.3, "learning_rate": 4.1174898791942825e-06, "loss": 0.9208, "step": 15782 }, { "epoch": 0.3, "learning_rate": 4.117373393457748e-06, "loss": 0.9085, "step": 15783 }, { "epoch": 0.3, "learning_rate": 4.117256901681991e-06, "loss": 1.1151, "step": 15784 }, { "epoch": 0.3, "learning_rate": 4.1171404038674465e-06, "loss": 0.9248, "step": 15785 }, { "epoch": 0.3, "learning_rate": 4.117023900014548e-06, "loss": 0.8819, "step": 15786 }, { "epoch": 0.3, "learning_rate": 4.116907390123733e-06, "loss": 1.0903, "step": 15787 }, { "epoch": 0.3, "learning_rate": 4.116790874195436e-06, "loss": 1.0627, "step": 15788 }, { "epoch": 0.3, "learning_rate": 4.11667435223009e-06, "loss": 0.9969, "step": 15789 }, { "epoch": 0.3, "learning_rate": 4.116557824228132e-06, "loss": 0.8636, "step": 15790 }, { "epoch": 0.3, "learning_rate": 4.116441290189996e-06, "loss": 0.9312, "step": 15791 }, { "epoch": 0.3, "learning_rate": 4.116324750116119e-06, "loss": 0.9164, "step": 15792 }, { "epoch": 0.3, "learning_rate": 4.116208204006935e-06, "loss": 0.9595, "step": 15793 }, { "epoch": 0.3, "learning_rate": 4.116091651862878e-06, "loss": 0.8999, "step": 15794 }, { "epoch": 0.3, "learning_rate": 4.115975093684385e-06, "loss": 0.9265, "step": 15795 }, { "epoch": 0.3, "learning_rate": 4.115858529471891e-06, "loss": 0.7937, "step": 15796 }, { "epoch": 0.3, "learning_rate": 4.11574195922583e-06, "loss": 0.8404, "step": 15797 }, { "epoch": 0.3, "learning_rate": 4.115625382946638e-06, "loss": 0.769, "step": 15798 }, { "epoch": 0.3, "learning_rate": 4.115508800634751e-06, "loss": 1.0247, "step": 15799 }, { "epoch": 0.3, "learning_rate": 4.115392212290603e-06, "loss": 0.9186, "step": 15800 }, { "epoch": 0.3, "learning_rate": 4.115275617914631e-06, "loss": 1.0871, "step": 15801 }, { "epoch": 0.3, "learning_rate": 4.1151590175072684e-06, "loss": 0.8684, "step": 15802 }, { "epoch": 0.3, "learning_rate": 4.115042411068952e-06, "loss": 1.0276, "step": 15803 }, { "epoch": 0.3, "learning_rate": 4.114925798600117e-06, "loss": 0.8419, "step": 15804 }, { "epoch": 0.3, "learning_rate": 4.114809180101198e-06, "loss": 0.8896, "step": 15805 }, { "epoch": 0.3, "learning_rate": 4.1146925555726315e-06, "loss": 1.1575, "step": 15806 }, { "epoch": 0.3, "learning_rate": 4.114575925014851e-06, "loss": 1.1049, "step": 15807 }, { "epoch": 0.3, "learning_rate": 4.114459288428296e-06, "loss": 0.8527, "step": 15808 }, { "epoch": 0.3, "learning_rate": 4.114342645813397e-06, "loss": 0.9349, "step": 15809 }, { "epoch": 0.3, "learning_rate": 4.114225997170595e-06, "loss": 0.8221, "step": 15810 }, { "epoch": 0.3, "learning_rate": 4.114109342500321e-06, "loss": 1.0223, "step": 15811 }, { "epoch": 0.3, "learning_rate": 4.113992681803011e-06, "loss": 1.269, "step": 15812 }, { "epoch": 0.3, "learning_rate": 4.113876015079103e-06, "loss": 1.1252, "step": 15813 }, { "epoch": 0.3, "learning_rate": 4.113759342329032e-06, "loss": 0.957, "step": 15814 }, { "epoch": 0.3, "learning_rate": 4.113642663553232e-06, "loss": 1.0159, "step": 15815 }, { "epoch": 0.3, "learning_rate": 4.11352597875214e-06, "loss": 1.0319, "step": 15816 }, { "epoch": 0.3, "learning_rate": 4.113409287926192e-06, "loss": 0.8511, "step": 15817 }, { "epoch": 0.3, "learning_rate": 4.113292591075823e-06, "loss": 0.9397, "step": 15818 }, { "epoch": 0.3, "learning_rate": 4.113175888201469e-06, "loss": 1.2556, "step": 15819 }, { "epoch": 0.3, "learning_rate": 4.1130591793035655e-06, "loss": 0.9655, "step": 15820 }, { "epoch": 0.3, "learning_rate": 4.112942464382549e-06, "loss": 0.9617, "step": 15821 }, { "epoch": 0.3, "learning_rate": 4.112825743438854e-06, "loss": 0.8085, "step": 15822 }, { "epoch": 0.3, "learning_rate": 4.112709016472917e-06, "loss": 0.8536, "step": 15823 }, { "epoch": 0.3, "learning_rate": 4.112592283485175e-06, "loss": 1.0443, "step": 15824 }, { "epoch": 0.3, "learning_rate": 4.112475544476062e-06, "loss": 1.024, "step": 15825 }, { "epoch": 0.3, "learning_rate": 4.112358799446015e-06, "loss": 0.872, "step": 15826 }, { "epoch": 0.3, "learning_rate": 4.11224204839547e-06, "loss": 0.9536, "step": 15827 }, { "epoch": 0.3, "learning_rate": 4.112125291324862e-06, "loss": 1.0027, "step": 15828 }, { "epoch": 0.3, "learning_rate": 4.112008528234628e-06, "loss": 0.8311, "step": 15829 }, { "epoch": 0.3, "learning_rate": 4.111891759125204e-06, "loss": 1.0353, "step": 15830 }, { "epoch": 0.3, "learning_rate": 4.1117749839970244e-06, "loss": 0.9585, "step": 15831 }, { "epoch": 0.3, "learning_rate": 4.1116582028505275e-06, "loss": 0.8769, "step": 15832 }, { "epoch": 0.3, "learning_rate": 4.111541415686148e-06, "loss": 0.7455, "step": 15833 }, { "epoch": 0.3, "learning_rate": 4.111424622504322e-06, "loss": 0.9926, "step": 15834 }, { "epoch": 0.3, "learning_rate": 4.111307823305486e-06, "loss": 0.9847, "step": 15835 }, { "epoch": 0.3, "learning_rate": 4.111191018090076e-06, "loss": 0.7176, "step": 15836 }, { "epoch": 0.3, "learning_rate": 4.111074206858528e-06, "loss": 1.0235, "step": 15837 }, { "epoch": 0.3, "learning_rate": 4.110957389611279e-06, "loss": 1.0604, "step": 15838 }, { "epoch": 0.3, "learning_rate": 4.110840566348764e-06, "loss": 0.9559, "step": 15839 }, { "epoch": 0.3, "learning_rate": 4.11072373707142e-06, "loss": 0.8739, "step": 15840 }, { "epoch": 0.3, "learning_rate": 4.110606901779682e-06, "loss": 1.0151, "step": 15841 }, { "epoch": 0.3, "learning_rate": 4.1104900604739884e-06, "loss": 0.8678, "step": 15842 }, { "epoch": 0.3, "learning_rate": 4.110373213154774e-06, "loss": 1.1984, "step": 15843 }, { "epoch": 0.3, "learning_rate": 4.110256359822474e-06, "loss": 1.1497, "step": 15844 }, { "epoch": 0.3, "learning_rate": 4.110139500477528e-06, "loss": 0.8602, "step": 15845 }, { "epoch": 0.3, "learning_rate": 4.11002263512037e-06, "loss": 0.8835, "step": 15846 }, { "epoch": 0.3, "learning_rate": 4.109905763751436e-06, "loss": 0.9739, "step": 15847 }, { "epoch": 0.3, "learning_rate": 4.1097888863711645e-06, "loss": 0.8951, "step": 15848 }, { "epoch": 0.3, "learning_rate": 4.10967200297999e-06, "loss": 1.0912, "step": 15849 }, { "epoch": 0.3, "learning_rate": 4.1095551135783496e-06, "loss": 1.2305, "step": 15850 }, { "epoch": 0.3, "learning_rate": 4.1094382181666795e-06, "loss": 1.0636, "step": 15851 }, { "epoch": 0.3, "learning_rate": 4.109321316745416e-06, "loss": 0.8152, "step": 15852 }, { "epoch": 0.3, "learning_rate": 4.109204409314998e-06, "loss": 0.812, "step": 15853 }, { "epoch": 0.3, "learning_rate": 4.109087495875858e-06, "loss": 0.8864, "step": 15854 }, { "epoch": 0.3, "learning_rate": 4.108970576428435e-06, "loss": 1.0563, "step": 15855 }, { "epoch": 0.3, "learning_rate": 4.108853650973166e-06, "loss": 1.1396, "step": 15856 }, { "epoch": 0.3, "learning_rate": 4.1087367195104865e-06, "loss": 0.9418, "step": 15857 }, { "epoch": 0.3, "learning_rate": 4.108619782040834e-06, "loss": 0.807, "step": 15858 }, { "epoch": 0.3, "learning_rate": 4.108502838564643e-06, "loss": 0.9509, "step": 15859 }, { "epoch": 0.3, "learning_rate": 4.108385889082353e-06, "loss": 1.0682, "step": 15860 }, { "epoch": 0.3, "learning_rate": 4.108268933594399e-06, "loss": 1.0499, "step": 15861 }, { "epoch": 0.3, "learning_rate": 4.1081519721012185e-06, "loss": 1.063, "step": 15862 }, { "epoch": 0.3, "learning_rate": 4.1080350046032465e-06, "loss": 0.9181, "step": 15863 }, { "epoch": 0.3, "learning_rate": 4.107918031100922e-06, "loss": 0.5775, "step": 15864 }, { "epoch": 0.3, "learning_rate": 4.107801051594682e-06, "loss": 0.9107, "step": 15865 }, { "epoch": 0.3, "learning_rate": 4.10768406608496e-06, "loss": 0.6564, "step": 15866 }, { "epoch": 0.3, "learning_rate": 4.107567074572197e-06, "loss": 0.8214, "step": 15867 }, { "epoch": 0.3, "learning_rate": 4.107450077056827e-06, "loss": 1.4427, "step": 15868 }, { "epoch": 0.3, "learning_rate": 4.107333073539288e-06, "loss": 0.9704, "step": 15869 }, { "epoch": 0.3, "learning_rate": 4.1072160640200155e-06, "loss": 0.8407, "step": 15870 }, { "epoch": 0.3, "learning_rate": 4.107099048499449e-06, "loss": 0.8902, "step": 15871 }, { "epoch": 0.3, "learning_rate": 4.106982026978023e-06, "loss": 1.054, "step": 15872 }, { "epoch": 0.3, "learning_rate": 4.106864999456175e-06, "loss": 0.9158, "step": 15873 }, { "epoch": 0.3, "learning_rate": 4.106747965934344e-06, "loss": 1.1835, "step": 15874 }, { "epoch": 0.3, "learning_rate": 4.106630926412964e-06, "loss": 0.9575, "step": 15875 }, { "epoch": 0.3, "learning_rate": 4.106513880892473e-06, "loss": 0.9124, "step": 15876 }, { "epoch": 0.3, "learning_rate": 4.106396829373309e-06, "loss": 0.8792, "step": 15877 }, { "epoch": 0.3, "learning_rate": 4.1062797718559085e-06, "loss": 0.973, "step": 15878 }, { "epoch": 0.3, "learning_rate": 4.106162708340708e-06, "loss": 0.7239, "step": 15879 }, { "epoch": 0.3, "learning_rate": 4.1060456388281466e-06, "loss": 1.1092, "step": 15880 }, { "epoch": 0.3, "learning_rate": 4.105928563318659e-06, "loss": 1.0072, "step": 15881 }, { "epoch": 0.3, "learning_rate": 4.105811481812683e-06, "loss": 0.8331, "step": 15882 }, { "epoch": 0.3, "learning_rate": 4.105694394310658e-06, "loss": 0.8532, "step": 15883 }, { "epoch": 0.3, "learning_rate": 4.105577300813017e-06, "loss": 0.8925, "step": 15884 }, { "epoch": 0.3, "learning_rate": 4.105460201320202e-06, "loss": 0.6978, "step": 15885 }, { "epoch": 0.3, "learning_rate": 4.105343095832646e-06, "loss": 0.8586, "step": 15886 }, { "epoch": 0.3, "learning_rate": 4.105225984350789e-06, "loss": 1.1548, "step": 15887 }, { "epoch": 0.3, "learning_rate": 4.105108866875067e-06, "loss": 0.9857, "step": 15888 }, { "epoch": 0.3, "learning_rate": 4.1049917434059176e-06, "loss": 0.8591, "step": 15889 }, { "epoch": 0.3, "learning_rate": 4.104874613943778e-06, "loss": 0.9875, "step": 15890 }, { "epoch": 0.3, "learning_rate": 4.104757478489086e-06, "loss": 0.8293, "step": 15891 }, { "epoch": 0.3, "learning_rate": 4.104640337042279e-06, "loss": 0.8298, "step": 15892 }, { "epoch": 0.3, "learning_rate": 4.104523189603795e-06, "loss": 1.1633, "step": 15893 }, { "epoch": 0.3, "learning_rate": 4.104406036174069e-06, "loss": 0.7772, "step": 15894 }, { "epoch": 0.3, "learning_rate": 4.104288876753541e-06, "loss": 1.0295, "step": 15895 }, { "epoch": 0.3, "learning_rate": 4.104171711342648e-06, "loss": 0.9219, "step": 15896 }, { "epoch": 0.3, "learning_rate": 4.104054539941827e-06, "loss": 0.7472, "step": 15897 }, { "epoch": 0.3, "learning_rate": 4.103937362551515e-06, "loss": 1.0927, "step": 15898 }, { "epoch": 0.3, "learning_rate": 4.1038201791721485e-06, "loss": 0.9117, "step": 15899 }, { "epoch": 0.3, "learning_rate": 4.103702989804169e-06, "loss": 0.9308, "step": 15900 }, { "epoch": 0.3, "learning_rate": 4.103585794448011e-06, "loss": 1.0585, "step": 15901 }, { "epoch": 0.3, "learning_rate": 4.103468593104112e-06, "loss": 0.8231, "step": 15902 }, { "epoch": 0.3, "learning_rate": 4.103351385772911e-06, "loss": 0.9723, "step": 15903 }, { "epoch": 0.3, "learning_rate": 4.1032341724548455e-06, "loss": 0.97, "step": 15904 }, { "epoch": 0.3, "learning_rate": 4.103116953150352e-06, "loss": 0.986, "step": 15905 }, { "epoch": 0.3, "learning_rate": 4.10299972785987e-06, "loss": 1.0542, "step": 15906 }, { "epoch": 0.3, "learning_rate": 4.1028824965838346e-06, "loss": 0.9384, "step": 15907 }, { "epoch": 0.3, "learning_rate": 4.102765259322687e-06, "loss": 1.0018, "step": 15908 }, { "epoch": 0.3, "learning_rate": 4.1026480160768615e-06, "loss": 0.8355, "step": 15909 }, { "epoch": 0.3, "learning_rate": 4.1025307668467984e-06, "loss": 0.8115, "step": 15910 }, { "epoch": 0.3, "learning_rate": 4.102413511632933e-06, "loss": 1.0714, "step": 15911 }, { "epoch": 0.3, "learning_rate": 4.102296250435706e-06, "loss": 1.0766, "step": 15912 }, { "epoch": 0.3, "learning_rate": 4.102178983255555e-06, "loss": 1.0748, "step": 15913 }, { "epoch": 0.3, "learning_rate": 4.102061710092915e-06, "loss": 1.0063, "step": 15914 }, { "epoch": 0.3, "learning_rate": 4.1019444309482255e-06, "loss": 0.9849, "step": 15915 }, { "epoch": 0.3, "learning_rate": 4.101827145821926e-06, "loss": 0.9167, "step": 15916 }, { "epoch": 0.3, "learning_rate": 4.101709854714452e-06, "loss": 0.9559, "step": 15917 }, { "epoch": 0.3, "learning_rate": 4.1015925576262435e-06, "loss": 1.144, "step": 15918 }, { "epoch": 0.3, "learning_rate": 4.101475254557737e-06, "loss": 0.9663, "step": 15919 }, { "epoch": 0.3, "learning_rate": 4.101357945509371e-06, "loss": 0.8368, "step": 15920 }, { "epoch": 0.3, "learning_rate": 4.101240630481583e-06, "loss": 0.9111, "step": 15921 }, { "epoch": 0.3, "learning_rate": 4.101123309474813e-06, "loss": 0.9234, "step": 15922 }, { "epoch": 0.3, "learning_rate": 4.101005982489496e-06, "loss": 1.006, "step": 15923 }, { "epoch": 0.3, "learning_rate": 4.1008886495260725e-06, "loss": 1.1456, "step": 15924 }, { "epoch": 0.3, "learning_rate": 4.10077131058498e-06, "loss": 1.1424, "step": 15925 }, { "epoch": 0.3, "learning_rate": 4.100653965666656e-06, "loss": 0.8929, "step": 15926 }, { "epoch": 0.3, "learning_rate": 4.1005366147715394e-06, "loss": 0.8981, "step": 15927 }, { "epoch": 0.3, "learning_rate": 4.100419257900069e-06, "loss": 0.7874, "step": 15928 }, { "epoch": 0.3, "learning_rate": 4.1003018950526805e-06, "loss": 0.9389, "step": 15929 }, { "epoch": 0.3, "learning_rate": 4.100184526229815e-06, "loss": 0.9785, "step": 15930 }, { "epoch": 0.3, "learning_rate": 4.100067151431909e-06, "loss": 0.992, "step": 15931 }, { "epoch": 0.3, "learning_rate": 4.099949770659402e-06, "loss": 1.0201, "step": 15932 }, { "epoch": 0.3, "learning_rate": 4.099832383912731e-06, "loss": 0.8398, "step": 15933 }, { "epoch": 0.3, "learning_rate": 4.099714991192335e-06, "loss": 1.0425, "step": 15934 }, { "epoch": 0.3, "learning_rate": 4.099597592498653e-06, "loss": 0.6587, "step": 15935 }, { "epoch": 0.3, "learning_rate": 4.0994801878321215e-06, "loss": 0.8963, "step": 15936 }, { "epoch": 0.3, "learning_rate": 4.09936277719318e-06, "loss": 0.9012, "step": 15937 }, { "epoch": 0.3, "learning_rate": 4.099245360582268e-06, "loss": 0.9379, "step": 15938 }, { "epoch": 0.3, "learning_rate": 4.099127937999822e-06, "loss": 0.7152, "step": 15939 }, { "epoch": 0.3, "learning_rate": 4.099010509446282e-06, "loss": 0.9714, "step": 15940 }, { "epoch": 0.3, "learning_rate": 4.098893074922085e-06, "loss": 0.865, "step": 15941 }, { "epoch": 0.3, "learning_rate": 4.098775634427671e-06, "loss": 0.9752, "step": 15942 }, { "epoch": 0.3, "learning_rate": 4.098658187963477e-06, "loss": 0.9885, "step": 15943 }, { "epoch": 0.3, "learning_rate": 4.0985407355299435e-06, "loss": 0.9113, "step": 15944 }, { "epoch": 0.3, "learning_rate": 4.0984232771275065e-06, "loss": 0.8111, "step": 15945 }, { "epoch": 0.3, "learning_rate": 4.098305812756607e-06, "loss": 0.8089, "step": 15946 }, { "epoch": 0.3, "learning_rate": 4.098188342417682e-06, "loss": 0.9423, "step": 15947 }, { "epoch": 0.3, "learning_rate": 4.098070866111172e-06, "loss": 0.9216, "step": 15948 }, { "epoch": 0.3, "learning_rate": 4.097953383837513e-06, "loss": 1.234, "step": 15949 }, { "epoch": 0.3, "learning_rate": 4.097835895597145e-06, "loss": 0.8597, "step": 15950 }, { "epoch": 0.3, "learning_rate": 4.097718401390508e-06, "loss": 1.0302, "step": 15951 }, { "epoch": 0.3, "learning_rate": 4.097600901218038e-06, "loss": 0.9843, "step": 15952 }, { "epoch": 0.3, "learning_rate": 4.097483395080176e-06, "loss": 0.7946, "step": 15953 }, { "epoch": 0.3, "learning_rate": 4.0973658829773605e-06, "loss": 1.2203, "step": 15954 }, { "epoch": 0.3, "learning_rate": 4.097248364910029e-06, "loss": 1.1017, "step": 15955 }, { "epoch": 0.3, "learning_rate": 4.0971308408786215e-06, "loss": 0.9109, "step": 15956 }, { "epoch": 0.3, "learning_rate": 4.097013310883577e-06, "loss": 1.0435, "step": 15957 }, { "epoch": 0.3, "learning_rate": 4.0968957749253325e-06, "loss": 1.0383, "step": 15958 }, { "epoch": 0.3, "learning_rate": 4.096778233004328e-06, "loss": 0.9471, "step": 15959 }, { "epoch": 0.3, "learning_rate": 4.096660685121003e-06, "loss": 0.9982, "step": 15960 }, { "epoch": 0.3, "learning_rate": 4.096543131275796e-06, "loss": 0.8847, "step": 15961 }, { "epoch": 0.3, "learning_rate": 4.096425571469146e-06, "loss": 1.0219, "step": 15962 }, { "epoch": 0.3, "learning_rate": 4.0963080057014926e-06, "loss": 0.9926, "step": 15963 }, { "epoch": 0.3, "learning_rate": 4.096190433973272e-06, "loss": 0.7963, "step": 15964 }, { "epoch": 0.3, "learning_rate": 4.096072856284927e-06, "loss": 1.1032, "step": 15965 }, { "epoch": 0.3, "learning_rate": 4.095955272636895e-06, "loss": 0.9415, "step": 15966 }, { "epoch": 0.3, "learning_rate": 4.095837683029614e-06, "loss": 0.883, "step": 15967 }, { "epoch": 0.3, "learning_rate": 4.095720087463525e-06, "loss": 1.0585, "step": 15968 }, { "epoch": 0.3, "learning_rate": 4.0956024859390654e-06, "loss": 0.8767, "step": 15969 }, { "epoch": 0.3, "learning_rate": 4.095484878456675e-06, "loss": 0.9569, "step": 15970 }, { "epoch": 0.3, "learning_rate": 4.095367265016793e-06, "loss": 0.9819, "step": 15971 }, { "epoch": 0.3, "learning_rate": 4.0952496456198585e-06, "loss": 0.6981, "step": 15972 }, { "epoch": 0.3, "learning_rate": 4.095132020266311e-06, "loss": 0.9366, "step": 15973 }, { "epoch": 0.3, "learning_rate": 4.09501438895659e-06, "loss": 0.9696, "step": 15974 }, { "epoch": 0.3, "learning_rate": 4.094896751691133e-06, "loss": 1.0922, "step": 15975 }, { "epoch": 0.3, "learning_rate": 4.094779108470381e-06, "loss": 0.7782, "step": 15976 }, { "epoch": 0.3, "learning_rate": 4.094661459294773e-06, "loss": 0.8918, "step": 15977 }, { "epoch": 0.3, "learning_rate": 4.0945438041647475e-06, "loss": 0.8953, "step": 15978 }, { "epoch": 0.3, "learning_rate": 4.094426143080745e-06, "loss": 0.9136, "step": 15979 }, { "epoch": 0.3, "learning_rate": 4.0943084760432035e-06, "loss": 1.2091, "step": 15980 }, { "epoch": 0.3, "learning_rate": 4.094190803052564e-06, "loss": 1.1953, "step": 15981 }, { "epoch": 0.3, "learning_rate": 4.094073124109264e-06, "loss": 0.9799, "step": 15982 }, { "epoch": 0.3, "learning_rate": 4.093955439213743e-06, "loss": 1.0679, "step": 15983 }, { "epoch": 0.3, "learning_rate": 4.093837748366442e-06, "loss": 0.88, "step": 15984 }, { "epoch": 0.3, "learning_rate": 4.0937200515678e-06, "loss": 0.9893, "step": 15985 }, { "epoch": 0.3, "learning_rate": 4.093602348818256e-06, "loss": 0.9148, "step": 15986 }, { "epoch": 0.3, "learning_rate": 4.09348464011825e-06, "loss": 0.967, "step": 15987 }, { "epoch": 0.3, "learning_rate": 4.093366925468222e-06, "loss": 1.0142, "step": 15988 }, { "epoch": 0.3, "learning_rate": 4.093249204868609e-06, "loss": 0.877, "step": 15989 }, { "epoch": 0.3, "learning_rate": 4.093131478319854e-06, "loss": 0.9064, "step": 15990 }, { "epoch": 0.3, "learning_rate": 4.093013745822393e-06, "loss": 0.9164, "step": 15991 }, { "epoch": 0.3, "learning_rate": 4.092896007376669e-06, "loss": 1.0695, "step": 15992 }, { "epoch": 0.3, "learning_rate": 4.09277826298312e-06, "loss": 0.9952, "step": 15993 }, { "epoch": 0.3, "learning_rate": 4.092660512642185e-06, "loss": 0.9573, "step": 15994 }, { "epoch": 0.3, "learning_rate": 4.092542756354305e-06, "loss": 0.9149, "step": 15995 }, { "epoch": 0.3, "learning_rate": 4.092424994119919e-06, "loss": 0.9806, "step": 15996 }, { "epoch": 0.3, "learning_rate": 4.092307225939467e-06, "loss": 0.8779, "step": 15997 }, { "epoch": 0.3, "learning_rate": 4.092189451813388e-06, "loss": 1.0478, "step": 15998 }, { "epoch": 0.3, "learning_rate": 4.092071671742124e-06, "loss": 1.0336, "step": 15999 }, { "epoch": 0.3, "learning_rate": 4.0919538857261125e-06, "loss": 1.1754, "step": 16000 }, { "epoch": 0.3, "learning_rate": 4.091836093765794e-06, "loss": 1.0289, "step": 16001 }, { "epoch": 0.3, "learning_rate": 4.091718295861607e-06, "loss": 0.8622, "step": 16002 }, { "epoch": 0.3, "learning_rate": 4.091600492013994e-06, "loss": 1.0651, "step": 16003 }, { "epoch": 0.3, "learning_rate": 4.091482682223394e-06, "loss": 0.9093, "step": 16004 }, { "epoch": 0.3, "learning_rate": 4.091364866490246e-06, "loss": 0.9371, "step": 16005 }, { "epoch": 0.3, "learning_rate": 4.0912470448149896e-06, "loss": 1.3779, "step": 16006 }, { "epoch": 0.3, "learning_rate": 4.091129217198067e-06, "loss": 0.9539, "step": 16007 }, { "epoch": 0.3, "learning_rate": 4.091011383639915e-06, "loss": 1.1263, "step": 16008 }, { "epoch": 0.3, "learning_rate": 4.0908935441409755e-06, "loss": 0.9732, "step": 16009 }, { "epoch": 0.3, "learning_rate": 4.090775698701689e-06, "loss": 0.8088, "step": 16010 }, { "epoch": 0.3, "learning_rate": 4.090657847322496e-06, "loss": 0.8694, "step": 16011 }, { "epoch": 0.3, "learning_rate": 4.090539990003833e-06, "loss": 1.0321, "step": 16012 }, { "epoch": 0.3, "learning_rate": 4.090422126746144e-06, "loss": 1.0416, "step": 16013 }, { "epoch": 0.3, "learning_rate": 4.090304257549868e-06, "loss": 1.0419, "step": 16014 }, { "epoch": 0.3, "learning_rate": 4.090186382415443e-06, "loss": 0.8571, "step": 16015 }, { "epoch": 0.3, "learning_rate": 4.090068501343311e-06, "loss": 0.8208, "step": 16016 }, { "epoch": 0.3, "learning_rate": 4.089950614333913e-06, "loss": 0.9473, "step": 16017 }, { "epoch": 0.3, "learning_rate": 4.089832721387688e-06, "loss": 0.9757, "step": 16018 }, { "epoch": 0.3, "learning_rate": 4.089714822505075e-06, "loss": 0.9772, "step": 16019 }, { "epoch": 0.3, "learning_rate": 4.089596917686517e-06, "loss": 1.0197, "step": 16020 }, { "epoch": 0.3, "learning_rate": 4.089479006932453e-06, "loss": 0.8953, "step": 16021 }, { "epoch": 0.3, "learning_rate": 4.089361090243322e-06, "loss": 0.9698, "step": 16022 }, { "epoch": 0.3, "learning_rate": 4.089243167619566e-06, "loss": 0.8751, "step": 16023 }, { "epoch": 0.3, "learning_rate": 4.089125239061624e-06, "loss": 0.8877, "step": 16024 }, { "epoch": 0.3, "learning_rate": 4.089007304569938e-06, "loss": 1.3423, "step": 16025 }, { "epoch": 0.3, "learning_rate": 4.0888893641449476e-06, "loss": 1.0149, "step": 16026 }, { "epoch": 0.3, "learning_rate": 4.088771417787093e-06, "loss": 0.9379, "step": 16027 }, { "epoch": 0.3, "learning_rate": 4.088653465496815e-06, "loss": 0.9359, "step": 16028 }, { "epoch": 0.3, "learning_rate": 4.088535507274552e-06, "loss": 0.7665, "step": 16029 }, { "epoch": 0.3, "learning_rate": 4.088417543120747e-06, "loss": 0.9631, "step": 16030 }, { "epoch": 0.3, "learning_rate": 4.08829957303584e-06, "loss": 1.0748, "step": 16031 }, { "epoch": 0.3, "learning_rate": 4.088181597020271e-06, "loss": 0.9819, "step": 16032 }, { "epoch": 0.3, "learning_rate": 4.08806361507448e-06, "loss": 0.9559, "step": 16033 }, { "epoch": 0.3, "learning_rate": 4.087945627198909e-06, "loss": 0.9815, "step": 16034 }, { "epoch": 0.3, "learning_rate": 4.087827633393997e-06, "loss": 0.9192, "step": 16035 }, { "epoch": 0.3, "learning_rate": 4.0877096336601855e-06, "loss": 1.0248, "step": 16036 }, { "epoch": 0.3, "learning_rate": 4.087591627997915e-06, "loss": 1.249, "step": 16037 }, { "epoch": 0.3, "learning_rate": 4.0874736164076255e-06, "loss": 1.1055, "step": 16038 }, { "epoch": 0.3, "learning_rate": 4.08735559888976e-06, "loss": 1.0449, "step": 16039 }, { "epoch": 0.3, "learning_rate": 4.087237575444756e-06, "loss": 0.806, "step": 16040 }, { "epoch": 0.3, "learning_rate": 4.087119546073055e-06, "loss": 0.7223, "step": 16041 }, { "epoch": 0.3, "learning_rate": 4.0870015107750984e-06, "loss": 1.0252, "step": 16042 }, { "epoch": 0.3, "learning_rate": 4.0868834695513285e-06, "loss": 1.3564, "step": 16043 }, { "epoch": 0.3, "learning_rate": 4.086765422402183e-06, "loss": 0.9255, "step": 16044 }, { "epoch": 0.3, "learning_rate": 4.086647369328104e-06, "loss": 0.8733, "step": 16045 }, { "epoch": 0.3, "learning_rate": 4.086529310329533e-06, "loss": 0.6199, "step": 16046 }, { "epoch": 0.3, "learning_rate": 4.086411245406909e-06, "loss": 0.9432, "step": 16047 }, { "epoch": 0.3, "learning_rate": 4.086293174560675e-06, "loss": 0.9872, "step": 16048 }, { "epoch": 0.3, "learning_rate": 4.086175097791271e-06, "loss": 0.9569, "step": 16049 }, { "epoch": 0.3, "learning_rate": 4.086057015099138e-06, "loss": 1.1761, "step": 16050 }, { "epoch": 0.3, "learning_rate": 4.085938926484716e-06, "loss": 0.9384, "step": 16051 }, { "epoch": 0.3, "learning_rate": 4.085820831948447e-06, "loss": 1.0628, "step": 16052 }, { "epoch": 0.3, "learning_rate": 4.085702731490771e-06, "loss": 0.9163, "step": 16053 }, { "epoch": 0.3, "learning_rate": 4.085584625112131e-06, "loss": 0.9817, "step": 16054 }, { "epoch": 0.3, "learning_rate": 4.085466512812966e-06, "loss": 1.1523, "step": 16055 }, { "epoch": 0.3, "learning_rate": 4.085348394593718e-06, "loss": 1.0243, "step": 16056 }, { "epoch": 0.3, "learning_rate": 4.085230270454826e-06, "loss": 0.9174, "step": 16057 }, { "epoch": 0.3, "learning_rate": 4.085112140396735e-06, "loss": 0.8893, "step": 16058 }, { "epoch": 0.3, "learning_rate": 4.084994004419882e-06, "loss": 0.7539, "step": 16059 }, { "epoch": 0.3, "learning_rate": 4.084875862524712e-06, "loss": 0.7681, "step": 16060 }, { "epoch": 0.3, "learning_rate": 4.084757714711663e-06, "loss": 0.8996, "step": 16061 }, { "epoch": 0.3, "learning_rate": 4.084639560981177e-06, "loss": 1.1038, "step": 16062 }, { "epoch": 0.3, "learning_rate": 4.084521401333695e-06, "loss": 0.9164, "step": 16063 }, { "epoch": 0.3, "learning_rate": 4.08440323576966e-06, "loss": 1.1257, "step": 16064 }, { "epoch": 0.3, "learning_rate": 4.084285064289512e-06, "loss": 0.9206, "step": 16065 }, { "epoch": 0.3, "learning_rate": 4.084166886893691e-06, "loss": 0.9595, "step": 16066 }, { "epoch": 0.3, "learning_rate": 4.08404870358264e-06, "loss": 0.758, "step": 16067 }, { "epoch": 0.3, "learning_rate": 4.083930514356799e-06, "loss": 1.1547, "step": 16068 }, { "epoch": 0.3, "learning_rate": 4.083812319216611e-06, "loss": 0.782, "step": 16069 }, { "epoch": 0.3, "learning_rate": 4.083694118162516e-06, "loss": 1.1649, "step": 16070 }, { "epoch": 0.3, "learning_rate": 4.083575911194955e-06, "loss": 0.9722, "step": 16071 }, { "epoch": 0.3, "learning_rate": 4.083457698314372e-06, "loss": 0.8165, "step": 16072 }, { "epoch": 0.3, "learning_rate": 4.083339479521205e-06, "loss": 1.3618, "step": 16073 }, { "epoch": 0.3, "learning_rate": 4.083221254815897e-06, "loss": 1.1406, "step": 16074 }, { "epoch": 0.3, "learning_rate": 4.083103024198889e-06, "loss": 1.1374, "step": 16075 }, { "epoch": 0.3, "learning_rate": 4.0829847876706245e-06, "loss": 0.7209, "step": 16076 }, { "epoch": 0.3, "learning_rate": 4.082866545231542e-06, "loss": 0.7637, "step": 16077 }, { "epoch": 0.3, "learning_rate": 4.082748296882085e-06, "loss": 1.1232, "step": 16078 }, { "epoch": 0.3, "learning_rate": 4.082630042622694e-06, "loss": 0.9202, "step": 16079 }, { "epoch": 0.3, "learning_rate": 4.082511782453811e-06, "loss": 1.054, "step": 16080 }, { "epoch": 0.3, "learning_rate": 4.0823935163758775e-06, "loss": 1.1237, "step": 16081 }, { "epoch": 0.3, "learning_rate": 4.0822752443893356e-06, "loss": 0.9836, "step": 16082 }, { "epoch": 0.3, "learning_rate": 4.082156966494625e-06, "loss": 0.9805, "step": 16083 }, { "epoch": 0.3, "learning_rate": 4.08203868269219e-06, "loss": 0.9152, "step": 16084 }, { "epoch": 0.3, "learning_rate": 4.081920392982471e-06, "loss": 0.9142, "step": 16085 }, { "epoch": 0.3, "learning_rate": 4.08180209736591e-06, "loss": 0.8002, "step": 16086 }, { "epoch": 0.3, "learning_rate": 4.081683795842948e-06, "loss": 0.9552, "step": 16087 }, { "epoch": 0.3, "learning_rate": 4.081565488414027e-06, "loss": 0.8909, "step": 16088 }, { "epoch": 0.3, "learning_rate": 4.081447175079589e-06, "loss": 0.8485, "step": 16089 }, { "epoch": 0.3, "learning_rate": 4.081328855840076e-06, "loss": 0.7486, "step": 16090 }, { "epoch": 0.3, "learning_rate": 4.08121053069593e-06, "loss": 0.9444, "step": 16091 }, { "epoch": 0.3, "learning_rate": 4.081092199647591e-06, "loss": 0.9929, "step": 16092 }, { "epoch": 0.3, "learning_rate": 4.080973862695503e-06, "loss": 0.834, "step": 16093 }, { "epoch": 0.3, "learning_rate": 4.080855519840108e-06, "loss": 0.9319, "step": 16094 }, { "epoch": 0.3, "learning_rate": 4.080737171081846e-06, "loss": 0.8481, "step": 16095 }, { "epoch": 0.3, "learning_rate": 4.08061881642116e-06, "loss": 0.7516, "step": 16096 }, { "epoch": 0.3, "learning_rate": 4.080500455858491e-06, "loss": 0.8791, "step": 16097 }, { "epoch": 0.3, "learning_rate": 4.080382089394283e-06, "loss": 0.8582, "step": 16098 }, { "epoch": 0.3, "learning_rate": 4.080263717028976e-06, "loss": 0.8798, "step": 16099 }, { "epoch": 0.3, "learning_rate": 4.080145338763013e-06, "loss": 1.0253, "step": 16100 }, { "epoch": 0.3, "learning_rate": 4.080026954596836e-06, "loss": 1.0793, "step": 16101 }, { "epoch": 0.3, "learning_rate": 4.079908564530887e-06, "loss": 0.6833, "step": 16102 }, { "epoch": 0.3, "learning_rate": 4.079790168565607e-06, "loss": 0.8369, "step": 16103 }, { "epoch": 0.3, "learning_rate": 4.079671766701439e-06, "loss": 1.0724, "step": 16104 }, { "epoch": 0.3, "learning_rate": 4.079553358938826e-06, "loss": 0.9928, "step": 16105 }, { "epoch": 0.3, "learning_rate": 4.079434945278209e-06, "loss": 1.1183, "step": 16106 }, { "epoch": 0.3, "learning_rate": 4.0793165257200294e-06, "loss": 1.0496, "step": 16107 }, { "epoch": 0.3, "learning_rate": 4.079198100264731e-06, "loss": 0.9128, "step": 16108 }, { "epoch": 0.3, "learning_rate": 4.079079668912755e-06, "loss": 0.938, "step": 16109 }, { "epoch": 0.3, "learning_rate": 4.078961231664545e-06, "loss": 0.8536, "step": 16110 }, { "epoch": 0.3, "learning_rate": 4.07884278852054e-06, "loss": 0.7906, "step": 16111 }, { "epoch": 0.3, "learning_rate": 4.078724339481187e-06, "loss": 1.0859, "step": 16112 }, { "epoch": 0.3, "learning_rate": 4.078605884546923e-06, "loss": 1.093, "step": 16113 }, { "epoch": 0.3, "learning_rate": 4.078487423718195e-06, "loss": 1.0319, "step": 16114 }, { "epoch": 0.3, "learning_rate": 4.0783689569954435e-06, "loss": 0.7858, "step": 16115 }, { "epoch": 0.3, "learning_rate": 4.078250484379109e-06, "loss": 1.03, "step": 16116 }, { "epoch": 0.3, "learning_rate": 4.078132005869637e-06, "loss": 0.9144, "step": 16117 }, { "epoch": 0.3, "learning_rate": 4.078013521467469e-06, "loss": 1.2653, "step": 16118 }, { "epoch": 0.3, "learning_rate": 4.077895031173045e-06, "loss": 1.1421, "step": 16119 }, { "epoch": 0.3, "learning_rate": 4.07777653498681e-06, "loss": 0.7966, "step": 16120 }, { "epoch": 0.3, "learning_rate": 4.077658032909207e-06, "loss": 1.0921, "step": 16121 }, { "epoch": 0.3, "learning_rate": 4.077539524940676e-06, "loss": 1.1097, "step": 16122 }, { "epoch": 0.3, "learning_rate": 4.077421011081662e-06, "loss": 0.8823, "step": 16123 }, { "epoch": 0.3, "learning_rate": 4.077302491332605e-06, "loss": 0.8667, "step": 16124 }, { "epoch": 0.3, "learning_rate": 4.077183965693949e-06, "loss": 1.1275, "step": 16125 }, { "epoch": 0.3, "learning_rate": 4.077065434166136e-06, "loss": 0.8859, "step": 16126 }, { "epoch": 0.3, "learning_rate": 4.07694689674961e-06, "loss": 0.8422, "step": 16127 }, { "epoch": 0.3, "learning_rate": 4.076828353444813e-06, "loss": 0.933, "step": 16128 }, { "epoch": 0.3, "learning_rate": 4.076709804252187e-06, "loss": 0.8112, "step": 16129 }, { "epoch": 0.3, "learning_rate": 4.076591249172175e-06, "loss": 1.057, "step": 16130 }, { "epoch": 0.3, "learning_rate": 4.076472688205218e-06, "loss": 1.122, "step": 16131 }, { "epoch": 0.3, "learning_rate": 4.076354121351762e-06, "loss": 0.9883, "step": 16132 }, { "epoch": 0.3, "learning_rate": 4.076235548612248e-06, "loss": 0.9086, "step": 16133 }, { "epoch": 0.3, "learning_rate": 4.0761169699871185e-06, "loss": 0.8975, "step": 16134 }, { "epoch": 0.3, "learning_rate": 4.075998385476816e-06, "loss": 0.9754, "step": 16135 }, { "epoch": 0.3, "learning_rate": 4.075879795081784e-06, "loss": 0.9421, "step": 16136 }, { "epoch": 0.3, "learning_rate": 4.0757611988024655e-06, "loss": 1.1328, "step": 16137 }, { "epoch": 0.3, "learning_rate": 4.0756425966393035e-06, "loss": 0.8318, "step": 16138 }, { "epoch": 0.3, "learning_rate": 4.07552398859274e-06, "loss": 0.7364, "step": 16139 }, { "epoch": 0.3, "learning_rate": 4.0754053746632185e-06, "loss": 0.9691, "step": 16140 }, { "epoch": 0.3, "learning_rate": 4.075286754851181e-06, "loss": 1.0398, "step": 16141 }, { "epoch": 0.3, "learning_rate": 4.075168129157071e-06, "loss": 0.8478, "step": 16142 }, { "epoch": 0.3, "learning_rate": 4.075049497581332e-06, "loss": 0.9652, "step": 16143 }, { "epoch": 0.3, "learning_rate": 4.0749308601244066e-06, "loss": 0.9747, "step": 16144 }, { "epoch": 0.3, "learning_rate": 4.074812216786737e-06, "loss": 0.7996, "step": 16145 }, { "epoch": 0.3, "learning_rate": 4.074693567568767e-06, "loss": 0.9239, "step": 16146 }, { "epoch": 0.3, "learning_rate": 4.07457491247094e-06, "loss": 0.9521, "step": 16147 }, { "epoch": 0.3, "learning_rate": 4.074456251493698e-06, "loss": 0.8519, "step": 16148 }, { "epoch": 0.3, "learning_rate": 4.074337584637485e-06, "loss": 1.1056, "step": 16149 }, { "epoch": 0.3, "learning_rate": 4.074218911902743e-06, "loss": 1.2141, "step": 16150 }, { "epoch": 0.3, "learning_rate": 4.074100233289916e-06, "loss": 0.7658, "step": 16151 }, { "epoch": 0.3, "learning_rate": 4.073981548799447e-06, "loss": 1.112, "step": 16152 }, { "epoch": 0.3, "learning_rate": 4.073862858431781e-06, "loss": 1.0165, "step": 16153 }, { "epoch": 0.3, "learning_rate": 4.073744162187357e-06, "loss": 0.9779, "step": 16154 }, { "epoch": 0.3, "learning_rate": 4.0736254600666216e-06, "loss": 0.7829, "step": 16155 }, { "epoch": 0.3, "learning_rate": 4.073506752070017e-06, "loss": 0.8437, "step": 16156 }, { "epoch": 0.3, "learning_rate": 4.073388038197986e-06, "loss": 0.9714, "step": 16157 }, { "epoch": 0.3, "learning_rate": 4.0732693184509725e-06, "loss": 0.7064, "step": 16158 }, { "epoch": 0.3, "learning_rate": 4.07315059282942e-06, "loss": 0.957, "step": 16159 }, { "epoch": 0.3, "learning_rate": 4.073031861333771e-06, "loss": 0.7725, "step": 16160 }, { "epoch": 0.3, "learning_rate": 4.072913123964469e-06, "loss": 1.1121, "step": 16161 }, { "epoch": 0.3, "learning_rate": 4.072794380721958e-06, "loss": 1.203, "step": 16162 }, { "epoch": 0.3, "learning_rate": 4.072675631606682e-06, "loss": 0.9541, "step": 16163 }, { "epoch": 0.3, "learning_rate": 4.072556876619082e-06, "loss": 1.0318, "step": 16164 }, { "epoch": 0.3, "learning_rate": 4.072438115759603e-06, "loss": 0.8937, "step": 16165 }, { "epoch": 0.31, "learning_rate": 4.072319349028688e-06, "loss": 0.947, "step": 16166 }, { "epoch": 0.31, "learning_rate": 4.072200576426781e-06, "loss": 1.0094, "step": 16167 }, { "epoch": 0.31, "learning_rate": 4.072081797954326e-06, "loss": 1.0842, "step": 16168 }, { "epoch": 0.31, "learning_rate": 4.071963013611766e-06, "loss": 0.989, "step": 16169 }, { "epoch": 0.31, "learning_rate": 4.0718442233995435e-06, "loss": 0.8383, "step": 16170 }, { "epoch": 0.31, "learning_rate": 4.071725427318103e-06, "loss": 0.946, "step": 16171 }, { "epoch": 0.31, "learning_rate": 4.0716066253678875e-06, "loss": 0.8615, "step": 16172 }, { "epoch": 0.31, "learning_rate": 4.071487817549341e-06, "loss": 0.9743, "step": 16173 }, { "epoch": 0.31, "learning_rate": 4.071369003862908e-06, "loss": 1.2767, "step": 16174 }, { "epoch": 0.31, "learning_rate": 4.0712501843090315e-06, "loss": 1.1455, "step": 16175 }, { "epoch": 0.31, "learning_rate": 4.071131358888154e-06, "loss": 0.9523, "step": 16176 }, { "epoch": 0.31, "learning_rate": 4.071012527600721e-06, "loss": 0.9929, "step": 16177 }, { "epoch": 0.31, "learning_rate": 4.070893690447175e-06, "loss": 0.9114, "step": 16178 }, { "epoch": 0.31, "learning_rate": 4.07077484742796e-06, "loss": 1.0119, "step": 16179 }, { "epoch": 0.31, "learning_rate": 4.07065599854352e-06, "loss": 0.8589, "step": 16180 }, { "epoch": 0.31, "learning_rate": 4.070537143794298e-06, "loss": 1.2496, "step": 16181 }, { "epoch": 0.31, "learning_rate": 4.0704182831807394e-06, "loss": 0.8828, "step": 16182 }, { "epoch": 0.31, "learning_rate": 4.0702994167032875e-06, "loss": 0.9023, "step": 16183 }, { "epoch": 0.31, "learning_rate": 4.0701805443623846e-06, "loss": 0.943, "step": 16184 }, { "epoch": 0.31, "learning_rate": 4.0700616661584755e-06, "loss": 0.8079, "step": 16185 }, { "epoch": 0.31, "learning_rate": 4.069942782092006e-06, "loss": 0.9756, "step": 16186 }, { "epoch": 0.31, "learning_rate": 4.069823892163417e-06, "loss": 1.045, "step": 16187 }, { "epoch": 0.31, "learning_rate": 4.069704996373154e-06, "loss": 0.7368, "step": 16188 }, { "epoch": 0.31, "learning_rate": 4.06958609472166e-06, "loss": 0.8994, "step": 16189 }, { "epoch": 0.31, "learning_rate": 4.069467187209381e-06, "loss": 0.9308, "step": 16190 }, { "epoch": 0.31, "learning_rate": 4.069348273836758e-06, "loss": 0.812, "step": 16191 }, { "epoch": 0.31, "learning_rate": 4.069229354604238e-06, "loss": 0.9702, "step": 16192 }, { "epoch": 0.31, "learning_rate": 4.069110429512263e-06, "loss": 1.1172, "step": 16193 }, { "epoch": 0.31, "learning_rate": 4.068991498561278e-06, "loss": 0.9202, "step": 16194 }, { "epoch": 0.31, "learning_rate": 4.0688725617517265e-06, "loss": 0.8014, "step": 16195 }, { "epoch": 0.31, "learning_rate": 4.068753619084054e-06, "loss": 0.8839, "step": 16196 }, { "epoch": 0.31, "learning_rate": 4.068634670558702e-06, "loss": 0.8598, "step": 16197 }, { "epoch": 0.31, "learning_rate": 4.0685157161761176e-06, "loss": 0.827, "step": 16198 }, { "epoch": 0.31, "learning_rate": 4.068396755936743e-06, "loss": 0.8948, "step": 16199 }, { "epoch": 0.31, "learning_rate": 4.068277789841023e-06, "loss": 1.3668, "step": 16200 }, { "epoch": 0.31, "learning_rate": 4.068158817889403e-06, "loss": 1.0081, "step": 16201 }, { "epoch": 0.31, "learning_rate": 4.068039840082324e-06, "loss": 0.9753, "step": 16202 }, { "epoch": 0.31, "learning_rate": 4.067920856420233e-06, "loss": 0.8506, "step": 16203 }, { "epoch": 0.31, "learning_rate": 4.067801866903575e-06, "loss": 0.9226, "step": 16204 }, { "epoch": 0.31, "learning_rate": 4.067682871532791e-06, "loss": 0.8757, "step": 16205 }, { "epoch": 0.31, "learning_rate": 4.067563870308328e-06, "loss": 1.0957, "step": 16206 }, { "epoch": 0.31, "learning_rate": 4.067444863230629e-06, "loss": 0.838, "step": 16207 }, { "epoch": 0.31, "learning_rate": 4.06732585030014e-06, "loss": 0.9492, "step": 16208 }, { "epoch": 0.31, "learning_rate": 4.067206831517304e-06, "loss": 0.8793, "step": 16209 }, { "epoch": 0.31, "learning_rate": 4.0670878068825656e-06, "loss": 1.0789, "step": 16210 }, { "epoch": 0.31, "learning_rate": 4.0669687763963695e-06, "loss": 0.9455, "step": 16211 }, { "epoch": 0.31, "learning_rate": 4.06684974005916e-06, "loss": 1.0049, "step": 16212 }, { "epoch": 0.31, "learning_rate": 4.066730697871382e-06, "loss": 0.8672, "step": 16213 }, { "epoch": 0.31, "learning_rate": 4.066611649833478e-06, "loss": 0.8502, "step": 16214 }, { "epoch": 0.31, "learning_rate": 4.066492595945896e-06, "loss": 0.9412, "step": 16215 }, { "epoch": 0.31, "learning_rate": 4.0663735362090785e-06, "loss": 1.0141, "step": 16216 }, { "epoch": 0.31, "learning_rate": 4.066254470623469e-06, "loss": 0.8101, "step": 16217 }, { "epoch": 0.31, "learning_rate": 4.066135399189514e-06, "loss": 1.0767, "step": 16218 }, { "epoch": 0.31, "learning_rate": 4.066016321907658e-06, "loss": 0.9886, "step": 16219 }, { "epoch": 0.31, "learning_rate": 4.065897238778344e-06, "loss": 0.791, "step": 16220 }, { "epoch": 0.31, "learning_rate": 4.065778149802019e-06, "loss": 0.991, "step": 16221 }, { "epoch": 0.31, "learning_rate": 4.065659054979125e-06, "loss": 0.9012, "step": 16222 }, { "epoch": 0.31, "learning_rate": 4.065539954310109e-06, "loss": 0.8112, "step": 16223 }, { "epoch": 0.31, "learning_rate": 4.065420847795415e-06, "loss": 1.0232, "step": 16224 }, { "epoch": 0.31, "learning_rate": 4.065301735435487e-06, "loss": 1.3108, "step": 16225 }, { "epoch": 0.31, "learning_rate": 4.06518261723077e-06, "loss": 0.8776, "step": 16226 }, { "epoch": 0.31, "learning_rate": 4.06506349318171e-06, "loss": 0.7916, "step": 16227 }, { "epoch": 0.31, "learning_rate": 4.06494436328875e-06, "loss": 0.9603, "step": 16228 }, { "epoch": 0.31, "learning_rate": 4.064825227552336e-06, "loss": 0.9044, "step": 16229 }, { "epoch": 0.31, "learning_rate": 4.064706085972912e-06, "loss": 0.9062, "step": 16230 }, { "epoch": 0.31, "learning_rate": 4.064586938550925e-06, "loss": 1.035, "step": 16231 }, { "epoch": 0.31, "learning_rate": 4.064467785286817e-06, "loss": 1.1456, "step": 16232 }, { "epoch": 0.31, "learning_rate": 4.064348626181036e-06, "loss": 0.904, "step": 16233 }, { "epoch": 0.31, "learning_rate": 4.064229461234024e-06, "loss": 0.7665, "step": 16234 }, { "epoch": 0.31, "learning_rate": 4.064110290446227e-06, "loss": 0.8267, "step": 16235 }, { "epoch": 0.31, "learning_rate": 4.06399111381809e-06, "loss": 0.8711, "step": 16236 }, { "epoch": 0.31, "learning_rate": 4.0638719313500585e-06, "loss": 1.1007, "step": 16237 }, { "epoch": 0.31, "learning_rate": 4.063752743042577e-06, "loss": 1.1398, "step": 16238 }, { "epoch": 0.31, "learning_rate": 4.06363354889609e-06, "loss": 0.733, "step": 16239 }, { "epoch": 0.31, "learning_rate": 4.063514348911045e-06, "loss": 0.8324, "step": 16240 }, { "epoch": 0.31, "learning_rate": 4.0633951430878845e-06, "loss": 0.9265, "step": 16241 }, { "epoch": 0.31, "learning_rate": 4.0632759314270534e-06, "loss": 0.9345, "step": 16242 }, { "epoch": 0.31, "learning_rate": 4.063156713929e-06, "loss": 1.0411, "step": 16243 }, { "epoch": 0.31, "learning_rate": 4.063037490594166e-06, "loss": 0.9742, "step": 16244 }, { "epoch": 0.31, "learning_rate": 4.062918261422998e-06, "loss": 0.7904, "step": 16245 }, { "epoch": 0.31, "learning_rate": 4.062799026415941e-06, "loss": 0.8986, "step": 16246 }, { "epoch": 0.31, "learning_rate": 4.06267978557344e-06, "loss": 1.0466, "step": 16247 }, { "epoch": 0.31, "learning_rate": 4.062560538895942e-06, "loss": 0.8608, "step": 16248 }, { "epoch": 0.31, "learning_rate": 4.06244128638389e-06, "loss": 1.0109, "step": 16249 }, { "epoch": 0.31, "learning_rate": 4.062322028037731e-06, "loss": 1.0246, "step": 16250 }, { "epoch": 0.31, "learning_rate": 4.062202763857908e-06, "loss": 0.9911, "step": 16251 }, { "epoch": 0.31, "learning_rate": 4.0620834938448685e-06, "loss": 0.9706, "step": 16252 }, { "epoch": 0.31, "learning_rate": 4.061964217999057e-06, "loss": 0.8748, "step": 16253 }, { "epoch": 0.31, "learning_rate": 4.061844936320919e-06, "loss": 1.1083, "step": 16254 }, { "epoch": 0.31, "learning_rate": 4.0617256488109005e-06, "loss": 1.0801, "step": 16255 }, { "epoch": 0.31, "learning_rate": 4.061606355469445e-06, "loss": 1.0377, "step": 16256 }, { "epoch": 0.31, "learning_rate": 4.061487056297001e-06, "loss": 0.9201, "step": 16257 }, { "epoch": 0.31, "learning_rate": 4.0613677512940104e-06, "loss": 0.9153, "step": 16258 }, { "epoch": 0.31, "learning_rate": 4.061248440460921e-06, "loss": 0.9767, "step": 16259 }, { "epoch": 0.31, "learning_rate": 4.0611291237981785e-06, "loss": 0.8805, "step": 16260 }, { "epoch": 0.31, "learning_rate": 4.061009801306228e-06, "loss": 1.0013, "step": 16261 }, { "epoch": 0.31, "learning_rate": 4.060890472985514e-06, "loss": 1.0777, "step": 16262 }, { "epoch": 0.31, "learning_rate": 4.060771138836483e-06, "loss": 1.0425, "step": 16263 }, { "epoch": 0.31, "learning_rate": 4.06065179885958e-06, "loss": 0.9214, "step": 16264 }, { "epoch": 0.31, "learning_rate": 4.060532453055251e-06, "loss": 0.987, "step": 16265 }, { "epoch": 0.31, "learning_rate": 4.060413101423943e-06, "loss": 1.0274, "step": 16266 }, { "epoch": 0.31, "learning_rate": 4.060293743966099e-06, "loss": 1.0859, "step": 16267 }, { "epoch": 0.31, "learning_rate": 4.060174380682167e-06, "loss": 1.2268, "step": 16268 }, { "epoch": 0.31, "learning_rate": 4.060055011572591e-06, "loss": 1.0784, "step": 16269 }, { "epoch": 0.31, "learning_rate": 4.0599356366378175e-06, "loss": 0.9837, "step": 16270 }, { "epoch": 0.31, "learning_rate": 4.059816255878292e-06, "loss": 0.9072, "step": 16271 }, { "epoch": 0.31, "learning_rate": 4.059696869294461e-06, "loss": 0.7384, "step": 16272 }, { "epoch": 0.31, "learning_rate": 4.059577476886768e-06, "loss": 0.9492, "step": 16273 }, { "epoch": 0.31, "learning_rate": 4.059458078655662e-06, "loss": 0.9064, "step": 16274 }, { "epoch": 0.31, "learning_rate": 4.059338674601588e-06, "loss": 1.0974, "step": 16275 }, { "epoch": 0.31, "learning_rate": 4.0592192647249895e-06, "loss": 1.1269, "step": 16276 }, { "epoch": 0.31, "learning_rate": 4.059099849026315e-06, "loss": 0.8539, "step": 16277 }, { "epoch": 0.31, "learning_rate": 4.05898042750601e-06, "loss": 0.9329, "step": 16278 }, { "epoch": 0.31, "learning_rate": 4.058861000164519e-06, "loss": 0.9794, "step": 16279 }, { "epoch": 0.31, "learning_rate": 4.058741567002289e-06, "loss": 0.9915, "step": 16280 }, { "epoch": 0.31, "learning_rate": 4.0586221280197666e-06, "loss": 1.0822, "step": 16281 }, { "epoch": 0.31, "learning_rate": 4.058502683217396e-06, "loss": 0.9099, "step": 16282 }, { "epoch": 0.31, "learning_rate": 4.058383232595624e-06, "loss": 0.8861, "step": 16283 }, { "epoch": 0.31, "learning_rate": 4.058263776154897e-06, "loss": 0.9618, "step": 16284 }, { "epoch": 0.31, "learning_rate": 4.058144313895661e-06, "loss": 0.8464, "step": 16285 }, { "epoch": 0.31, "learning_rate": 4.058024845818363e-06, "loss": 0.7918, "step": 16286 }, { "epoch": 0.31, "learning_rate": 4.057905371923446e-06, "loss": 1.1752, "step": 16287 }, { "epoch": 0.31, "learning_rate": 4.05778589221136e-06, "loss": 1.0328, "step": 16288 }, { "epoch": 0.31, "learning_rate": 4.057666406682548e-06, "loss": 0.71, "step": 16289 }, { "epoch": 0.31, "learning_rate": 4.057546915337458e-06, "loss": 0.8701, "step": 16290 }, { "epoch": 0.31, "learning_rate": 4.057427418176535e-06, "loss": 0.8953, "step": 16291 }, { "epoch": 0.31, "learning_rate": 4.057307915200226e-06, "loss": 0.968, "step": 16292 }, { "epoch": 0.31, "learning_rate": 4.057188406408977e-06, "loss": 0.8258, "step": 16293 }, { "epoch": 0.31, "learning_rate": 4.057068891803234e-06, "loss": 0.83, "step": 16294 }, { "epoch": 0.31, "learning_rate": 4.056949371383444e-06, "loss": 0.9611, "step": 16295 }, { "epoch": 0.31, "learning_rate": 4.056829845150052e-06, "loss": 1.0277, "step": 16296 }, { "epoch": 0.31, "learning_rate": 4.056710313103506e-06, "loss": 0.8933, "step": 16297 }, { "epoch": 0.31, "learning_rate": 4.056590775244252e-06, "loss": 1.0363, "step": 16298 }, { "epoch": 0.31, "learning_rate": 4.056471231572734e-06, "loss": 1.2202, "step": 16299 }, { "epoch": 0.31, "learning_rate": 4.0563516820894015e-06, "loss": 1.092, "step": 16300 }, { "epoch": 0.31, "learning_rate": 4.056232126794698e-06, "loss": 0.915, "step": 16301 }, { "epoch": 0.31, "learning_rate": 4.056112565689073e-06, "loss": 0.9816, "step": 16302 }, { "epoch": 0.31, "learning_rate": 4.055992998772971e-06, "loss": 0.9658, "step": 16303 }, { "epoch": 0.31, "learning_rate": 4.055873426046839e-06, "loss": 0.8215, "step": 16304 }, { "epoch": 0.31, "learning_rate": 4.055753847511123e-06, "loss": 1.0792, "step": 16305 }, { "epoch": 0.31, "learning_rate": 4.055634263166269e-06, "loss": 1.1829, "step": 16306 }, { "epoch": 0.31, "learning_rate": 4.0555146730127255e-06, "loss": 1.0165, "step": 16307 }, { "epoch": 0.31, "learning_rate": 4.055395077050938e-06, "loss": 1.0914, "step": 16308 }, { "epoch": 0.31, "learning_rate": 4.055275475281353e-06, "loss": 0.9378, "step": 16309 }, { "epoch": 0.31, "learning_rate": 4.055155867704415e-06, "loss": 0.9352, "step": 16310 }, { "epoch": 0.31, "learning_rate": 4.0550362543205754e-06, "loss": 0.9696, "step": 16311 }, { "epoch": 0.31, "learning_rate": 4.054916635130277e-06, "loss": 1.0583, "step": 16312 }, { "epoch": 0.31, "learning_rate": 4.054797010133967e-06, "loss": 1.0695, "step": 16313 }, { "epoch": 0.31, "learning_rate": 4.054677379332093e-06, "loss": 1.0919, "step": 16314 }, { "epoch": 0.31, "learning_rate": 4.054557742725103e-06, "loss": 0.8844, "step": 16315 }, { "epoch": 0.31, "learning_rate": 4.0544381003134405e-06, "loss": 0.9246, "step": 16316 }, { "epoch": 0.31, "learning_rate": 4.0543184520975535e-06, "loss": 0.8174, "step": 16317 }, { "epoch": 0.31, "learning_rate": 4.05419879807789e-06, "loss": 1.1932, "step": 16318 }, { "epoch": 0.31, "learning_rate": 4.054079138254895e-06, "loss": 0.951, "step": 16319 }, { "epoch": 0.31, "learning_rate": 4.053959472629017e-06, "loss": 0.8495, "step": 16320 }, { "epoch": 0.31, "learning_rate": 4.053839801200701e-06, "loss": 0.8129, "step": 16321 }, { "epoch": 0.31, "learning_rate": 4.053720123970395e-06, "loss": 0.9025, "step": 16322 }, { "epoch": 0.31, "learning_rate": 4.053600440938547e-06, "loss": 0.8931, "step": 16323 }, { "epoch": 0.31, "learning_rate": 4.053480752105601e-06, "loss": 1.0704, "step": 16324 }, { "epoch": 0.31, "learning_rate": 4.053361057472005e-06, "loss": 1.0647, "step": 16325 }, { "epoch": 0.31, "learning_rate": 4.0532413570382075e-06, "loss": 0.9293, "step": 16326 }, { "epoch": 0.31, "learning_rate": 4.053121650804655e-06, "loss": 1.0189, "step": 16327 }, { "epoch": 0.31, "learning_rate": 4.053001938771794e-06, "loss": 0.8369, "step": 16328 }, { "epoch": 0.31, "learning_rate": 4.052882220940069e-06, "loss": 0.7108, "step": 16329 }, { "epoch": 0.31, "learning_rate": 4.052762497309932e-06, "loss": 0.9312, "step": 16330 }, { "epoch": 0.31, "learning_rate": 4.052642767881826e-06, "loss": 1.069, "step": 16331 }, { "epoch": 0.31, "learning_rate": 4.0525230326562e-06, "loss": 0.8292, "step": 16332 }, { "epoch": 0.31, "learning_rate": 4.052403291633501e-06, "loss": 0.8536, "step": 16333 }, { "epoch": 0.31, "learning_rate": 4.0522835448141754e-06, "loss": 0.9012, "step": 16334 }, { "epoch": 0.31, "learning_rate": 4.052163792198671e-06, "loss": 0.8731, "step": 16335 }, { "epoch": 0.31, "learning_rate": 4.0520440337874335e-06, "loss": 0.9047, "step": 16336 }, { "epoch": 0.31, "learning_rate": 4.051924269580912e-06, "loss": 1.103, "step": 16337 }, { "epoch": 0.31, "learning_rate": 4.051804499579553e-06, "loss": 1.2741, "step": 16338 }, { "epoch": 0.31, "learning_rate": 4.051684723783803e-06, "loss": 0.8726, "step": 16339 }, { "epoch": 0.31, "learning_rate": 4.05156494219411e-06, "loss": 1.0596, "step": 16340 }, { "epoch": 0.31, "learning_rate": 4.051445154810921e-06, "loss": 0.9409, "step": 16341 }, { "epoch": 0.31, "learning_rate": 4.051325361634684e-06, "loss": 0.9602, "step": 16342 }, { "epoch": 0.31, "learning_rate": 4.051205562665844e-06, "loss": 1.1484, "step": 16343 }, { "epoch": 0.31, "learning_rate": 4.051085757904852e-06, "loss": 1.0127, "step": 16344 }, { "epoch": 0.31, "learning_rate": 4.050965947352152e-06, "loss": 0.982, "step": 16345 }, { "epoch": 0.31, "learning_rate": 4.050846131008193e-06, "loss": 0.8514, "step": 16346 }, { "epoch": 0.31, "learning_rate": 4.0507263088734224e-06, "loss": 0.9426, "step": 16347 }, { "epoch": 0.31, "learning_rate": 4.050606480948288e-06, "loss": 0.8536, "step": 16348 }, { "epoch": 0.31, "learning_rate": 4.050486647233235e-06, "loss": 0.8698, "step": 16349 }, { "epoch": 0.31, "learning_rate": 4.050366807728713e-06, "loss": 1.0023, "step": 16350 }, { "epoch": 0.31, "learning_rate": 4.05024696243517e-06, "loss": 0.8867, "step": 16351 }, { "epoch": 0.31, "learning_rate": 4.05012711135305e-06, "loss": 0.6852, "step": 16352 }, { "epoch": 0.31, "learning_rate": 4.050007254482805e-06, "loss": 0.8349, "step": 16353 }, { "epoch": 0.31, "learning_rate": 4.049887391824879e-06, "loss": 0.7077, "step": 16354 }, { "epoch": 0.31, "learning_rate": 4.049767523379722e-06, "loss": 1.09, "step": 16355 }, { "epoch": 0.31, "learning_rate": 4.049647649147781e-06, "loss": 1.2604, "step": 16356 }, { "epoch": 0.31, "learning_rate": 4.049527769129502e-06, "loss": 0.8847, "step": 16357 }, { "epoch": 0.31, "learning_rate": 4.049407883325335e-06, "loss": 0.8765, "step": 16358 }, { "epoch": 0.31, "learning_rate": 4.049287991735726e-06, "loss": 1.119, "step": 16359 }, { "epoch": 0.31, "learning_rate": 4.049168094361122e-06, "loss": 0.9977, "step": 16360 }, { "epoch": 0.31, "learning_rate": 4.049048191201973e-06, "loss": 0.8419, "step": 16361 }, { "epoch": 0.31, "learning_rate": 4.048928282258725e-06, "loss": 1.0399, "step": 16362 }, { "epoch": 0.31, "learning_rate": 4.048808367531827e-06, "loss": 1.1331, "step": 16363 }, { "epoch": 0.31, "learning_rate": 4.0486884470217256e-06, "loss": 0.8544, "step": 16364 }, { "epoch": 0.31, "learning_rate": 4.048568520728869e-06, "loss": 0.8297, "step": 16365 }, { "epoch": 0.31, "learning_rate": 4.048448588653705e-06, "loss": 0.8295, "step": 16366 }, { "epoch": 0.31, "learning_rate": 4.048328650796681e-06, "loss": 0.9145, "step": 16367 }, { "epoch": 0.31, "learning_rate": 4.048208707158247e-06, "loss": 1.0085, "step": 16368 }, { "epoch": 0.31, "learning_rate": 4.048088757738847e-06, "loss": 1.0827, "step": 16369 }, { "epoch": 0.31, "learning_rate": 4.047968802538932e-06, "loss": 0.9479, "step": 16370 }, { "epoch": 0.31, "learning_rate": 4.047848841558949e-06, "loss": 0.9691, "step": 16371 }, { "epoch": 0.31, "learning_rate": 4.0477288747993456e-06, "loss": 0.9211, "step": 16372 }, { "epoch": 0.31, "learning_rate": 4.0476089022605705e-06, "loss": 0.8031, "step": 16373 }, { "epoch": 0.31, "learning_rate": 4.047488923943072e-06, "loss": 0.8543, "step": 16374 }, { "epoch": 0.31, "learning_rate": 4.047368939847296e-06, "loss": 1.0612, "step": 16375 }, { "epoch": 0.31, "learning_rate": 4.047248949973692e-06, "loss": 0.8016, "step": 16376 }, { "epoch": 0.31, "learning_rate": 4.047128954322708e-06, "loss": 0.7867, "step": 16377 }, { "epoch": 0.31, "learning_rate": 4.047008952894791e-06, "loss": 1.1757, "step": 16378 }, { "epoch": 0.31, "learning_rate": 4.046888945690391e-06, "loss": 0.8167, "step": 16379 }, { "epoch": 0.31, "learning_rate": 4.046768932709955e-06, "loss": 1.2592, "step": 16380 }, { "epoch": 0.31, "learning_rate": 4.046648913953931e-06, "loss": 1.1854, "step": 16381 }, { "epoch": 0.31, "learning_rate": 4.046528889422768e-06, "loss": 0.9006, "step": 16382 }, { "epoch": 0.31, "learning_rate": 4.046408859116913e-06, "loss": 0.8368, "step": 16383 }, { "epoch": 0.31, "learning_rate": 4.046288823036816e-06, "loss": 1.132, "step": 16384 }, { "epoch": 0.31, "learning_rate": 4.046168781182922e-06, "loss": 1.0543, "step": 16385 }, { "epoch": 0.31, "learning_rate": 4.046048733555683e-06, "loss": 1.0999, "step": 16386 }, { "epoch": 0.31, "learning_rate": 4.0459286801555436e-06, "loss": 0.8917, "step": 16387 }, { "epoch": 0.31, "learning_rate": 4.045808620982955e-06, "loss": 1.1386, "step": 16388 }, { "epoch": 0.31, "learning_rate": 4.045688556038364e-06, "loss": 0.9917, "step": 16389 }, { "epoch": 0.31, "learning_rate": 4.04556848532222e-06, "loss": 0.9293, "step": 16390 }, { "epoch": 0.31, "learning_rate": 4.04544840883497e-06, "loss": 0.6728, "step": 16391 }, { "epoch": 0.31, "learning_rate": 4.045328326577063e-06, "loss": 0.9271, "step": 16392 }, { "epoch": 0.31, "learning_rate": 4.045208238548948e-06, "loss": 1.2214, "step": 16393 }, { "epoch": 0.31, "learning_rate": 4.045088144751072e-06, "loss": 0.8149, "step": 16394 }, { "epoch": 0.31, "learning_rate": 4.044968045183884e-06, "loss": 0.9605, "step": 16395 }, { "epoch": 0.31, "learning_rate": 4.0448479398478336e-06, "loss": 0.7672, "step": 16396 }, { "epoch": 0.31, "learning_rate": 4.044727828743369e-06, "loss": 0.9901, "step": 16397 }, { "epoch": 0.31, "learning_rate": 4.044607711870936e-06, "loss": 0.8683, "step": 16398 }, { "epoch": 0.31, "learning_rate": 4.0444875892309865e-06, "loss": 1.1924, "step": 16399 }, { "epoch": 0.31, "learning_rate": 4.044367460823968e-06, "loss": 1.2789, "step": 16400 }, { "epoch": 0.31, "learning_rate": 4.044247326650328e-06, "loss": 1.0551, "step": 16401 }, { "epoch": 0.31, "learning_rate": 4.044127186710516e-06, "loss": 1.044, "step": 16402 }, { "epoch": 0.31, "learning_rate": 4.044007041004981e-06, "loss": 0.9608, "step": 16403 }, { "epoch": 0.31, "learning_rate": 4.04388688953417e-06, "loss": 0.9597, "step": 16404 }, { "epoch": 0.31, "learning_rate": 4.043766732298533e-06, "loss": 0.831, "step": 16405 }, { "epoch": 0.31, "learning_rate": 4.043646569298519e-06, "loss": 0.9724, "step": 16406 }, { "epoch": 0.31, "learning_rate": 4.043526400534576e-06, "loss": 0.9352, "step": 16407 }, { "epoch": 0.31, "learning_rate": 4.043406226007152e-06, "loss": 0.8746, "step": 16408 }, { "epoch": 0.31, "learning_rate": 4.043286045716697e-06, "loss": 0.8794, "step": 16409 }, { "epoch": 0.31, "learning_rate": 4.043165859663659e-06, "loss": 0.9704, "step": 16410 }, { "epoch": 0.31, "learning_rate": 4.043045667848487e-06, "loss": 0.7477, "step": 16411 }, { "epoch": 0.31, "learning_rate": 4.04292547027163e-06, "loss": 1.067, "step": 16412 }, { "epoch": 0.31, "learning_rate": 4.042805266933536e-06, "loss": 0.8615, "step": 16413 }, { "epoch": 0.31, "learning_rate": 4.042685057834656e-06, "loss": 0.9406, "step": 16414 }, { "epoch": 0.31, "learning_rate": 4.042564842975436e-06, "loss": 1.0436, "step": 16415 }, { "epoch": 0.31, "learning_rate": 4.0424446223563255e-06, "loss": 0.9445, "step": 16416 }, { "epoch": 0.31, "learning_rate": 4.042324395977775e-06, "loss": 1.0015, "step": 16417 }, { "epoch": 0.31, "learning_rate": 4.042204163840233e-06, "loss": 1.0175, "step": 16418 }, { "epoch": 0.31, "learning_rate": 4.042083925944147e-06, "loss": 0.9083, "step": 16419 }, { "epoch": 0.31, "learning_rate": 4.041963682289967e-06, "loss": 0.8399, "step": 16420 }, { "epoch": 0.31, "learning_rate": 4.041843432878143e-06, "loss": 0.9413, "step": 16421 }, { "epoch": 0.31, "learning_rate": 4.041723177709122e-06, "loss": 0.8203, "step": 16422 }, { "epoch": 0.31, "learning_rate": 4.041602916783353e-06, "loss": 0.9208, "step": 16423 }, { "epoch": 0.31, "learning_rate": 4.041482650101288e-06, "loss": 0.7423, "step": 16424 }, { "epoch": 0.31, "learning_rate": 4.041362377663373e-06, "loss": 1.1318, "step": 16425 }, { "epoch": 0.31, "learning_rate": 4.0412420994700574e-06, "loss": 0.9549, "step": 16426 }, { "epoch": 0.31, "learning_rate": 4.041121815521792e-06, "loss": 0.9323, "step": 16427 }, { "epoch": 0.31, "learning_rate": 4.041001525819025e-06, "loss": 0.777, "step": 16428 }, { "epoch": 0.31, "learning_rate": 4.040881230362205e-06, "loss": 0.9834, "step": 16429 }, { "epoch": 0.31, "learning_rate": 4.040760929151783e-06, "loss": 0.8584, "step": 16430 }, { "epoch": 0.31, "learning_rate": 4.040640622188206e-06, "loss": 1.1091, "step": 16431 }, { "epoch": 0.31, "learning_rate": 4.040520309471924e-06, "loss": 0.7466, "step": 16432 }, { "epoch": 0.31, "learning_rate": 4.040399991003386e-06, "loss": 0.8112, "step": 16433 }, { "epoch": 0.31, "learning_rate": 4.040279666783043e-06, "loss": 0.7623, "step": 16434 }, { "epoch": 0.31, "learning_rate": 4.040159336811341e-06, "loss": 0.8293, "step": 16435 }, { "epoch": 0.31, "learning_rate": 4.040039001088733e-06, "loss": 0.7227, "step": 16436 }, { "epoch": 0.31, "learning_rate": 4.039918659615666e-06, "loss": 0.8832, "step": 16437 }, { "epoch": 0.31, "learning_rate": 4.03979831239259e-06, "loss": 1.1642, "step": 16438 }, { "epoch": 0.31, "learning_rate": 4.0396779594199545e-06, "loss": 1.0778, "step": 16439 }, { "epoch": 0.31, "learning_rate": 4.039557600698208e-06, "loss": 0.9814, "step": 16440 }, { "epoch": 0.31, "learning_rate": 4.039437236227801e-06, "loss": 0.8335, "step": 16441 }, { "epoch": 0.31, "learning_rate": 4.039316866009183e-06, "loss": 0.9204, "step": 16442 }, { "epoch": 0.31, "learning_rate": 4.039196490042802e-06, "loss": 1.1058, "step": 16443 }, { "epoch": 0.31, "learning_rate": 4.03907610832911e-06, "loss": 1.0507, "step": 16444 }, { "epoch": 0.31, "learning_rate": 4.0389557208685545e-06, "loss": 1.0843, "step": 16445 }, { "epoch": 0.31, "learning_rate": 4.0388353276615845e-06, "loss": 0.8556, "step": 16446 }, { "epoch": 0.31, "learning_rate": 4.038714928708651e-06, "loss": 0.9438, "step": 16447 }, { "epoch": 0.31, "learning_rate": 4.038594524010204e-06, "loss": 0.9585, "step": 16448 }, { "epoch": 0.31, "learning_rate": 4.038474113566691e-06, "loss": 1.0756, "step": 16449 }, { "epoch": 0.31, "learning_rate": 4.038353697378564e-06, "loss": 1.0685, "step": 16450 }, { "epoch": 0.31, "learning_rate": 4.038233275446271e-06, "loss": 0.9017, "step": 16451 }, { "epoch": 0.31, "learning_rate": 4.038112847770262e-06, "loss": 0.8029, "step": 16452 }, { "epoch": 0.31, "learning_rate": 4.037992414350987e-06, "loss": 0.7498, "step": 16453 }, { "epoch": 0.31, "learning_rate": 4.037871975188895e-06, "loss": 0.937, "step": 16454 }, { "epoch": 0.31, "learning_rate": 4.037751530284436e-06, "loss": 0.9997, "step": 16455 }, { "epoch": 0.31, "learning_rate": 4.0376310796380605e-06, "loss": 0.9826, "step": 16456 }, { "epoch": 0.31, "learning_rate": 4.037510623250218e-06, "loss": 0.8543, "step": 16457 }, { "epoch": 0.31, "learning_rate": 4.037390161121358e-06, "loss": 0.9731, "step": 16458 }, { "epoch": 0.31, "learning_rate": 4.037269693251929e-06, "loss": 1.1093, "step": 16459 }, { "epoch": 0.31, "learning_rate": 4.037149219642384e-06, "loss": 0.9642, "step": 16460 }, { "epoch": 0.31, "learning_rate": 4.037028740293169e-06, "loss": 0.9441, "step": 16461 }, { "epoch": 0.31, "learning_rate": 4.036908255204737e-06, "loss": 1.2211, "step": 16462 }, { "epoch": 0.31, "learning_rate": 4.036787764377536e-06, "loss": 1.1508, "step": 16463 }, { "epoch": 0.31, "learning_rate": 4.036667267812018e-06, "loss": 0.8871, "step": 16464 }, { "epoch": 0.31, "learning_rate": 4.03654676550863e-06, "loss": 0.9196, "step": 16465 }, { "epoch": 0.31, "learning_rate": 4.036426257467825e-06, "loss": 0.6962, "step": 16466 }, { "epoch": 0.31, "learning_rate": 4.03630574369005e-06, "loss": 0.8497, "step": 16467 }, { "epoch": 0.31, "learning_rate": 4.036185224175756e-06, "loss": 0.9282, "step": 16468 }, { "epoch": 0.31, "learning_rate": 4.036064698925395e-06, "loss": 0.9936, "step": 16469 }, { "epoch": 0.31, "learning_rate": 4.035944167939415e-06, "loss": 1.0599, "step": 16470 }, { "epoch": 0.31, "learning_rate": 4.035823631218266e-06, "loss": 0.8583, "step": 16471 }, { "epoch": 0.31, "learning_rate": 4.0357030887624e-06, "loss": 0.9224, "step": 16472 }, { "epoch": 0.31, "learning_rate": 4.0355825405722645e-06, "loss": 0.9016, "step": 16473 }, { "epoch": 0.31, "learning_rate": 4.035461986648311e-06, "loss": 1.1505, "step": 16474 }, { "epoch": 0.31, "learning_rate": 4.035341426990991e-06, "loss": 1.217, "step": 16475 }, { "epoch": 0.31, "learning_rate": 4.0352208616007514e-06, "loss": 0.8187, "step": 16476 }, { "epoch": 0.31, "learning_rate": 4.035100290478045e-06, "loss": 0.9032, "step": 16477 }, { "epoch": 0.31, "learning_rate": 4.034979713623321e-06, "loss": 0.7617, "step": 16478 }, { "epoch": 0.31, "learning_rate": 4.03485913103703e-06, "loss": 1.0264, "step": 16479 }, { "epoch": 0.31, "learning_rate": 4.034738542719621e-06, "loss": 0.8013, "step": 16480 }, { "epoch": 0.31, "learning_rate": 4.034617948671546e-06, "loss": 0.8864, "step": 16481 }, { "epoch": 0.31, "learning_rate": 4.034497348893256e-06, "loss": 1.0937, "step": 16482 }, { "epoch": 0.31, "learning_rate": 4.034376743385198e-06, "loss": 0.8936, "step": 16483 }, { "epoch": 0.31, "learning_rate": 4.034256132147826e-06, "loss": 0.8536, "step": 16484 }, { "epoch": 0.31, "learning_rate": 4.034135515181587e-06, "loss": 1.1007, "step": 16485 }, { "epoch": 0.31, "learning_rate": 4.034014892486934e-06, "loss": 0.8932, "step": 16486 }, { "epoch": 0.31, "learning_rate": 4.033894264064316e-06, "loss": 1.1449, "step": 16487 }, { "epoch": 0.31, "learning_rate": 4.033773629914184e-06, "loss": 1.062, "step": 16488 }, { "epoch": 0.31, "learning_rate": 4.033652990036988e-06, "loss": 0.7736, "step": 16489 }, { "epoch": 0.31, "learning_rate": 4.0335323444331794e-06, "loss": 0.8964, "step": 16490 }, { "epoch": 0.31, "learning_rate": 4.033411693103208e-06, "loss": 0.8512, "step": 16491 }, { "epoch": 0.31, "learning_rate": 4.0332910360475246e-06, "loss": 0.9846, "step": 16492 }, { "epoch": 0.31, "learning_rate": 4.033170373266578e-06, "loss": 1.0723, "step": 16493 }, { "epoch": 0.31, "learning_rate": 4.033049704760821e-06, "loss": 1.1085, "step": 16494 }, { "epoch": 0.31, "learning_rate": 4.032929030530703e-06, "loss": 0.7574, "step": 16495 }, { "epoch": 0.31, "learning_rate": 4.032808350576677e-06, "loss": 0.8184, "step": 16496 }, { "epoch": 0.31, "learning_rate": 4.0326876648991895e-06, "loss": 0.9598, "step": 16497 }, { "epoch": 0.31, "learning_rate": 4.032566973498694e-06, "loss": 0.8335, "step": 16498 }, { "epoch": 0.31, "learning_rate": 4.03244627637564e-06, "loss": 1.025, "step": 16499 }, { "epoch": 0.31, "learning_rate": 4.032325573530479e-06, "loss": 1.1108, "step": 16500 }, { "epoch": 0.31, "learning_rate": 4.032204864963662e-06, "loss": 0.9007, "step": 16501 }, { "epoch": 0.31, "learning_rate": 4.032084150675638e-06, "loss": 0.9252, "step": 16502 }, { "epoch": 0.31, "learning_rate": 4.031963430666859e-06, "loss": 0.9412, "step": 16503 }, { "epoch": 0.31, "learning_rate": 4.031842704937775e-06, "loss": 0.872, "step": 16504 }, { "epoch": 0.31, "learning_rate": 4.031721973488838e-06, "loss": 0.8932, "step": 16505 }, { "epoch": 0.31, "learning_rate": 4.031601236320497e-06, "loss": 1.0528, "step": 16506 }, { "epoch": 0.31, "learning_rate": 4.031480493433206e-06, "loss": 0.7484, "step": 16507 }, { "epoch": 0.31, "learning_rate": 4.031359744827412e-06, "loss": 1.0077, "step": 16508 }, { "epoch": 0.31, "learning_rate": 4.0312389905035685e-06, "loss": 0.9728, "step": 16509 }, { "epoch": 0.31, "learning_rate": 4.031118230462126e-06, "loss": 0.9721, "step": 16510 }, { "epoch": 0.31, "learning_rate": 4.030997464703535e-06, "loss": 0.9821, "step": 16511 }, { "epoch": 0.31, "learning_rate": 4.030876693228245e-06, "loss": 0.9428, "step": 16512 }, { "epoch": 0.31, "learning_rate": 4.03075591603671e-06, "loss": 1.1146, "step": 16513 }, { "epoch": 0.31, "learning_rate": 4.030635133129378e-06, "loss": 1.049, "step": 16514 }, { "epoch": 0.31, "learning_rate": 4.030514344506701e-06, "loss": 0.9945, "step": 16515 }, { "epoch": 0.31, "learning_rate": 4.030393550169131e-06, "loss": 0.8503, "step": 16516 }, { "epoch": 0.31, "learning_rate": 4.030272750117119e-06, "loss": 0.9674, "step": 16517 }, { "epoch": 0.31, "learning_rate": 4.030151944351115e-06, "loss": 1.1031, "step": 16518 }, { "epoch": 0.31, "learning_rate": 4.030031132871571e-06, "loss": 1.0433, "step": 16519 }, { "epoch": 0.31, "learning_rate": 4.029910315678937e-06, "loss": 1.0106, "step": 16520 }, { "epoch": 0.31, "learning_rate": 4.029789492773665e-06, "loss": 0.7746, "step": 16521 }, { "epoch": 0.31, "learning_rate": 4.029668664156207e-06, "loss": 1.1251, "step": 16522 }, { "epoch": 0.31, "learning_rate": 4.0295478298270115e-06, "loss": 0.7847, "step": 16523 }, { "epoch": 0.31, "learning_rate": 4.029426989786531e-06, "loss": 0.8488, "step": 16524 }, { "epoch": 0.31, "learning_rate": 4.029306144035219e-06, "loss": 1.0444, "step": 16525 }, { "epoch": 0.31, "learning_rate": 4.029185292573523e-06, "loss": 0.996, "step": 16526 }, { "epoch": 0.31, "learning_rate": 4.029064435401897e-06, "loss": 0.8639, "step": 16527 }, { "epoch": 0.31, "learning_rate": 4.028943572520791e-06, "loss": 0.8848, "step": 16528 }, { "epoch": 0.31, "learning_rate": 4.028822703930657e-06, "loss": 0.7818, "step": 16529 }, { "epoch": 0.31, "learning_rate": 4.028701829631945e-06, "loss": 0.9284, "step": 16530 }, { "epoch": 0.31, "learning_rate": 4.028580949625108e-06, "loss": 0.9489, "step": 16531 }, { "epoch": 0.31, "learning_rate": 4.028460063910596e-06, "loss": 0.8026, "step": 16532 }, { "epoch": 0.31, "learning_rate": 4.028339172488861e-06, "loss": 0.8604, "step": 16533 }, { "epoch": 0.31, "learning_rate": 4.028218275360355e-06, "loss": 0.9247, "step": 16534 }, { "epoch": 0.31, "learning_rate": 4.028097372525529e-06, "loss": 1.0016, "step": 16535 }, { "epoch": 0.31, "learning_rate": 4.027976463984833e-06, "loss": 0.9254, "step": 16536 }, { "epoch": 0.31, "learning_rate": 4.027855549738721e-06, "loss": 1.0918, "step": 16537 }, { "epoch": 0.31, "learning_rate": 4.027734629787642e-06, "loss": 1.0873, "step": 16538 }, { "epoch": 0.31, "learning_rate": 4.02761370413205e-06, "loss": 0.9419, "step": 16539 }, { "epoch": 0.31, "learning_rate": 4.0274927727723945e-06, "loss": 0.983, "step": 16540 }, { "epoch": 0.31, "learning_rate": 4.027371835709128e-06, "loss": 0.7294, "step": 16541 }, { "epoch": 0.31, "learning_rate": 4.027250892942702e-06, "loss": 1.0518, "step": 16542 }, { "epoch": 0.31, "learning_rate": 4.027129944473568e-06, "loss": 1.0782, "step": 16543 }, { "epoch": 0.31, "learning_rate": 4.027008990302177e-06, "loss": 1.0889, "step": 16544 }, { "epoch": 0.31, "learning_rate": 4.026888030428982e-06, "loss": 0.8571, "step": 16545 }, { "epoch": 0.31, "learning_rate": 4.026767064854434e-06, "loss": 0.9021, "step": 16546 }, { "epoch": 0.31, "learning_rate": 4.026646093578984e-06, "loss": 0.9775, "step": 16547 }, { "epoch": 0.31, "learning_rate": 4.0265251166030845e-06, "loss": 0.764, "step": 16548 }, { "epoch": 0.31, "learning_rate": 4.026404133927187e-06, "loss": 0.9626, "step": 16549 }, { "epoch": 0.31, "learning_rate": 4.026283145551744e-06, "loss": 0.9523, "step": 16550 }, { "epoch": 0.31, "learning_rate": 4.026162151477205e-06, "loss": 0.9889, "step": 16551 }, { "epoch": 0.31, "learning_rate": 4.026041151704025e-06, "loss": 1.0499, "step": 16552 }, { "epoch": 0.31, "learning_rate": 4.025920146232653e-06, "loss": 0.864, "step": 16553 }, { "epoch": 0.31, "learning_rate": 4.025799135063542e-06, "loss": 0.8833, "step": 16554 }, { "epoch": 0.31, "learning_rate": 4.025678118197144e-06, "loss": 0.957, "step": 16555 }, { "epoch": 0.31, "learning_rate": 4.025557095633911e-06, "loss": 1.2764, "step": 16556 }, { "epoch": 0.31, "learning_rate": 4.025436067374295e-06, "loss": 0.9, "step": 16557 }, { "epoch": 0.31, "learning_rate": 4.025315033418746e-06, "loss": 0.9745, "step": 16558 }, { "epoch": 0.31, "learning_rate": 4.025193993767719e-06, "loss": 1.026, "step": 16559 }, { "epoch": 0.31, "learning_rate": 4.0250729484216635e-06, "loss": 0.8575, "step": 16560 }, { "epoch": 0.31, "learning_rate": 4.024951897381033e-06, "loss": 0.7168, "step": 16561 }, { "epoch": 0.31, "learning_rate": 4.024830840646278e-06, "loss": 1.0753, "step": 16562 }, { "epoch": 0.31, "learning_rate": 4.024709778217851e-06, "loss": 0.9276, "step": 16563 }, { "epoch": 0.31, "learning_rate": 4.024588710096206e-06, "loss": 0.9919, "step": 16564 }, { "epoch": 0.31, "learning_rate": 4.024467636281793e-06, "loss": 0.9465, "step": 16565 }, { "epoch": 0.31, "learning_rate": 4.024346556775064e-06, "loss": 0.9066, "step": 16566 }, { "epoch": 0.31, "learning_rate": 4.024225471576472e-06, "loss": 0.9285, "step": 16567 }, { "epoch": 0.31, "learning_rate": 4.024104380686469e-06, "loss": 0.9943, "step": 16568 }, { "epoch": 0.31, "learning_rate": 4.023983284105506e-06, "loss": 1.0742, "step": 16569 }, { "epoch": 0.31, "learning_rate": 4.023862181834038e-06, "loss": 0.8408, "step": 16570 }, { "epoch": 0.31, "learning_rate": 4.023741073872514e-06, "loss": 0.9478, "step": 16571 }, { "epoch": 0.31, "learning_rate": 4.023619960221388e-06, "loss": 0.8566, "step": 16572 }, { "epoch": 0.31, "learning_rate": 4.023498840881111e-06, "loss": 0.8113, "step": 16573 }, { "epoch": 0.31, "learning_rate": 4.023377715852137e-06, "loss": 1.0414, "step": 16574 }, { "epoch": 0.31, "learning_rate": 4.023256585134917e-06, "loss": 1.2353, "step": 16575 }, { "epoch": 0.31, "learning_rate": 4.023135448729904e-06, "loss": 1.1552, "step": 16576 }, { "epoch": 0.31, "learning_rate": 4.023014306637549e-06, "loss": 0.9821, "step": 16577 }, { "epoch": 0.31, "learning_rate": 4.022893158858306e-06, "loss": 1.1074, "step": 16578 }, { "epoch": 0.31, "learning_rate": 4.022772005392627e-06, "loss": 0.8218, "step": 16579 }, { "epoch": 0.31, "learning_rate": 4.022650846240963e-06, "loss": 1.0114, "step": 16580 }, { "epoch": 0.31, "learning_rate": 4.0225296814037675e-06, "loss": 1.1072, "step": 16581 }, { "epoch": 0.31, "learning_rate": 4.022408510881494e-06, "loss": 0.7974, "step": 16582 }, { "epoch": 0.31, "learning_rate": 4.022287334674593e-06, "loss": 0.9718, "step": 16583 }, { "epoch": 0.31, "learning_rate": 4.022166152783518e-06, "loss": 0.9786, "step": 16584 }, { "epoch": 0.31, "learning_rate": 4.022044965208721e-06, "loss": 0.7447, "step": 16585 }, { "epoch": 0.31, "learning_rate": 4.021923771950654e-06, "loss": 0.7031, "step": 16586 }, { "epoch": 0.31, "learning_rate": 4.0218025730097715e-06, "loss": 1.0734, "step": 16587 }, { "epoch": 0.31, "learning_rate": 4.021681368386525e-06, "loss": 1.0749, "step": 16588 }, { "epoch": 0.31, "learning_rate": 4.021560158081366e-06, "loss": 0.9675, "step": 16589 }, { "epoch": 0.31, "learning_rate": 4.0214389420947484e-06, "loss": 0.9635, "step": 16590 }, { "epoch": 0.31, "learning_rate": 4.021317720427125e-06, "loss": 0.9993, "step": 16591 }, { "epoch": 0.31, "learning_rate": 4.021196493078947e-06, "loss": 1.0338, "step": 16592 }, { "epoch": 0.31, "learning_rate": 4.021075260050669e-06, "loss": 1.1826, "step": 16593 }, { "epoch": 0.31, "learning_rate": 4.020954021342741e-06, "loss": 0.8905, "step": 16594 }, { "epoch": 0.31, "learning_rate": 4.020832776955619e-06, "loss": 1.0034, "step": 16595 }, { "epoch": 0.31, "learning_rate": 4.020711526889753e-06, "loss": 0.8881, "step": 16596 }, { "epoch": 0.31, "learning_rate": 4.0205902711455966e-06, "loss": 1.0467, "step": 16597 }, { "epoch": 0.31, "learning_rate": 4.020469009723603e-06, "loss": 0.8997, "step": 16598 }, { "epoch": 0.31, "learning_rate": 4.020347742624225e-06, "loss": 0.9436, "step": 16599 }, { "epoch": 0.31, "learning_rate": 4.020226469847916e-06, "loss": 1.0396, "step": 16600 }, { "epoch": 0.31, "learning_rate": 4.020105191395126e-06, "loss": 1.1606, "step": 16601 }, { "epoch": 0.31, "learning_rate": 4.019983907266311e-06, "loss": 0.7511, "step": 16602 }, { "epoch": 0.31, "learning_rate": 4.019862617461922e-06, "loss": 0.8902, "step": 16603 }, { "epoch": 0.31, "learning_rate": 4.019741321982414e-06, "loss": 0.8276, "step": 16604 }, { "epoch": 0.31, "learning_rate": 4.019620020828238e-06, "loss": 1.0143, "step": 16605 }, { "epoch": 0.31, "learning_rate": 4.019498713999847e-06, "loss": 0.9084, "step": 16606 }, { "epoch": 0.31, "learning_rate": 4.019377401497694e-06, "loss": 1.0444, "step": 16607 }, { "epoch": 0.31, "learning_rate": 4.019256083322234e-06, "loss": 0.9973, "step": 16608 }, { "epoch": 0.31, "learning_rate": 4.019134759473916e-06, "loss": 0.9287, "step": 16609 }, { "epoch": 0.31, "learning_rate": 4.019013429953197e-06, "loss": 0.9507, "step": 16610 }, { "epoch": 0.31, "learning_rate": 4.018892094760528e-06, "loss": 0.9258, "step": 16611 }, { "epoch": 0.31, "learning_rate": 4.018770753896363e-06, "loss": 1.1796, "step": 16612 }, { "epoch": 0.31, "learning_rate": 4.018649407361154e-06, "loss": 1.0048, "step": 16613 }, { "epoch": 0.31, "learning_rate": 4.018528055155355e-06, "loss": 0.998, "step": 16614 }, { "epoch": 0.31, "learning_rate": 4.018406697279418e-06, "loss": 0.8575, "step": 16615 }, { "epoch": 0.31, "learning_rate": 4.0182853337337975e-06, "loss": 0.9545, "step": 16616 }, { "epoch": 0.31, "learning_rate": 4.018163964518947e-06, "loss": 0.8337, "step": 16617 }, { "epoch": 0.31, "learning_rate": 4.018042589635317e-06, "loss": 0.9803, "step": 16618 }, { "epoch": 0.31, "learning_rate": 4.0179212090833636e-06, "loss": 1.0922, "step": 16619 }, { "epoch": 0.31, "learning_rate": 4.017799822863539e-06, "loss": 1.0269, "step": 16620 }, { "epoch": 0.31, "learning_rate": 4.0176784309762965e-06, "loss": 0.9236, "step": 16621 }, { "epoch": 0.31, "learning_rate": 4.017557033422088e-06, "loss": 0.8959, "step": 16622 }, { "epoch": 0.31, "learning_rate": 4.017435630201369e-06, "loss": 0.822, "step": 16623 }, { "epoch": 0.31, "learning_rate": 4.0173142213145926e-06, "loss": 1.0469, "step": 16624 }, { "epoch": 0.31, "learning_rate": 4.01719280676221e-06, "loss": 1.0658, "step": 16625 }, { "epoch": 0.31, "learning_rate": 4.017071386544677e-06, "loss": 0.9603, "step": 16626 }, { "epoch": 0.31, "learning_rate": 4.016949960662446e-06, "loss": 0.9869, "step": 16627 }, { "epoch": 0.31, "learning_rate": 4.0168285291159705e-06, "loss": 0.785, "step": 16628 }, { "epoch": 0.31, "learning_rate": 4.016707091905703e-06, "loss": 1.0112, "step": 16629 }, { "epoch": 0.31, "learning_rate": 4.016585649032098e-06, "loss": 1.0685, "step": 16630 }, { "epoch": 0.31, "learning_rate": 4.016464200495609e-06, "loss": 1.1812, "step": 16631 }, { "epoch": 0.31, "learning_rate": 4.016342746296688e-06, "loss": 1.0263, "step": 16632 }, { "epoch": 0.31, "learning_rate": 4.016221286435791e-06, "loss": 0.8199, "step": 16633 }, { "epoch": 0.31, "learning_rate": 4.016099820913369e-06, "loss": 0.8846, "step": 16634 }, { "epoch": 0.31, "learning_rate": 4.0159783497298784e-06, "loss": 0.9026, "step": 16635 }, { "epoch": 0.31, "learning_rate": 4.0158568728857705e-06, "loss": 0.855, "step": 16636 }, { "epoch": 0.31, "learning_rate": 4.015735390381499e-06, "loss": 1.0278, "step": 16637 }, { "epoch": 0.31, "learning_rate": 4.015613902217518e-06, "loss": 0.9399, "step": 16638 }, { "epoch": 0.31, "learning_rate": 4.0154924083942815e-06, "loss": 0.7943, "step": 16639 }, { "epoch": 0.31, "learning_rate": 4.015370908912243e-06, "loss": 0.8208, "step": 16640 }, { "epoch": 0.31, "learning_rate": 4.015249403771856e-06, "loss": 1.0645, "step": 16641 }, { "epoch": 0.31, "learning_rate": 4.015127892973574e-06, "loss": 0.7579, "step": 16642 }, { "epoch": 0.31, "learning_rate": 4.0150063765178505e-06, "loss": 1.1066, "step": 16643 }, { "epoch": 0.31, "learning_rate": 4.01488485440514e-06, "loss": 1.048, "step": 16644 }, { "epoch": 0.31, "learning_rate": 4.014763326635896e-06, "loss": 0.9241, "step": 16645 }, { "epoch": 0.31, "learning_rate": 4.0146417932105715e-06, "loss": 0.8405, "step": 16646 }, { "epoch": 0.31, "learning_rate": 4.0145202541296226e-06, "loss": 0.9747, "step": 16647 }, { "epoch": 0.31, "learning_rate": 4.0143987093935e-06, "loss": 0.889, "step": 16648 }, { "epoch": 0.31, "learning_rate": 4.014277159002659e-06, "loss": 0.9999, "step": 16649 }, { "epoch": 0.31, "learning_rate": 4.014155602957555e-06, "loss": 1.0446, "step": 16650 }, { "epoch": 0.31, "learning_rate": 4.014034041258639e-06, "loss": 0.9704, "step": 16651 }, { "epoch": 0.31, "learning_rate": 4.013912473906366e-06, "loss": 0.874, "step": 16652 }, { "epoch": 0.31, "learning_rate": 4.013790900901191e-06, "loss": 0.9545, "step": 16653 }, { "epoch": 0.31, "learning_rate": 4.013669322243567e-06, "loss": 0.8467, "step": 16654 }, { "epoch": 0.31, "learning_rate": 4.013547737933949e-06, "loss": 0.8915, "step": 16655 }, { "epoch": 0.31, "learning_rate": 4.01342614797279e-06, "loss": 1.2261, "step": 16656 }, { "epoch": 0.31, "learning_rate": 4.013304552360543e-06, "loss": 1.1926, "step": 16657 }, { "epoch": 0.31, "learning_rate": 4.013182951097664e-06, "loss": 0.714, "step": 16658 }, { "epoch": 0.31, "learning_rate": 4.013061344184606e-06, "loss": 0.9738, "step": 16659 }, { "epoch": 0.31, "learning_rate": 4.012939731621823e-06, "loss": 0.7379, "step": 16660 }, { "epoch": 0.31, "learning_rate": 4.01281811340977e-06, "loss": 0.8978, "step": 16661 }, { "epoch": 0.31, "learning_rate": 4.012696489548901e-06, "loss": 1.0844, "step": 16662 }, { "epoch": 0.31, "learning_rate": 4.0125748600396684e-06, "loss": 1.0746, "step": 16663 }, { "epoch": 0.31, "learning_rate": 4.0124532248825286e-06, "loss": 0.976, "step": 16664 }, { "epoch": 0.31, "learning_rate": 4.012331584077935e-06, "loss": 0.8397, "step": 16665 }, { "epoch": 0.31, "learning_rate": 4.012209937626341e-06, "loss": 0.9801, "step": 16666 }, { "epoch": 0.31, "learning_rate": 4.012088285528202e-06, "loss": 0.8505, "step": 16667 }, { "epoch": 0.31, "learning_rate": 4.0119666277839705e-06, "loss": 0.9641, "step": 16668 }, { "epoch": 0.31, "learning_rate": 4.011844964394104e-06, "loss": 1.1696, "step": 16669 }, { "epoch": 0.31, "learning_rate": 4.0117232953590526e-06, "loss": 1.006, "step": 16670 }, { "epoch": 0.31, "learning_rate": 4.011601620679274e-06, "loss": 0.9142, "step": 16671 }, { "epoch": 0.31, "learning_rate": 4.011479940355221e-06, "loss": 0.811, "step": 16672 }, { "epoch": 0.31, "learning_rate": 4.011358254387349e-06, "loss": 0.8047, "step": 16673 }, { "epoch": 0.31, "learning_rate": 4.011236562776111e-06, "loss": 1.1116, "step": 16674 }, { "epoch": 0.31, "learning_rate": 4.011114865521961e-06, "loss": 1.0625, "step": 16675 }, { "epoch": 0.31, "learning_rate": 4.010993162625356e-06, "loss": 0.953, "step": 16676 }, { "epoch": 0.31, "learning_rate": 4.010871454086748e-06, "loss": 0.8928, "step": 16677 }, { "epoch": 0.31, "learning_rate": 4.010749739906593e-06, "loss": 0.9071, "step": 16678 }, { "epoch": 0.31, "learning_rate": 4.010628020085343e-06, "loss": 0.776, "step": 16679 }, { "epoch": 0.31, "learning_rate": 4.010506294623456e-06, "loss": 0.9409, "step": 16680 }, { "epoch": 0.31, "learning_rate": 4.010384563521384e-06, "loss": 1.1315, "step": 16681 }, { "epoch": 0.31, "learning_rate": 4.010262826779584e-06, "loss": 1.1277, "step": 16682 }, { "epoch": 0.31, "learning_rate": 4.010141084398507e-06, "loss": 0.9153, "step": 16683 }, { "epoch": 0.31, "learning_rate": 4.010019336378611e-06, "loss": 0.9853, "step": 16684 }, { "epoch": 0.31, "learning_rate": 4.0098975827203476e-06, "loss": 0.8435, "step": 16685 }, { "epoch": 0.31, "learning_rate": 4.009775823424174e-06, "loss": 0.9411, "step": 16686 }, { "epoch": 0.31, "learning_rate": 4.009654058490543e-06, "loss": 1.1062, "step": 16687 }, { "epoch": 0.31, "learning_rate": 4.00953228791991e-06, "loss": 1.1481, "step": 16688 }, { "epoch": 0.31, "learning_rate": 4.009410511712731e-06, "loss": 0.8584, "step": 16689 }, { "epoch": 0.31, "learning_rate": 4.009288729869458e-06, "loss": 1.0773, "step": 16690 }, { "epoch": 0.31, "learning_rate": 4.009166942390548e-06, "loss": 0.9623, "step": 16691 }, { "epoch": 0.31, "learning_rate": 4.009045149276455e-06, "loss": 0.8458, "step": 16692 }, { "epoch": 0.31, "learning_rate": 4.008923350527633e-06, "loss": 1.0371, "step": 16693 }, { "epoch": 0.31, "learning_rate": 4.008801546144538e-06, "loss": 0.9485, "step": 16694 }, { "epoch": 0.31, "learning_rate": 4.008679736127624e-06, "loss": 0.8202, "step": 16695 }, { "epoch": 0.32, "learning_rate": 4.008557920477346e-06, "loss": 1.0667, "step": 16696 }, { "epoch": 0.32, "learning_rate": 4.008436099194159e-06, "loss": 0.8307, "step": 16697 }, { "epoch": 0.32, "learning_rate": 4.0083142722785175e-06, "loss": 0.9517, "step": 16698 }, { "epoch": 0.32, "learning_rate": 4.008192439730878e-06, "loss": 1.1945, "step": 16699 }, { "epoch": 0.32, "learning_rate": 4.008070601551693e-06, "loss": 1.2996, "step": 16700 }, { "epoch": 0.32, "learning_rate": 4.007948757741419e-06, "loss": 0.9939, "step": 16701 }, { "epoch": 0.32, "learning_rate": 4.007826908300511e-06, "loss": 1.0854, "step": 16702 }, { "epoch": 0.32, "learning_rate": 4.0077050532294225e-06, "loss": 1.013, "step": 16703 }, { "epoch": 0.32, "learning_rate": 4.007583192528611e-06, "loss": 0.8695, "step": 16704 }, { "epoch": 0.32, "learning_rate": 4.007461326198529e-06, "loss": 0.9393, "step": 16705 }, { "epoch": 0.32, "learning_rate": 4.007339454239632e-06, "loss": 1.0001, "step": 16706 }, { "epoch": 0.32, "learning_rate": 4.007217576652378e-06, "loss": 1.0112, "step": 16707 }, { "epoch": 0.32, "learning_rate": 4.007095693437218e-06, "loss": 1.2351, "step": 16708 }, { "epoch": 0.32, "learning_rate": 4.00697380459461e-06, "loss": 0.9285, "step": 16709 }, { "epoch": 0.32, "learning_rate": 4.006851910125007e-06, "loss": 0.8928, "step": 16710 }, { "epoch": 0.32, "learning_rate": 4.0067300100288655e-06, "loss": 0.9534, "step": 16711 }, { "epoch": 0.32, "learning_rate": 4.00660810430664e-06, "loss": 0.9583, "step": 16712 }, { "epoch": 0.32, "learning_rate": 4.006486192958786e-06, "loss": 0.9324, "step": 16713 }, { "epoch": 0.32, "learning_rate": 4.006364275985759e-06, "loss": 0.9626, "step": 16714 }, { "epoch": 0.32, "learning_rate": 4.0062423533880144e-06, "loss": 0.8296, "step": 16715 }, { "epoch": 0.32, "learning_rate": 4.006120425166007e-06, "loss": 0.9298, "step": 16716 }, { "epoch": 0.32, "learning_rate": 4.005998491320192e-06, "loss": 0.8246, "step": 16717 }, { "epoch": 0.32, "learning_rate": 4.005876551851024e-06, "loss": 1.1719, "step": 16718 }, { "epoch": 0.32, "learning_rate": 4.005754606758961e-06, "loss": 1.1466, "step": 16719 }, { "epoch": 0.32, "learning_rate": 4.005632656044454e-06, "loss": 0.9878, "step": 16720 }, { "epoch": 0.32, "learning_rate": 4.005510699707962e-06, "loss": 0.8069, "step": 16721 }, { "epoch": 0.32, "learning_rate": 4.00538873774994e-06, "loss": 0.7568, "step": 16722 }, { "epoch": 0.32, "learning_rate": 4.005266770170841e-06, "loss": 0.735, "step": 16723 }, { "epoch": 0.32, "learning_rate": 4.0051447969711236e-06, "loss": 0.933, "step": 16724 }, { "epoch": 0.32, "learning_rate": 4.0050228181512404e-06, "loss": 1.3341, "step": 16725 }, { "epoch": 0.32, "learning_rate": 4.0049008337116495e-06, "loss": 1.0251, "step": 16726 }, { "epoch": 0.32, "learning_rate": 4.004778843652805e-06, "loss": 0.8188, "step": 16727 }, { "epoch": 0.32, "learning_rate": 4.004656847975161e-06, "loss": 0.7017, "step": 16728 }, { "epoch": 0.32, "learning_rate": 4.004534846679175e-06, "loss": 0.8786, "step": 16729 }, { "epoch": 0.32, "learning_rate": 4.004412839765302e-06, "loss": 0.9629, "step": 16730 }, { "epoch": 0.32, "learning_rate": 4.004290827233998e-06, "loss": 1.1556, "step": 16731 }, { "epoch": 0.32, "learning_rate": 4.004168809085718e-06, "loss": 0.8207, "step": 16732 }, { "epoch": 0.32, "learning_rate": 4.004046785320918e-06, "loss": 0.9103, "step": 16733 }, { "epoch": 0.32, "learning_rate": 4.003924755940053e-06, "loss": 0.7106, "step": 16734 }, { "epoch": 0.32, "learning_rate": 4.003802720943579e-06, "loss": 0.9811, "step": 16735 }, { "epoch": 0.32, "learning_rate": 4.003680680331952e-06, "loss": 0.9026, "step": 16736 }, { "epoch": 0.32, "learning_rate": 4.003558634105627e-06, "loss": 1.021, "step": 16737 }, { "epoch": 0.32, "learning_rate": 4.003436582265061e-06, "loss": 1.0337, "step": 16738 }, { "epoch": 0.32, "learning_rate": 4.003314524810708e-06, "loss": 0.9223, "step": 16739 }, { "epoch": 0.32, "learning_rate": 4.0031924617430255e-06, "loss": 0.9246, "step": 16740 }, { "epoch": 0.32, "learning_rate": 4.003070393062467e-06, "loss": 1.0557, "step": 16741 }, { "epoch": 0.32, "learning_rate": 4.002948318769492e-06, "loss": 1.033, "step": 16742 }, { "epoch": 0.32, "learning_rate": 4.002826238864552e-06, "loss": 1.1197, "step": 16743 }, { "epoch": 0.32, "learning_rate": 4.002704153348106e-06, "loss": 1.1089, "step": 16744 }, { "epoch": 0.32, "learning_rate": 4.002582062220609e-06, "loss": 0.9631, "step": 16745 }, { "epoch": 0.32, "learning_rate": 4.0024599654825154e-06, "loss": 1.0156, "step": 16746 }, { "epoch": 0.32, "learning_rate": 4.002337863134283e-06, "loss": 1.0277, "step": 16747 }, { "epoch": 0.32, "learning_rate": 4.0022157551763676e-06, "loss": 0.7582, "step": 16748 }, { "epoch": 0.32, "learning_rate": 4.0020936416092245e-06, "loss": 1.033, "step": 16749 }, { "epoch": 0.32, "learning_rate": 4.001971522433309e-06, "loss": 1.0247, "step": 16750 }, { "epoch": 0.32, "learning_rate": 4.001849397649079e-06, "loss": 1.0196, "step": 16751 }, { "epoch": 0.32, "learning_rate": 4.001727267256988e-06, "loss": 0.9043, "step": 16752 }, { "epoch": 0.32, "learning_rate": 4.001605131257495e-06, "loss": 0.7322, "step": 16753 }, { "epoch": 0.32, "learning_rate": 4.001482989651054e-06, "loss": 0.8926, "step": 16754 }, { "epoch": 0.32, "learning_rate": 4.001360842438121e-06, "loss": 1.1511, "step": 16755 }, { "epoch": 0.32, "learning_rate": 4.001238689619152e-06, "loss": 1.2008, "step": 16756 }, { "epoch": 0.32, "learning_rate": 4.0011165311946054e-06, "loss": 0.9129, "step": 16757 }, { "epoch": 0.32, "learning_rate": 4.000994367164935e-06, "loss": 1.0869, "step": 16758 }, { "epoch": 0.32, "learning_rate": 4.0008721975305975e-06, "loss": 0.7513, "step": 16759 }, { "epoch": 0.32, "learning_rate": 4.000750022292049e-06, "loss": 0.8547, "step": 16760 }, { "epoch": 0.32, "learning_rate": 4.0006278414497465e-06, "loss": 0.9344, "step": 16761 }, { "epoch": 0.32, "learning_rate": 4.000505655004145e-06, "loss": 1.1824, "step": 16762 }, { "epoch": 0.32, "learning_rate": 4.000383462955702e-06, "loss": 1.1408, "step": 16763 }, { "epoch": 0.32, "learning_rate": 4.0002612653048735e-06, "loss": 1.0595, "step": 16764 }, { "epoch": 0.32, "learning_rate": 4.000139062052115e-06, "loss": 0.9857, "step": 16765 }, { "epoch": 0.32, "learning_rate": 4.000016853197884e-06, "loss": 0.9399, "step": 16766 }, { "epoch": 0.32, "learning_rate": 3.999894638742634e-06, "loss": 0.873, "step": 16767 }, { "epoch": 0.32, "learning_rate": 3.999772418686825e-06, "loss": 0.9833, "step": 16768 }, { "epoch": 0.32, "learning_rate": 3.999650193030912e-06, "loss": 1.0228, "step": 16769 }, { "epoch": 0.32, "learning_rate": 3.99952796177535e-06, "loss": 0.7132, "step": 16770 }, { "epoch": 0.32, "learning_rate": 3.999405724920596e-06, "loss": 0.8562, "step": 16771 }, { "epoch": 0.32, "learning_rate": 3.999283482467109e-06, "loss": 0.8004, "step": 16772 }, { "epoch": 0.32, "learning_rate": 3.999161234415343e-06, "loss": 0.9361, "step": 16773 }, { "epoch": 0.32, "learning_rate": 3.999038980765754e-06, "loss": 1.1877, "step": 16774 }, { "epoch": 0.32, "learning_rate": 3.9989167215188e-06, "loss": 0.9512, "step": 16775 }, { "epoch": 0.32, "learning_rate": 3.998794456674937e-06, "loss": 0.8245, "step": 16776 }, { "epoch": 0.32, "learning_rate": 3.998672186234621e-06, "loss": 0.9666, "step": 16777 }, { "epoch": 0.32, "learning_rate": 3.99854991019831e-06, "loss": 0.9454, "step": 16778 }, { "epoch": 0.32, "learning_rate": 3.998427628566458e-06, "loss": 0.8828, "step": 16779 }, { "epoch": 0.32, "learning_rate": 3.998305341339525e-06, "loss": 1.1826, "step": 16780 }, { "epoch": 0.32, "learning_rate": 3.998183048517964e-06, "loss": 1.2549, "step": 16781 }, { "epoch": 0.32, "learning_rate": 3.9980607501022335e-06, "loss": 1.0095, "step": 16782 }, { "epoch": 0.32, "learning_rate": 3.997938446092792e-06, "loss": 0.9126, "step": 16783 }, { "epoch": 0.32, "learning_rate": 3.997816136490093e-06, "loss": 0.9241, "step": 16784 }, { "epoch": 0.32, "learning_rate": 3.997693821294594e-06, "loss": 0.8271, "step": 16785 }, { "epoch": 0.32, "learning_rate": 3.997571500506753e-06, "loss": 1.0754, "step": 16786 }, { "epoch": 0.32, "learning_rate": 3.997449174127026e-06, "loss": 1.0468, "step": 16787 }, { "epoch": 0.32, "learning_rate": 3.997326842155869e-06, "loss": 1.0305, "step": 16788 }, { "epoch": 0.32, "learning_rate": 3.99720450459374e-06, "loss": 0.9187, "step": 16789 }, { "epoch": 0.32, "learning_rate": 3.997082161441096e-06, "loss": 0.8872, "step": 16790 }, { "epoch": 0.32, "learning_rate": 3.996959812698392e-06, "loss": 1.0578, "step": 16791 }, { "epoch": 0.32, "learning_rate": 3.996837458366086e-06, "loss": 0.8203, "step": 16792 }, { "epoch": 0.32, "learning_rate": 3.996715098444635e-06, "loss": 1.3089, "step": 16793 }, { "epoch": 0.32, "learning_rate": 3.996592732934495e-06, "loss": 0.9197, "step": 16794 }, { "epoch": 0.32, "learning_rate": 3.996470361836125e-06, "loss": 0.8403, "step": 16795 }, { "epoch": 0.32, "learning_rate": 3.99634798514998e-06, "loss": 0.9991, "step": 16796 }, { "epoch": 0.32, "learning_rate": 3.996225602876518e-06, "loss": 0.8411, "step": 16797 }, { "epoch": 0.32, "learning_rate": 3.9961032150161945e-06, "loss": 0.853, "step": 16798 }, { "epoch": 0.32, "learning_rate": 3.995980821569468e-06, "loss": 1.012, "step": 16799 }, { "epoch": 0.32, "learning_rate": 3.995858422536795e-06, "loss": 1.0711, "step": 16800 }, { "epoch": 0.32, "learning_rate": 3.995736017918632e-06, "loss": 1.0562, "step": 16801 }, { "epoch": 0.32, "learning_rate": 3.995613607715437e-06, "loss": 0.8289, "step": 16802 }, { "epoch": 0.32, "learning_rate": 3.995491191927667e-06, "loss": 0.9923, "step": 16803 }, { "epoch": 0.32, "learning_rate": 3.995368770555777e-06, "loss": 0.8812, "step": 16804 }, { "epoch": 0.32, "learning_rate": 3.995246343600228e-06, "loss": 1.1308, "step": 16805 }, { "epoch": 0.32, "learning_rate": 3.995123911061474e-06, "loss": 1.1208, "step": 16806 }, { "epoch": 0.32, "learning_rate": 3.995001472939973e-06, "loss": 1.0164, "step": 16807 }, { "epoch": 0.32, "learning_rate": 3.994879029236184e-06, "loss": 0.9213, "step": 16808 }, { "epoch": 0.32, "learning_rate": 3.99475657995056e-06, "loss": 0.8431, "step": 16809 }, { "epoch": 0.32, "learning_rate": 3.994634125083563e-06, "loss": 0.7826, "step": 16810 }, { "epoch": 0.32, "learning_rate": 3.994511664635647e-06, "loss": 0.9969, "step": 16811 }, { "epoch": 0.32, "learning_rate": 3.99438919860727e-06, "loss": 1.1213, "step": 16812 }, { "epoch": 0.32, "learning_rate": 3.99426672699889e-06, "loss": 0.8962, "step": 16813 }, { "epoch": 0.32, "learning_rate": 3.994144249810964e-06, "loss": 1.0528, "step": 16814 }, { "epoch": 0.32, "learning_rate": 3.994021767043948e-06, "loss": 0.8395, "step": 16815 }, { "epoch": 0.32, "learning_rate": 3.993899278698302e-06, "loss": 0.9708, "step": 16816 }, { "epoch": 0.32, "learning_rate": 3.9937767847744815e-06, "loss": 0.8152, "step": 16817 }, { "epoch": 0.32, "learning_rate": 3.993654285272944e-06, "loss": 0.9592, "step": 16818 }, { "epoch": 0.32, "learning_rate": 3.993531780194147e-06, "loss": 0.9073, "step": 16819 }, { "epoch": 0.32, "learning_rate": 3.993409269538549e-06, "loss": 0.8468, "step": 16820 }, { "epoch": 0.32, "learning_rate": 3.993286753306606e-06, "loss": 0.9622, "step": 16821 }, { "epoch": 0.32, "learning_rate": 3.993164231498775e-06, "loss": 0.8041, "step": 16822 }, { "epoch": 0.32, "learning_rate": 3.993041704115516e-06, "loss": 0.8541, "step": 16823 }, { "epoch": 0.32, "learning_rate": 3.992919171157284e-06, "loss": 0.8451, "step": 16824 }, { "epoch": 0.32, "learning_rate": 3.992796632624538e-06, "loss": 1.1044, "step": 16825 }, { "epoch": 0.32, "learning_rate": 3.992674088517736e-06, "loss": 0.8296, "step": 16826 }, { "epoch": 0.32, "learning_rate": 3.9925515388373334e-06, "loss": 0.8796, "step": 16827 }, { "epoch": 0.32, "learning_rate": 3.99242898358379e-06, "loss": 0.8152, "step": 16828 }, { "epoch": 0.32, "learning_rate": 3.992306422757562e-06, "loss": 0.987, "step": 16829 }, { "epoch": 0.32, "learning_rate": 3.9921838563591085e-06, "loss": 1.0593, "step": 16830 }, { "epoch": 0.32, "learning_rate": 3.9920612843888856e-06, "loss": 1.0566, "step": 16831 }, { "epoch": 0.32, "learning_rate": 3.991938706847352e-06, "loss": 0.8534, "step": 16832 }, { "epoch": 0.32, "learning_rate": 3.991816123734964e-06, "loss": 1.003, "step": 16833 }, { "epoch": 0.32, "learning_rate": 3.991693535052182e-06, "loss": 0.9259, "step": 16834 }, { "epoch": 0.32, "learning_rate": 3.991570940799461e-06, "loss": 0.9242, "step": 16835 }, { "epoch": 0.32, "learning_rate": 3.99144834097726e-06, "loss": 0.8167, "step": 16836 }, { "epoch": 0.32, "learning_rate": 3.991325735586036e-06, "loss": 1.0656, "step": 16837 }, { "epoch": 0.32, "learning_rate": 3.991203124626249e-06, "loss": 1.1046, "step": 16838 }, { "epoch": 0.32, "learning_rate": 3.991080508098353e-06, "loss": 1.0629, "step": 16839 }, { "epoch": 0.32, "learning_rate": 3.99095788600281e-06, "loss": 0.8301, "step": 16840 }, { "epoch": 0.32, "learning_rate": 3.990835258340074e-06, "loss": 0.9033, "step": 16841 }, { "epoch": 0.32, "learning_rate": 3.9907126251106065e-06, "loss": 0.6803, "step": 16842 }, { "epoch": 0.32, "learning_rate": 3.990589986314864e-06, "loss": 0.9356, "step": 16843 }, { "epoch": 0.32, "learning_rate": 3.9904673419533036e-06, "loss": 1.166, "step": 16844 }, { "epoch": 0.32, "learning_rate": 3.990344692026383e-06, "loss": 1.08, "step": 16845 }, { "epoch": 0.32, "learning_rate": 3.990222036534562e-06, "loss": 0.8566, "step": 16846 }, { "epoch": 0.32, "learning_rate": 3.9900993754782976e-06, "loss": 1.0634, "step": 16847 }, { "epoch": 0.32, "learning_rate": 3.9899767088580475e-06, "loss": 0.7017, "step": 16848 }, { "epoch": 0.32, "learning_rate": 3.989854036674271e-06, "loss": 1.1767, "step": 16849 }, { "epoch": 0.32, "learning_rate": 3.989731358927424e-06, "loss": 0.8582, "step": 16850 }, { "epoch": 0.32, "learning_rate": 3.9896086756179666e-06, "loss": 0.9738, "step": 16851 }, { "epoch": 0.32, "learning_rate": 3.989485986746356e-06, "loss": 0.8732, "step": 16852 }, { "epoch": 0.32, "learning_rate": 3.9893632923130495e-06, "loss": 0.9888, "step": 16853 }, { "epoch": 0.32, "learning_rate": 3.989240592318506e-06, "loss": 1.0234, "step": 16854 }, { "epoch": 0.32, "learning_rate": 3.9891178867631855e-06, "loss": 0.8453, "step": 16855 }, { "epoch": 0.32, "learning_rate": 3.988995175647543e-06, "loss": 1.2336, "step": 16856 }, { "epoch": 0.32, "learning_rate": 3.988872458972039e-06, "loss": 1.0785, "step": 16857 }, { "epoch": 0.32, "learning_rate": 3.988749736737131e-06, "loss": 0.8612, "step": 16858 }, { "epoch": 0.32, "learning_rate": 3.988627008943276e-06, "loss": 1.061, "step": 16859 }, { "epoch": 0.32, "learning_rate": 3.988504275590935e-06, "loss": 0.8893, "step": 16860 }, { "epoch": 0.32, "learning_rate": 3.988381536680563e-06, "loss": 0.9674, "step": 16861 }, { "epoch": 0.32, "learning_rate": 3.9882587922126205e-06, "loss": 1.1358, "step": 16862 }, { "epoch": 0.32, "learning_rate": 3.988136042187565e-06, "loss": 0.9721, "step": 16863 }, { "epoch": 0.32, "learning_rate": 3.988013286605856e-06, "loss": 0.9789, "step": 16864 }, { "epoch": 0.32, "learning_rate": 3.987890525467951e-06, "loss": 1.0828, "step": 16865 }, { "epoch": 0.32, "learning_rate": 3.987767758774308e-06, "loss": 1.1273, "step": 16866 }, { "epoch": 0.32, "learning_rate": 3.987644986525386e-06, "loss": 0.8469, "step": 16867 }, { "epoch": 0.32, "learning_rate": 3.987522208721643e-06, "loss": 1.0625, "step": 16868 }, { "epoch": 0.32, "learning_rate": 3.987399425363537e-06, "loss": 1.1447, "step": 16869 }, { "epoch": 0.32, "learning_rate": 3.987276636451529e-06, "loss": 1.0738, "step": 16870 }, { "epoch": 0.32, "learning_rate": 3.987153841986074e-06, "loss": 1.0352, "step": 16871 }, { "epoch": 0.32, "learning_rate": 3.987031041967633e-06, "loss": 0.8402, "step": 16872 }, { "epoch": 0.32, "learning_rate": 3.9869082363966635e-06, "loss": 0.8453, "step": 16873 }, { "epoch": 0.32, "learning_rate": 3.9867854252736235e-06, "loss": 1.0213, "step": 16874 }, { "epoch": 0.32, "learning_rate": 3.986662608598973e-06, "loss": 1.1476, "step": 16875 }, { "epoch": 0.32, "learning_rate": 3.9865397863731705e-06, "loss": 0.9648, "step": 16876 }, { "epoch": 0.32, "learning_rate": 3.986416958596672e-06, "loss": 0.873, "step": 16877 }, { "epoch": 0.32, "learning_rate": 3.98629412526994e-06, "loss": 0.8186, "step": 16878 }, { "epoch": 0.32, "learning_rate": 3.986171286393431e-06, "loss": 0.9587, "step": 16879 }, { "epoch": 0.32, "learning_rate": 3.986048441967604e-06, "loss": 1.009, "step": 16880 }, { "epoch": 0.32, "learning_rate": 3.985925591992917e-06, "loss": 1.1528, "step": 16881 }, { "epoch": 0.32, "learning_rate": 3.98580273646983e-06, "loss": 0.9171, "step": 16882 }, { "epoch": 0.32, "learning_rate": 3.9856798753988015e-06, "loss": 0.9061, "step": 16883 }, { "epoch": 0.32, "learning_rate": 3.985557008780289e-06, "loss": 1.0234, "step": 16884 }, { "epoch": 0.32, "learning_rate": 3.985434136614753e-06, "loss": 0.7083, "step": 16885 }, { "epoch": 0.32, "learning_rate": 3.985311258902651e-06, "loss": 0.9521, "step": 16886 }, { "epoch": 0.32, "learning_rate": 3.985188375644442e-06, "loss": 1.0258, "step": 16887 }, { "epoch": 0.32, "learning_rate": 3.985065486840586e-06, "loss": 1.0217, "step": 16888 }, { "epoch": 0.32, "learning_rate": 3.98494259249154e-06, "loss": 0.8495, "step": 16889 }, { "epoch": 0.32, "learning_rate": 3.984819692597764e-06, "loss": 0.9964, "step": 16890 }, { "epoch": 0.32, "learning_rate": 3.984696787159718e-06, "loss": 0.9993, "step": 16891 }, { "epoch": 0.32, "learning_rate": 3.984573876177859e-06, "loss": 0.9141, "step": 16892 }, { "epoch": 0.32, "learning_rate": 3.984450959652646e-06, "loss": 1.0208, "step": 16893 }, { "epoch": 0.32, "learning_rate": 3.984328037584539e-06, "loss": 1.0575, "step": 16894 }, { "epoch": 0.32, "learning_rate": 3.984205109973998e-06, "loss": 0.7996, "step": 16895 }, { "epoch": 0.32, "learning_rate": 3.984082176821479e-06, "loss": 0.804, "step": 16896 }, { "epoch": 0.32, "learning_rate": 3.983959238127443e-06, "loss": 0.9134, "step": 16897 }, { "epoch": 0.32, "learning_rate": 3.983836293892349e-06, "loss": 0.8694, "step": 16898 }, { "epoch": 0.32, "learning_rate": 3.983713344116656e-06, "loss": 1.0975, "step": 16899 }, { "epoch": 0.32, "learning_rate": 3.983590388800822e-06, "loss": 1.1209, "step": 16900 }, { "epoch": 0.32, "learning_rate": 3.983467427945307e-06, "loss": 0.8541, "step": 16901 }, { "epoch": 0.32, "learning_rate": 3.9833444615505704e-06, "loss": 0.8176, "step": 16902 }, { "epoch": 0.32, "learning_rate": 3.983221489617072e-06, "loss": 0.7339, "step": 16903 }, { "epoch": 0.32, "learning_rate": 3.983098512145269e-06, "loss": 0.9749, "step": 16904 }, { "epoch": 0.32, "learning_rate": 3.982975529135621e-06, "loss": 0.862, "step": 16905 }, { "epoch": 0.32, "learning_rate": 3.9828525405885894e-06, "loss": 1.0181, "step": 16906 }, { "epoch": 0.32, "learning_rate": 3.982729546504631e-06, "loss": 1.0261, "step": 16907 }, { "epoch": 0.32, "learning_rate": 3.982606546884206e-06, "loss": 0.9451, "step": 16908 }, { "epoch": 0.32, "learning_rate": 3.982483541727774e-06, "loss": 0.7663, "step": 16909 }, { "epoch": 0.32, "learning_rate": 3.982360531035794e-06, "loss": 1.0239, "step": 16910 }, { "epoch": 0.32, "learning_rate": 3.982237514808724e-06, "loss": 0.8328, "step": 16911 }, { "epoch": 0.32, "learning_rate": 3.982114493047026e-06, "loss": 0.951, "step": 16912 }, { "epoch": 0.32, "learning_rate": 3.981991465751157e-06, "loss": 0.9946, "step": 16913 }, { "epoch": 0.32, "learning_rate": 3.9818684329215776e-06, "loss": 0.9424, "step": 16914 }, { "epoch": 0.32, "learning_rate": 3.9817453945587475e-06, "loss": 1.0767, "step": 16915 }, { "epoch": 0.32, "learning_rate": 3.981622350663124e-06, "loss": 0.9869, "step": 16916 }, { "epoch": 0.32, "learning_rate": 3.98149930123517e-06, "loss": 0.9178, "step": 16917 }, { "epoch": 0.32, "learning_rate": 3.981376246275343e-06, "loss": 0.8267, "step": 16918 }, { "epoch": 0.32, "learning_rate": 3.981253185784101e-06, "loss": 0.9409, "step": 16919 }, { "epoch": 0.32, "learning_rate": 3.981130119761905e-06, "loss": 0.7475, "step": 16920 }, { "epoch": 0.32, "learning_rate": 3.981007048209215e-06, "loss": 0.7904, "step": 16921 }, { "epoch": 0.32, "learning_rate": 3.980883971126491e-06, "loss": 0.9479, "step": 16922 }, { "epoch": 0.32, "learning_rate": 3.98076088851419e-06, "loss": 0.7591, "step": 16923 }, { "epoch": 0.32, "learning_rate": 3.980637800372775e-06, "loss": 0.9093, "step": 16924 }, { "epoch": 0.32, "learning_rate": 3.980514706702703e-06, "loss": 0.9293, "step": 16925 }, { "epoch": 0.32, "learning_rate": 3.980391607504435e-06, "loss": 0.9366, "step": 16926 }, { "epoch": 0.32, "learning_rate": 3.980268502778429e-06, "loss": 0.8864, "step": 16927 }, { "epoch": 0.32, "learning_rate": 3.980145392525147e-06, "loss": 0.8516, "step": 16928 }, { "epoch": 0.32, "learning_rate": 3.980022276745046e-06, "loss": 0.7541, "step": 16929 }, { "epoch": 0.32, "learning_rate": 3.979899155438589e-06, "loss": 0.906, "step": 16930 }, { "epoch": 0.32, "learning_rate": 3.979776028606233e-06, "loss": 1.1071, "step": 16931 }, { "epoch": 0.32, "learning_rate": 3.979652896248439e-06, "loss": 1.1666, "step": 16932 }, { "epoch": 0.32, "learning_rate": 3.979529758365665e-06, "loss": 0.9116, "step": 16933 }, { "epoch": 0.32, "learning_rate": 3.979406614958374e-06, "loss": 0.938, "step": 16934 }, { "epoch": 0.32, "learning_rate": 3.979283466027023e-06, "loss": 0.9804, "step": 16935 }, { "epoch": 0.32, "learning_rate": 3.979160311572073e-06, "loss": 0.755, "step": 16936 }, { "epoch": 0.32, "learning_rate": 3.979037151593985e-06, "loss": 1.1014, "step": 16937 }, { "epoch": 0.32, "learning_rate": 3.978913986093217e-06, "loss": 0.9001, "step": 16938 }, { "epoch": 0.32, "learning_rate": 3.978790815070229e-06, "loss": 0.859, "step": 16939 }, { "epoch": 0.32, "learning_rate": 3.978667638525482e-06, "loss": 0.8412, "step": 16940 }, { "epoch": 0.32, "learning_rate": 3.9785444564594345e-06, "loss": 0.8383, "step": 16941 }, { "epoch": 0.32, "learning_rate": 3.978421268872548e-06, "loss": 0.9467, "step": 16942 }, { "epoch": 0.32, "learning_rate": 3.978298075765282e-06, "loss": 1.1151, "step": 16943 }, { "epoch": 0.32, "learning_rate": 3.978174877138096e-06, "loss": 1.178, "step": 16944 }, { "epoch": 0.32, "learning_rate": 3.97805167299145e-06, "loss": 1.024, "step": 16945 }, { "epoch": 0.32, "learning_rate": 3.9779284633258045e-06, "loss": 0.9877, "step": 16946 }, { "epoch": 0.32, "learning_rate": 3.9778052481416195e-06, "loss": 0.9131, "step": 16947 }, { "epoch": 0.32, "learning_rate": 3.977682027439355e-06, "loss": 1.1636, "step": 16948 }, { "epoch": 0.32, "learning_rate": 3.977558801219472e-06, "loss": 0.975, "step": 16949 }, { "epoch": 0.32, "learning_rate": 3.9774355694824284e-06, "loss": 0.9057, "step": 16950 }, { "epoch": 0.32, "learning_rate": 3.9773123322286865e-06, "loss": 0.8065, "step": 16951 }, { "epoch": 0.32, "learning_rate": 3.977189089458706e-06, "loss": 0.8066, "step": 16952 }, { "epoch": 0.32, "learning_rate": 3.977065841172946e-06, "loss": 1.0396, "step": 16953 }, { "epoch": 0.32, "learning_rate": 3.976942587371868e-06, "loss": 0.861, "step": 16954 }, { "epoch": 0.32, "learning_rate": 3.976819328055931e-06, "loss": 0.9515, "step": 16955 }, { "epoch": 0.32, "learning_rate": 3.9766960632255956e-06, "loss": 1.1485, "step": 16956 }, { "epoch": 0.32, "learning_rate": 3.976572792881324e-06, "loss": 1.0043, "step": 16957 }, { "epoch": 0.32, "learning_rate": 3.9764495170235735e-06, "loss": 0.9222, "step": 16958 }, { "epoch": 0.32, "learning_rate": 3.9763262356528065e-06, "loss": 0.9078, "step": 16959 }, { "epoch": 0.32, "learning_rate": 3.976202948769482e-06, "loss": 0.7743, "step": 16960 }, { "epoch": 0.32, "learning_rate": 3.9760796563740614e-06, "loss": 0.7923, "step": 16961 }, { "epoch": 0.32, "learning_rate": 3.975956358467004e-06, "loss": 1.072, "step": 16962 }, { "epoch": 0.32, "learning_rate": 3.975833055048771e-06, "loss": 0.9411, "step": 16963 }, { "epoch": 0.32, "learning_rate": 3.975709746119823e-06, "loss": 0.7124, "step": 16964 }, { "epoch": 0.32, "learning_rate": 3.97558643168062e-06, "loss": 0.6657, "step": 16965 }, { "epoch": 0.32, "learning_rate": 3.975463111731622e-06, "loss": 0.9667, "step": 16966 }, { "epoch": 0.32, "learning_rate": 3.97533978627329e-06, "loss": 0.9623, "step": 16967 }, { "epoch": 0.32, "learning_rate": 3.975216455306086e-06, "loss": 1.072, "step": 16968 }, { "epoch": 0.32, "learning_rate": 3.975093118830468e-06, "loss": 1.1499, "step": 16969 }, { "epoch": 0.32, "learning_rate": 3.974969776846896e-06, "loss": 0.9582, "step": 16970 }, { "epoch": 0.32, "learning_rate": 3.9748464293558345e-06, "loss": 0.8726, "step": 16971 }, { "epoch": 0.32, "learning_rate": 3.97472307635774e-06, "loss": 0.7869, "step": 16972 }, { "epoch": 0.32, "learning_rate": 3.9745997178530746e-06, "loss": 0.8078, "step": 16973 }, { "epoch": 0.32, "learning_rate": 3.9744763538423005e-06, "loss": 1.0991, "step": 16974 }, { "epoch": 0.32, "learning_rate": 3.974352984325877e-06, "loss": 0.8972, "step": 16975 }, { "epoch": 0.32, "learning_rate": 3.974229609304263e-06, "loss": 0.9807, "step": 16976 }, { "epoch": 0.32, "learning_rate": 3.974106228777922e-06, "loss": 1.0224, "step": 16977 }, { "epoch": 0.32, "learning_rate": 3.973982842747313e-06, "loss": 0.9545, "step": 16978 }, { "epoch": 0.32, "learning_rate": 3.973859451212897e-06, "loss": 0.9319, "step": 16979 }, { "epoch": 0.32, "learning_rate": 3.973736054175135e-06, "loss": 0.8454, "step": 16980 }, { "epoch": 0.32, "learning_rate": 3.973612651634489e-06, "loss": 1.0703, "step": 16981 }, { "epoch": 0.32, "learning_rate": 3.973489243591418e-06, "loss": 0.9014, "step": 16982 }, { "epoch": 0.32, "learning_rate": 3.9733658300463825e-06, "loss": 0.8678, "step": 16983 }, { "epoch": 0.32, "learning_rate": 3.973242410999846e-06, "loss": 0.83, "step": 16984 }, { "epoch": 0.32, "learning_rate": 3.973118986452266e-06, "loss": 0.8235, "step": 16985 }, { "epoch": 0.32, "learning_rate": 3.972995556404105e-06, "loss": 0.801, "step": 16986 }, { "epoch": 0.32, "learning_rate": 3.9728721208558245e-06, "loss": 1.0571, "step": 16987 }, { "epoch": 0.32, "learning_rate": 3.972748679807883e-06, "loss": 1.1262, "step": 16988 }, { "epoch": 0.32, "learning_rate": 3.972625233260745e-06, "loss": 0.8259, "step": 16989 }, { "epoch": 0.32, "learning_rate": 3.972501781214868e-06, "loss": 0.9247, "step": 16990 }, { "epoch": 0.32, "learning_rate": 3.972378323670715e-06, "loss": 0.9234, "step": 16991 }, { "epoch": 0.32, "learning_rate": 3.972254860628748e-06, "loss": 0.7646, "step": 16992 }, { "epoch": 0.32, "learning_rate": 3.972131392089425e-06, "loss": 0.9937, "step": 16993 }, { "epoch": 0.32, "learning_rate": 3.972007918053208e-06, "loss": 1.2339, "step": 16994 }, { "epoch": 0.32, "learning_rate": 3.97188443852056e-06, "loss": 0.9179, "step": 16995 }, { "epoch": 0.32, "learning_rate": 3.97176095349194e-06, "loss": 0.7029, "step": 16996 }, { "epoch": 0.32, "learning_rate": 3.971637462967809e-06, "loss": 0.8807, "step": 16997 }, { "epoch": 0.32, "learning_rate": 3.9715139669486295e-06, "loss": 0.8704, "step": 16998 }, { "epoch": 0.32, "learning_rate": 3.971390465434862e-06, "loss": 0.9941, "step": 16999 }, { "epoch": 0.32, "learning_rate": 3.971266958426967e-06, "loss": 1.0936, "step": 17000 }, { "epoch": 0.32, "learning_rate": 3.971143445925407e-06, "loss": 0.9402, "step": 17001 }, { "epoch": 0.32, "learning_rate": 3.9710199279306424e-06, "loss": 1.0703, "step": 17002 }, { "epoch": 0.32, "learning_rate": 3.970896404443134e-06, "loss": 0.8808, "step": 17003 }, { "epoch": 0.32, "learning_rate": 3.970772875463345e-06, "loss": 0.8658, "step": 17004 }, { "epoch": 0.32, "learning_rate": 3.970649340991734e-06, "loss": 1.0139, "step": 17005 }, { "epoch": 0.32, "learning_rate": 3.970525801028763e-06, "loss": 1.2486, "step": 17006 }, { "epoch": 0.32, "learning_rate": 3.970402255574894e-06, "loss": 0.7445, "step": 17007 }, { "epoch": 0.32, "learning_rate": 3.970278704630589e-06, "loss": 0.7378, "step": 17008 }, { "epoch": 0.32, "learning_rate": 3.9701551481963076e-06, "loss": 0.9335, "step": 17009 }, { "epoch": 0.32, "learning_rate": 3.970031586272512e-06, "loss": 0.9033, "step": 17010 }, { "epoch": 0.32, "learning_rate": 3.969908018859663e-06, "loss": 0.8734, "step": 17011 }, { "epoch": 0.32, "learning_rate": 3.969784445958224e-06, "loss": 1.092, "step": 17012 }, { "epoch": 0.32, "learning_rate": 3.969660867568655e-06, "loss": 1.025, "step": 17013 }, { "epoch": 0.32, "learning_rate": 3.969537283691416e-06, "loss": 0.7357, "step": 17014 }, { "epoch": 0.32, "learning_rate": 3.9694136943269695e-06, "loss": 0.9879, "step": 17015 }, { "epoch": 0.32, "learning_rate": 3.9692900994757784e-06, "loss": 0.9296, "step": 17016 }, { "epoch": 0.32, "learning_rate": 3.9691664991383024e-06, "loss": 0.767, "step": 17017 }, { "epoch": 0.32, "learning_rate": 3.969042893315004e-06, "loss": 1.0061, "step": 17018 }, { "epoch": 0.32, "learning_rate": 3.968919282006346e-06, "loss": 1.0858, "step": 17019 }, { "epoch": 0.32, "learning_rate": 3.968795665212786e-06, "loss": 1.0776, "step": 17020 }, { "epoch": 0.32, "learning_rate": 3.968672042934789e-06, "loss": 1.0469, "step": 17021 }, { "epoch": 0.32, "learning_rate": 3.968548415172816e-06, "loss": 1.0565, "step": 17022 }, { "epoch": 0.32, "learning_rate": 3.968424781927328e-06, "loss": 0.8969, "step": 17023 }, { "epoch": 0.32, "learning_rate": 3.968301143198787e-06, "loss": 1.2087, "step": 17024 }, { "epoch": 0.32, "learning_rate": 3.968177498987654e-06, "loss": 1.0664, "step": 17025 }, { "epoch": 0.32, "learning_rate": 3.968053849294392e-06, "loss": 1.019, "step": 17026 }, { "epoch": 0.32, "learning_rate": 3.967930194119461e-06, "loss": 0.9229, "step": 17027 }, { "epoch": 0.32, "learning_rate": 3.9678065334633256e-06, "loss": 0.8583, "step": 17028 }, { "epoch": 0.32, "learning_rate": 3.967682867326444e-06, "loss": 0.812, "step": 17029 }, { "epoch": 0.32, "learning_rate": 3.967559195709279e-06, "loss": 1.095, "step": 17030 }, { "epoch": 0.32, "learning_rate": 3.9674355186122945e-06, "loss": 1.0412, "step": 17031 }, { "epoch": 0.32, "learning_rate": 3.96731183603595e-06, "loss": 0.9338, "step": 17032 }, { "epoch": 0.32, "learning_rate": 3.9671881479807085e-06, "loss": 0.9793, "step": 17033 }, { "epoch": 0.32, "learning_rate": 3.967064454447031e-06, "loss": 0.9269, "step": 17034 }, { "epoch": 0.32, "learning_rate": 3.96694075543538e-06, "loss": 0.7404, "step": 17035 }, { "epoch": 0.32, "learning_rate": 3.966817050946217e-06, "loss": 0.8431, "step": 17036 }, { "epoch": 0.32, "learning_rate": 3.966693340980005e-06, "loss": 1.0316, "step": 17037 }, { "epoch": 0.32, "learning_rate": 3.966569625537203e-06, "loss": 0.8681, "step": 17038 }, { "epoch": 0.32, "learning_rate": 3.966445904618277e-06, "loss": 0.8703, "step": 17039 }, { "epoch": 0.32, "learning_rate": 3.966322178223686e-06, "loss": 1.1426, "step": 17040 }, { "epoch": 0.32, "learning_rate": 3.966198446353893e-06, "loss": 0.9599, "step": 17041 }, { "epoch": 0.32, "learning_rate": 3.96607470900936e-06, "loss": 0.9075, "step": 17042 }, { "epoch": 0.32, "learning_rate": 3.965950966190549e-06, "loss": 0.9984, "step": 17043 }, { "epoch": 0.32, "learning_rate": 3.965827217897922e-06, "loss": 1.0538, "step": 17044 }, { "epoch": 0.32, "learning_rate": 3.965703464131941e-06, "loss": 0.803, "step": 17045 }, { "epoch": 0.32, "learning_rate": 3.965579704893069e-06, "loss": 0.9053, "step": 17046 }, { "epoch": 0.32, "learning_rate": 3.965455940181768e-06, "loss": 0.8284, "step": 17047 }, { "epoch": 0.32, "learning_rate": 3.965332169998497e-06, "loss": 1.056, "step": 17048 }, { "epoch": 0.32, "learning_rate": 3.965208394343722e-06, "loss": 1.1143, "step": 17049 }, { "epoch": 0.32, "learning_rate": 3.965084613217903e-06, "loss": 0.9701, "step": 17050 }, { "epoch": 0.32, "learning_rate": 3.964960826621504e-06, "loss": 1.0598, "step": 17051 }, { "epoch": 0.32, "learning_rate": 3.964837034554986e-06, "loss": 1.0323, "step": 17052 }, { "epoch": 0.32, "learning_rate": 3.964713237018811e-06, "loss": 0.8507, "step": 17053 }, { "epoch": 0.32, "learning_rate": 3.964589434013441e-06, "loss": 0.9673, "step": 17054 }, { "epoch": 0.32, "learning_rate": 3.964465625539341e-06, "loss": 0.9982, "step": 17055 }, { "epoch": 0.32, "learning_rate": 3.96434181159697e-06, "loss": 0.9433, "step": 17056 }, { "epoch": 0.32, "learning_rate": 3.964217992186791e-06, "loss": 0.818, "step": 17057 }, { "epoch": 0.32, "learning_rate": 3.964094167309268e-06, "loss": 0.9468, "step": 17058 }, { "epoch": 0.32, "learning_rate": 3.963970336964862e-06, "loss": 0.9839, "step": 17059 }, { "epoch": 0.32, "learning_rate": 3.963846501154035e-06, "loss": 0.9731, "step": 17060 }, { "epoch": 0.32, "learning_rate": 3.963722659877251e-06, "loss": 0.8497, "step": 17061 }, { "epoch": 0.32, "learning_rate": 3.963598813134972e-06, "loss": 1.0577, "step": 17062 }, { "epoch": 0.32, "learning_rate": 3.963474960927657e-06, "loss": 0.8182, "step": 17063 }, { "epoch": 0.32, "learning_rate": 3.9633511032557745e-06, "loss": 0.9775, "step": 17064 }, { "epoch": 0.32, "learning_rate": 3.9632272401197825e-06, "loss": 1.012, "step": 17065 }, { "epoch": 0.32, "learning_rate": 3.963103371520144e-06, "loss": 0.8913, "step": 17066 }, { "epoch": 0.32, "learning_rate": 3.962979497457325e-06, "loss": 0.9533, "step": 17067 }, { "epoch": 0.32, "learning_rate": 3.962855617931782e-06, "loss": 1.0046, "step": 17068 }, { "epoch": 0.32, "learning_rate": 3.962731732943983e-06, "loss": 1.0251, "step": 17069 }, { "epoch": 0.32, "learning_rate": 3.962607842494389e-06, "loss": 0.9564, "step": 17070 }, { "epoch": 0.32, "learning_rate": 3.962483946583461e-06, "loss": 1.0675, "step": 17071 }, { "epoch": 0.32, "learning_rate": 3.9623600452116636e-06, "loss": 0.9911, "step": 17072 }, { "epoch": 0.32, "learning_rate": 3.9622361383794584e-06, "loss": 0.8398, "step": 17073 }, { "epoch": 0.32, "learning_rate": 3.962112226087308e-06, "loss": 0.9617, "step": 17074 }, { "epoch": 0.32, "learning_rate": 3.961988308335676e-06, "loss": 1.0239, "step": 17075 }, { "epoch": 0.32, "learning_rate": 3.961864385125023e-06, "loss": 0.8246, "step": 17076 }, { "epoch": 0.32, "learning_rate": 3.961740456455815e-06, "loss": 0.8911, "step": 17077 }, { "epoch": 0.32, "learning_rate": 3.961616522328512e-06, "loss": 1.0055, "step": 17078 }, { "epoch": 0.32, "learning_rate": 3.961492582743578e-06, "loss": 0.9785, "step": 17079 }, { "epoch": 0.32, "learning_rate": 3.961368637701475e-06, "loss": 1.0488, "step": 17080 }, { "epoch": 0.32, "learning_rate": 3.9612446872026665e-06, "loss": 1.1652, "step": 17081 }, { "epoch": 0.32, "learning_rate": 3.961120731247616e-06, "loss": 1.0258, "step": 17082 }, { "epoch": 0.32, "learning_rate": 3.960996769836785e-06, "loss": 0.9568, "step": 17083 }, { "epoch": 0.32, "learning_rate": 3.960872802970637e-06, "loss": 0.9749, "step": 17084 }, { "epoch": 0.32, "learning_rate": 3.960748830649633e-06, "loss": 0.9456, "step": 17085 }, { "epoch": 0.32, "learning_rate": 3.960624852874239e-06, "loss": 0.9603, "step": 17086 }, { "epoch": 0.32, "learning_rate": 3.9605008696449174e-06, "loss": 0.7779, "step": 17087 }, { "epoch": 0.32, "learning_rate": 3.96037688096213e-06, "loss": 0.9361, "step": 17088 }, { "epoch": 0.32, "learning_rate": 3.960252886826339e-06, "loss": 0.9085, "step": 17089 }, { "epoch": 0.32, "learning_rate": 3.960128887238009e-06, "loss": 0.8805, "step": 17090 }, { "epoch": 0.32, "learning_rate": 3.960004882197603e-06, "loss": 0.8711, "step": 17091 }, { "epoch": 0.32, "learning_rate": 3.959880871705583e-06, "loss": 0.8385, "step": 17092 }, { "epoch": 0.32, "learning_rate": 3.959756855762413e-06, "loss": 1.1267, "step": 17093 }, { "epoch": 0.32, "learning_rate": 3.9596328343685555e-06, "loss": 0.995, "step": 17094 }, { "epoch": 0.32, "learning_rate": 3.959508807524474e-06, "loss": 0.8464, "step": 17095 }, { "epoch": 0.32, "learning_rate": 3.959384775230631e-06, "loss": 0.8941, "step": 17096 }, { "epoch": 0.32, "learning_rate": 3.95926073748749e-06, "loss": 0.605, "step": 17097 }, { "epoch": 0.32, "learning_rate": 3.959136694295515e-06, "loss": 0.798, "step": 17098 }, { "epoch": 0.32, "learning_rate": 3.959012645655167e-06, "loss": 0.9661, "step": 17099 }, { "epoch": 0.32, "learning_rate": 3.958888591566911e-06, "loss": 0.9145, "step": 17100 }, { "epoch": 0.32, "learning_rate": 3.9587645320312096e-06, "loss": 0.9611, "step": 17101 }, { "epoch": 0.32, "learning_rate": 3.9586404670485266e-06, "loss": 0.7384, "step": 17102 }, { "epoch": 0.32, "learning_rate": 3.958516396619325e-06, "loss": 0.9964, "step": 17103 }, { "epoch": 0.32, "learning_rate": 3.958392320744067e-06, "loss": 0.8566, "step": 17104 }, { "epoch": 0.32, "learning_rate": 3.958268239423218e-06, "loss": 1.2164, "step": 17105 }, { "epoch": 0.32, "learning_rate": 3.958144152657239e-06, "loss": 0.9672, "step": 17106 }, { "epoch": 0.32, "learning_rate": 3.958020060446594e-06, "loss": 0.8634, "step": 17107 }, { "epoch": 0.32, "learning_rate": 3.957895962791748e-06, "loss": 0.8708, "step": 17108 }, { "epoch": 0.32, "learning_rate": 3.957771859693164e-06, "loss": 0.9306, "step": 17109 }, { "epoch": 0.32, "learning_rate": 3.957647751151302e-06, "loss": 0.8187, "step": 17110 }, { "epoch": 0.32, "learning_rate": 3.957523637166631e-06, "loss": 0.8838, "step": 17111 }, { "epoch": 0.32, "learning_rate": 3.957399517739608e-06, "loss": 1.2466, "step": 17112 }, { "epoch": 0.32, "learning_rate": 3.957275392870702e-06, "loss": 0.7813, "step": 17113 }, { "epoch": 0.32, "learning_rate": 3.9571512625603746e-06, "loss": 0.8856, "step": 17114 }, { "epoch": 0.32, "learning_rate": 3.957027126809088e-06, "loss": 0.8731, "step": 17115 }, { "epoch": 0.32, "learning_rate": 3.956902985617308e-06, "loss": 0.882, "step": 17116 }, { "epoch": 0.32, "learning_rate": 3.956778838985496e-06, "loss": 1.0092, "step": 17117 }, { "epoch": 0.32, "learning_rate": 3.956654686914116e-06, "loss": 0.7254, "step": 17118 }, { "epoch": 0.32, "learning_rate": 3.956530529403633e-06, "loss": 1.0673, "step": 17119 }, { "epoch": 0.32, "learning_rate": 3.95640636645451e-06, "loss": 1.0443, "step": 17120 }, { "epoch": 0.32, "learning_rate": 3.956282198067209e-06, "loss": 0.9836, "step": 17121 }, { "epoch": 0.32, "learning_rate": 3.956158024242196e-06, "loss": 1.112, "step": 17122 }, { "epoch": 0.32, "learning_rate": 3.956033844979933e-06, "loss": 0.762, "step": 17123 }, { "epoch": 0.32, "learning_rate": 3.955909660280884e-06, "loss": 0.9324, "step": 17124 }, { "epoch": 0.32, "learning_rate": 3.955785470145514e-06, "loss": 1.1788, "step": 17125 }, { "epoch": 0.32, "learning_rate": 3.955661274574285e-06, "loss": 0.8657, "step": 17126 }, { "epoch": 0.32, "learning_rate": 3.955537073567662e-06, "loss": 1.0748, "step": 17127 }, { "epoch": 0.32, "learning_rate": 3.955412867126108e-06, "loss": 1.1221, "step": 17128 }, { "epoch": 0.32, "learning_rate": 3.9552886552500866e-06, "loss": 0.9004, "step": 17129 }, { "epoch": 0.32, "learning_rate": 3.955164437940062e-06, "loss": 0.8983, "step": 17130 }, { "epoch": 0.32, "learning_rate": 3.955040215196498e-06, "loss": 1.0036, "step": 17131 }, { "epoch": 0.32, "learning_rate": 3.954915987019858e-06, "loss": 1.0397, "step": 17132 }, { "epoch": 0.32, "learning_rate": 3.9547917534106076e-06, "loss": 0.9306, "step": 17133 }, { "epoch": 0.32, "learning_rate": 3.954667514369208e-06, "loss": 0.8462, "step": 17134 }, { "epoch": 0.32, "learning_rate": 3.9545432698961254e-06, "loss": 0.9619, "step": 17135 }, { "epoch": 0.32, "learning_rate": 3.9544190199918225e-06, "loss": 1.0175, "step": 17136 }, { "epoch": 0.32, "learning_rate": 3.9542947646567636e-06, "loss": 0.9847, "step": 17137 }, { "epoch": 0.32, "learning_rate": 3.954170503891414e-06, "loss": 1.0575, "step": 17138 }, { "epoch": 0.32, "learning_rate": 3.9540462376962345e-06, "loss": 1.0196, "step": 17139 }, { "epoch": 0.32, "learning_rate": 3.953921966071691e-06, "loss": 0.8954, "step": 17140 }, { "epoch": 0.32, "learning_rate": 3.953797689018248e-06, "loss": 0.9046, "step": 17141 }, { "epoch": 0.32, "learning_rate": 3.9536734065363695e-06, "loss": 0.9869, "step": 17142 }, { "epoch": 0.32, "learning_rate": 3.953549118626517e-06, "loss": 0.988, "step": 17143 }, { "epoch": 0.32, "learning_rate": 3.953424825289159e-06, "loss": 1.0241, "step": 17144 }, { "epoch": 0.32, "learning_rate": 3.953300526524757e-06, "loss": 1.0564, "step": 17145 }, { "epoch": 0.32, "learning_rate": 3.953176222333774e-06, "loss": 1.1746, "step": 17146 }, { "epoch": 0.32, "learning_rate": 3.953051912716677e-06, "loss": 0.8742, "step": 17147 }, { "epoch": 0.32, "learning_rate": 3.952927597673928e-06, "loss": 0.9149, "step": 17148 }, { "epoch": 0.32, "learning_rate": 3.952803277205991e-06, "loss": 0.8341, "step": 17149 }, { "epoch": 0.32, "learning_rate": 3.952678951313333e-06, "loss": 1.0366, "step": 17150 }, { "epoch": 0.32, "learning_rate": 3.952554619996415e-06, "loss": 0.9172, "step": 17151 }, { "epoch": 0.32, "learning_rate": 3.952430283255703e-06, "loss": 0.9364, "step": 17152 }, { "epoch": 0.32, "learning_rate": 3.9523059410916605e-06, "loss": 0.9213, "step": 17153 }, { "epoch": 0.32, "learning_rate": 3.9521815935047525e-06, "loss": 0.8558, "step": 17154 }, { "epoch": 0.32, "learning_rate": 3.952057240495443e-06, "loss": 0.9598, "step": 17155 }, { "epoch": 0.32, "learning_rate": 3.9519328820641965e-06, "loss": 1.222, "step": 17156 }, { "epoch": 0.32, "learning_rate": 3.951808518211477e-06, "loss": 0.932, "step": 17157 }, { "epoch": 0.32, "learning_rate": 3.951684148937749e-06, "loss": 1.0472, "step": 17158 }, { "epoch": 0.32, "learning_rate": 3.951559774243477e-06, "loss": 0.7473, "step": 17159 }, { "epoch": 0.32, "learning_rate": 3.9514353941291245e-06, "loss": 0.9288, "step": 17160 }, { "epoch": 0.32, "learning_rate": 3.951311008595157e-06, "loss": 0.8995, "step": 17161 }, { "epoch": 0.32, "learning_rate": 3.9511866176420396e-06, "loss": 1.1191, "step": 17162 }, { "epoch": 0.32, "learning_rate": 3.951062221270235e-06, "loss": 1.0213, "step": 17163 }, { "epoch": 0.32, "learning_rate": 3.950937819480208e-06, "loss": 0.6976, "step": 17164 }, { "epoch": 0.32, "learning_rate": 3.950813412272426e-06, "loss": 0.9738, "step": 17165 }, { "epoch": 0.32, "learning_rate": 3.95068899964735e-06, "loss": 0.8358, "step": 17166 }, { "epoch": 0.32, "learning_rate": 3.950564581605445e-06, "loss": 0.8684, "step": 17167 }, { "epoch": 0.32, "learning_rate": 3.950440158147176e-06, "loss": 1.0395, "step": 17168 }, { "epoch": 0.32, "learning_rate": 3.950315729273009e-06, "loss": 1.0032, "step": 17169 }, { "epoch": 0.32, "learning_rate": 3.950191294983408e-06, "loss": 0.9311, "step": 17170 }, { "epoch": 0.32, "learning_rate": 3.950066855278836e-06, "loss": 0.9481, "step": 17171 }, { "epoch": 0.32, "learning_rate": 3.949942410159759e-06, "loss": 1.1054, "step": 17172 }, { "epoch": 0.32, "learning_rate": 3.949817959626642e-06, "loss": 0.7794, "step": 17173 }, { "epoch": 0.32, "learning_rate": 3.949693503679949e-06, "loss": 1.0703, "step": 17174 }, { "epoch": 0.32, "learning_rate": 3.949569042320144e-06, "loss": 1.0295, "step": 17175 }, { "epoch": 0.32, "learning_rate": 3.949444575547694e-06, "loss": 0.7506, "step": 17176 }, { "epoch": 0.32, "learning_rate": 3.949320103363061e-06, "loss": 0.7975, "step": 17177 }, { "epoch": 0.32, "learning_rate": 3.949195625766713e-06, "loss": 0.9739, "step": 17178 }, { "epoch": 0.32, "learning_rate": 3.9490711427591115e-06, "loss": 1.0292, "step": 17179 }, { "epoch": 0.32, "learning_rate": 3.948946654340724e-06, "loss": 1.0225, "step": 17180 }, { "epoch": 0.32, "learning_rate": 3.948822160512013e-06, "loss": 1.1369, "step": 17181 }, { "epoch": 0.32, "learning_rate": 3.948697661273445e-06, "loss": 0.7625, "step": 17182 }, { "epoch": 0.32, "learning_rate": 3.948573156625484e-06, "loss": 0.9617, "step": 17183 }, { "epoch": 0.32, "learning_rate": 3.948448646568595e-06, "loss": 0.8056, "step": 17184 }, { "epoch": 0.32, "learning_rate": 3.9483241311032435e-06, "loss": 0.8157, "step": 17185 }, { "epoch": 0.32, "learning_rate": 3.948199610229895e-06, "loss": 1.0864, "step": 17186 }, { "epoch": 0.32, "learning_rate": 3.948075083949013e-06, "loss": 1.0256, "step": 17187 }, { "epoch": 0.32, "learning_rate": 3.947950552261063e-06, "loss": 0.9124, "step": 17188 }, { "epoch": 0.32, "learning_rate": 3.9478260151665095e-06, "loss": 0.8885, "step": 17189 }, { "epoch": 0.32, "learning_rate": 3.9477014726658185e-06, "loss": 0.7826, "step": 17190 }, { "epoch": 0.32, "learning_rate": 3.947576924759454e-06, "loss": 0.9694, "step": 17191 }, { "epoch": 0.32, "learning_rate": 3.947452371447883e-06, "loss": 0.6539, "step": 17192 }, { "epoch": 0.32, "learning_rate": 3.947327812731568e-06, "loss": 0.9122, "step": 17193 }, { "epoch": 0.32, "learning_rate": 3.947203248610976e-06, "loss": 1.0874, "step": 17194 }, { "epoch": 0.32, "learning_rate": 3.947078679086571e-06, "loss": 0.9914, "step": 17195 }, { "epoch": 0.32, "learning_rate": 3.946954104158819e-06, "loss": 1.0276, "step": 17196 }, { "epoch": 0.32, "learning_rate": 3.946829523828184e-06, "loss": 1.0096, "step": 17197 }, { "epoch": 0.32, "learning_rate": 3.9467049380951326e-06, "loss": 0.8458, "step": 17198 }, { "epoch": 0.32, "learning_rate": 3.946580346960129e-06, "loss": 1.0547, "step": 17199 }, { "epoch": 0.32, "learning_rate": 3.946455750423639e-06, "loss": 1.0115, "step": 17200 }, { "epoch": 0.32, "learning_rate": 3.946331148486127e-06, "loss": 0.8584, "step": 17201 }, { "epoch": 0.32, "learning_rate": 3.946206541148059e-06, "loss": 0.7892, "step": 17202 }, { "epoch": 0.32, "learning_rate": 3.9460819284099e-06, "loss": 1.1031, "step": 17203 }, { "epoch": 0.32, "learning_rate": 3.9459573102721165e-06, "loss": 0.819, "step": 17204 }, { "epoch": 0.32, "learning_rate": 3.945832686735172e-06, "loss": 0.9256, "step": 17205 }, { "epoch": 0.32, "learning_rate": 3.945708057799533e-06, "loss": 0.9835, "step": 17206 }, { "epoch": 0.32, "learning_rate": 3.945583423465664e-06, "loss": 1.017, "step": 17207 }, { "epoch": 0.32, "learning_rate": 3.945458783734031e-06, "loss": 0.8806, "step": 17208 }, { "epoch": 0.32, "learning_rate": 3.9453341386050984e-06, "loss": 0.9802, "step": 17209 }, { "epoch": 0.32, "learning_rate": 3.945209488079334e-06, "loss": 0.8507, "step": 17210 }, { "epoch": 0.32, "learning_rate": 3.9450848321572e-06, "loss": 1.0776, "step": 17211 }, { "epoch": 0.32, "learning_rate": 3.944960170839165e-06, "loss": 1.0848, "step": 17212 }, { "epoch": 0.32, "learning_rate": 3.944835504125692e-06, "loss": 1.0687, "step": 17213 }, { "epoch": 0.32, "learning_rate": 3.944710832017248e-06, "loss": 0.802, "step": 17214 }, { "epoch": 0.32, "learning_rate": 3.944586154514298e-06, "loss": 0.8811, "step": 17215 }, { "epoch": 0.32, "learning_rate": 3.944461471617307e-06, "loss": 0.7953, "step": 17216 }, { "epoch": 0.32, "learning_rate": 3.944336783326742e-06, "loss": 0.9273, "step": 17217 }, { "epoch": 0.32, "learning_rate": 3.944212089643068e-06, "loss": 0.9031, "step": 17218 }, { "epoch": 0.32, "learning_rate": 3.944087390566748e-06, "loss": 0.8471, "step": 17219 }, { "epoch": 0.32, "learning_rate": 3.943962686098253e-06, "loss": 0.9808, "step": 17220 }, { "epoch": 0.32, "learning_rate": 3.943837976238044e-06, "loss": 0.872, "step": 17221 }, { "epoch": 0.32, "learning_rate": 3.9437132609865895e-06, "loss": 0.9674, "step": 17222 }, { "epoch": 0.32, "learning_rate": 3.943588540344352e-06, "loss": 0.9693, "step": 17223 }, { "epoch": 0.32, "learning_rate": 3.943463814311801e-06, "loss": 1.1247, "step": 17224 }, { "epoch": 0.32, "learning_rate": 3.943339082889399e-06, "loss": 1.3909, "step": 17225 }, { "epoch": 0.33, "learning_rate": 3.9432143460776136e-06, "loss": 0.7187, "step": 17226 }, { "epoch": 0.33, "learning_rate": 3.94308960387691e-06, "loss": 0.9819, "step": 17227 }, { "epoch": 0.33, "learning_rate": 3.942964856287755e-06, "loss": 0.9046, "step": 17228 }, { "epoch": 0.33, "learning_rate": 3.942840103310612e-06, "loss": 0.9037, "step": 17229 }, { "epoch": 0.33, "learning_rate": 3.94271534494595e-06, "loss": 1.0349, "step": 17230 }, { "epoch": 0.33, "learning_rate": 3.942590581194231e-06, "loss": 1.0947, "step": 17231 }, { "epoch": 0.33, "learning_rate": 3.9424658120559245e-06, "loss": 0.9196, "step": 17232 }, { "epoch": 0.33, "learning_rate": 3.9423410375314946e-06, "loss": 0.8628, "step": 17233 }, { "epoch": 0.33, "learning_rate": 3.942216257621407e-06, "loss": 0.8632, "step": 17234 }, { "epoch": 0.33, "learning_rate": 3.942091472326128e-06, "loss": 0.7354, "step": 17235 }, { "epoch": 0.33, "learning_rate": 3.941966681646125e-06, "loss": 0.9906, "step": 17236 }, { "epoch": 0.33, "learning_rate": 3.941841885581862e-06, "loss": 1.1498, "step": 17237 }, { "epoch": 0.33, "learning_rate": 3.9417170841338045e-06, "loss": 1.0118, "step": 17238 }, { "epoch": 0.33, "learning_rate": 3.941592277302422e-06, "loss": 0.7946, "step": 17239 }, { "epoch": 0.33, "learning_rate": 3.941467465088176e-06, "loss": 0.7148, "step": 17240 }, { "epoch": 0.33, "learning_rate": 3.941342647491535e-06, "loss": 1.0273, "step": 17241 }, { "epoch": 0.33, "learning_rate": 3.941217824512965e-06, "loss": 0.8947, "step": 17242 }, { "epoch": 0.33, "learning_rate": 3.941092996152932e-06, "loss": 1.0636, "step": 17243 }, { "epoch": 0.33, "learning_rate": 3.9409681624119015e-06, "loss": 1.2233, "step": 17244 }, { "epoch": 0.33, "learning_rate": 3.940843323290341e-06, "loss": 0.8288, "step": 17245 }, { "epoch": 0.33, "learning_rate": 3.940718478788715e-06, "loss": 1.01, "step": 17246 }, { "epoch": 0.33, "learning_rate": 3.940593628907491e-06, "loss": 0.8935, "step": 17247 }, { "epoch": 0.33, "learning_rate": 3.940468773647134e-06, "loss": 0.7736, "step": 17248 }, { "epoch": 0.33, "learning_rate": 3.940343913008111e-06, "loss": 0.9924, "step": 17249 }, { "epoch": 0.33, "learning_rate": 3.940219046990888e-06, "loss": 1.1051, "step": 17250 }, { "epoch": 0.33, "learning_rate": 3.94009417559593e-06, "loss": 0.9331, "step": 17251 }, { "epoch": 0.33, "learning_rate": 3.939969298823706e-06, "loss": 0.6838, "step": 17252 }, { "epoch": 0.33, "learning_rate": 3.9398444166746805e-06, "loss": 0.957, "step": 17253 }, { "epoch": 0.33, "learning_rate": 3.93971952914932e-06, "loss": 0.8635, "step": 17254 }, { "epoch": 0.33, "learning_rate": 3.939594636248091e-06, "loss": 0.8563, "step": 17255 }, { "epoch": 0.33, "learning_rate": 3.939469737971459e-06, "loss": 1.0645, "step": 17256 }, { "epoch": 0.33, "learning_rate": 3.939344834319892e-06, "loss": 0.8416, "step": 17257 }, { "epoch": 0.33, "learning_rate": 3.939219925293855e-06, "loss": 0.9493, "step": 17258 }, { "epoch": 0.33, "learning_rate": 3.939095010893815e-06, "loss": 1.0944, "step": 17259 }, { "epoch": 0.33, "learning_rate": 3.938970091120239e-06, "loss": 0.8267, "step": 17260 }, { "epoch": 0.33, "learning_rate": 3.938845165973592e-06, "loss": 1.1488, "step": 17261 }, { "epoch": 0.33, "learning_rate": 3.938720235454342e-06, "loss": 0.9827, "step": 17262 }, { "epoch": 0.33, "learning_rate": 3.938595299562955e-06, "loss": 1.0226, "step": 17263 }, { "epoch": 0.33, "learning_rate": 3.938470358299896e-06, "loss": 1.0269, "step": 17264 }, { "epoch": 0.33, "learning_rate": 3.938345411665633e-06, "loss": 0.864, "step": 17265 }, { "epoch": 0.33, "learning_rate": 3.938220459660634e-06, "loss": 0.9709, "step": 17266 }, { "epoch": 0.33, "learning_rate": 3.938095502285362e-06, "loss": 0.8209, "step": 17267 }, { "epoch": 0.33, "learning_rate": 3.937970539540285e-06, "loss": 0.9225, "step": 17268 }, { "epoch": 0.33, "learning_rate": 3.937845571425872e-06, "loss": 1.1362, "step": 17269 }, { "epoch": 0.33, "learning_rate": 3.937720597942587e-06, "loss": 0.9686, "step": 17270 }, { "epoch": 0.33, "learning_rate": 3.937595619090897e-06, "loss": 1.0053, "step": 17271 }, { "epoch": 0.33, "learning_rate": 3.93747063487127e-06, "loss": 1.0453, "step": 17272 }, { "epoch": 0.33, "learning_rate": 3.937345645284171e-06, "loss": 0.8541, "step": 17273 }, { "epoch": 0.33, "learning_rate": 3.937220650330067e-06, "loss": 0.9072, "step": 17274 }, { "epoch": 0.33, "learning_rate": 3.937095650009426e-06, "loss": 1.1707, "step": 17275 }, { "epoch": 0.33, "learning_rate": 3.936970644322713e-06, "loss": 0.891, "step": 17276 }, { "epoch": 0.33, "learning_rate": 3.936845633270397e-06, "loss": 1.0016, "step": 17277 }, { "epoch": 0.33, "learning_rate": 3.936720616852943e-06, "loss": 1.0822, "step": 17278 }, { "epoch": 0.33, "learning_rate": 3.936595595070817e-06, "loss": 0.859, "step": 17279 }, { "epoch": 0.33, "learning_rate": 3.936470567924488e-06, "loss": 1.0982, "step": 17280 }, { "epoch": 0.33, "learning_rate": 3.936345535414423e-06, "loss": 1.2092, "step": 17281 }, { "epoch": 0.33, "learning_rate": 3.936220497541087e-06, "loss": 0.9779, "step": 17282 }, { "epoch": 0.33, "learning_rate": 3.936095454304946e-06, "loss": 0.8715, "step": 17283 }, { "epoch": 0.33, "learning_rate": 3.935970405706471e-06, "loss": 0.859, "step": 17284 }, { "epoch": 0.33, "learning_rate": 3.935845351746126e-06, "loss": 0.8962, "step": 17285 }, { "epoch": 0.33, "learning_rate": 3.935720292424378e-06, "loss": 0.9525, "step": 17286 }, { "epoch": 0.33, "learning_rate": 3.935595227741694e-06, "loss": 1.0008, "step": 17287 }, { "epoch": 0.33, "learning_rate": 3.935470157698543e-06, "loss": 0.882, "step": 17288 }, { "epoch": 0.33, "learning_rate": 3.9353450822953884e-06, "loss": 0.7804, "step": 17289 }, { "epoch": 0.33, "learning_rate": 3.935220001532702e-06, "loss": 1.0605, "step": 17290 }, { "epoch": 0.33, "learning_rate": 3.935094915410945e-06, "loss": 0.873, "step": 17291 }, { "epoch": 0.33, "learning_rate": 3.934969823930589e-06, "loss": 0.9368, "step": 17292 }, { "epoch": 0.33, "learning_rate": 3.934844727092101e-06, "loss": 1.0734, "step": 17293 }, { "epoch": 0.33, "learning_rate": 3.934719624895945e-06, "loss": 1.1048, "step": 17294 }, { "epoch": 0.33, "learning_rate": 3.93459451734259e-06, "loss": 0.968, "step": 17295 }, { "epoch": 0.33, "learning_rate": 3.934469404432504e-06, "loss": 0.8803, "step": 17296 }, { "epoch": 0.33, "learning_rate": 3.934344286166152e-06, "loss": 0.8309, "step": 17297 }, { "epoch": 0.33, "learning_rate": 3.934219162544003e-06, "loss": 0.8782, "step": 17298 }, { "epoch": 0.33, "learning_rate": 3.934094033566524e-06, "loss": 1.068, "step": 17299 }, { "epoch": 0.33, "learning_rate": 3.933968899234182e-06, "loss": 0.8722, "step": 17300 }, { "epoch": 0.33, "learning_rate": 3.933843759547443e-06, "loss": 0.847, "step": 17301 }, { "epoch": 0.33, "learning_rate": 3.9337186145067765e-06, "loss": 0.9047, "step": 17302 }, { "epoch": 0.33, "learning_rate": 3.9335934641126485e-06, "loss": 0.924, "step": 17303 }, { "epoch": 0.33, "learning_rate": 3.9334683083655256e-06, "loss": 0.8473, "step": 17304 }, { "epoch": 0.33, "learning_rate": 3.933343147265877e-06, "loss": 0.9435, "step": 17305 }, { "epoch": 0.33, "learning_rate": 3.9332179808141675e-06, "loss": 0.8834, "step": 17306 }, { "epoch": 0.33, "learning_rate": 3.933092809010868e-06, "loss": 1.1089, "step": 17307 }, { "epoch": 0.33, "learning_rate": 3.932967631856443e-06, "loss": 0.7866, "step": 17308 }, { "epoch": 0.33, "learning_rate": 3.93284244935136e-06, "loss": 0.9951, "step": 17309 }, { "epoch": 0.33, "learning_rate": 3.932717261496089e-06, "loss": 1.0975, "step": 17310 }, { "epoch": 0.33, "learning_rate": 3.932592068291095e-06, "loss": 0.6893, "step": 17311 }, { "epoch": 0.33, "learning_rate": 3.932466869736845e-06, "loss": 1.1209, "step": 17312 }, { "epoch": 0.33, "learning_rate": 3.9323416658338085e-06, "loss": 0.7959, "step": 17313 }, { "epoch": 0.33, "learning_rate": 3.932216456582452e-06, "loss": 0.9307, "step": 17314 }, { "epoch": 0.33, "learning_rate": 3.932091241983243e-06, "loss": 0.8591, "step": 17315 }, { "epoch": 0.33, "learning_rate": 3.93196602203665e-06, "loss": 0.7499, "step": 17316 }, { "epoch": 0.33, "learning_rate": 3.93184079674314e-06, "loss": 1.0131, "step": 17317 }, { "epoch": 0.33, "learning_rate": 3.931715566103179e-06, "loss": 1.0825, "step": 17318 }, { "epoch": 0.33, "learning_rate": 3.931590330117236e-06, "loss": 0.9506, "step": 17319 }, { "epoch": 0.33, "learning_rate": 3.93146508878578e-06, "loss": 0.8473, "step": 17320 }, { "epoch": 0.33, "learning_rate": 3.931339842109276e-06, "loss": 0.8427, "step": 17321 }, { "epoch": 0.33, "learning_rate": 3.9312145900881934e-06, "loss": 1.0355, "step": 17322 }, { "epoch": 0.33, "learning_rate": 3.9310893327229996e-06, "loss": 0.9588, "step": 17323 }, { "epoch": 0.33, "learning_rate": 3.930964070014161e-06, "loss": 0.711, "step": 17324 }, { "epoch": 0.33, "learning_rate": 3.930838801962148e-06, "loss": 1.1407, "step": 17325 }, { "epoch": 0.33, "learning_rate": 3.930713528567426e-06, "loss": 1.1089, "step": 17326 }, { "epoch": 0.33, "learning_rate": 3.9305882498304634e-06, "loss": 1.1091, "step": 17327 }, { "epoch": 0.33, "learning_rate": 3.930462965751728e-06, "loss": 0.8864, "step": 17328 }, { "epoch": 0.33, "learning_rate": 3.930337676331688e-06, "loss": 1.0106, "step": 17329 }, { "epoch": 0.33, "learning_rate": 3.930212381570811e-06, "loss": 1.1761, "step": 17330 }, { "epoch": 0.33, "learning_rate": 3.930087081469566e-06, "loss": 1.0403, "step": 17331 }, { "epoch": 0.33, "learning_rate": 3.929961776028418e-06, "loss": 0.9601, "step": 17332 }, { "epoch": 0.33, "learning_rate": 3.929836465247837e-06, "loss": 0.9871, "step": 17333 }, { "epoch": 0.33, "learning_rate": 3.929711149128291e-06, "loss": 1.0137, "step": 17334 }, { "epoch": 0.33, "learning_rate": 3.929585827670247e-06, "loss": 0.8619, "step": 17335 }, { "epoch": 0.33, "learning_rate": 3.929460500874172e-06, "loss": 1.0817, "step": 17336 }, { "epoch": 0.33, "learning_rate": 3.9293351687405375e-06, "loss": 1.0009, "step": 17337 }, { "epoch": 0.33, "learning_rate": 3.929209831269809e-06, "loss": 1.0008, "step": 17338 }, { "epoch": 0.33, "learning_rate": 3.929084488462454e-06, "loss": 1.039, "step": 17339 }, { "epoch": 0.33, "learning_rate": 3.928959140318942e-06, "loss": 0.9026, "step": 17340 }, { "epoch": 0.33, "learning_rate": 3.92883378683974e-06, "loss": 0.7979, "step": 17341 }, { "epoch": 0.33, "learning_rate": 3.928708428025316e-06, "loss": 1.0757, "step": 17342 }, { "epoch": 0.33, "learning_rate": 3.92858306387614e-06, "loss": 1.0862, "step": 17343 }, { "epoch": 0.33, "learning_rate": 3.9284576943926775e-06, "loss": 0.9614, "step": 17344 }, { "epoch": 0.33, "learning_rate": 3.928332319575397e-06, "loss": 0.9815, "step": 17345 }, { "epoch": 0.33, "learning_rate": 3.928206939424769e-06, "loss": 0.9106, "step": 17346 }, { "epoch": 0.33, "learning_rate": 3.9280815539412595e-06, "loss": 0.8819, "step": 17347 }, { "epoch": 0.33, "learning_rate": 3.927956163125337e-06, "loss": 0.9053, "step": 17348 }, { "epoch": 0.33, "learning_rate": 3.92783076697747e-06, "loss": 1.0391, "step": 17349 }, { "epoch": 0.33, "learning_rate": 3.927705365498127e-06, "loss": 1.1249, "step": 17350 }, { "epoch": 0.33, "learning_rate": 3.927579958687775e-06, "loss": 0.9801, "step": 17351 }, { "epoch": 0.33, "learning_rate": 3.927454546546885e-06, "loss": 0.74, "step": 17352 }, { "epoch": 0.33, "learning_rate": 3.927329129075922e-06, "loss": 0.9323, "step": 17353 }, { "epoch": 0.33, "learning_rate": 3.927203706275357e-06, "loss": 0.9696, "step": 17354 }, { "epoch": 0.33, "learning_rate": 3.927078278145656e-06, "loss": 0.9731, "step": 17355 }, { "epoch": 0.33, "learning_rate": 3.926952844687289e-06, "loss": 1.0615, "step": 17356 }, { "epoch": 0.33, "learning_rate": 3.9268274059007234e-06, "loss": 1.0026, "step": 17357 }, { "epoch": 0.33, "learning_rate": 3.9267019617864284e-06, "loss": 1.0188, "step": 17358 }, { "epoch": 0.33, "learning_rate": 3.926576512344872e-06, "loss": 0.8896, "step": 17359 }, { "epoch": 0.33, "learning_rate": 3.926451057576522e-06, "loss": 0.8702, "step": 17360 }, { "epoch": 0.33, "learning_rate": 3.926325597481848e-06, "loss": 0.742, "step": 17361 }, { "epoch": 0.33, "learning_rate": 3.926200132061318e-06, "loss": 1.006, "step": 17362 }, { "epoch": 0.33, "learning_rate": 3.9260746613154e-06, "loss": 1.1523, "step": 17363 }, { "epoch": 0.33, "learning_rate": 3.925949185244564e-06, "loss": 0.9204, "step": 17364 }, { "epoch": 0.33, "learning_rate": 3.925823703849277e-06, "loss": 0.8956, "step": 17365 }, { "epoch": 0.33, "learning_rate": 3.925698217130007e-06, "loss": 0.7699, "step": 17366 }, { "epoch": 0.33, "learning_rate": 3.925572725087225e-06, "loss": 0.8277, "step": 17367 }, { "epoch": 0.33, "learning_rate": 3.925447227721398e-06, "loss": 0.9604, "step": 17368 }, { "epoch": 0.33, "learning_rate": 3.925321725032994e-06, "loss": 0.9809, "step": 17369 }, { "epoch": 0.33, "learning_rate": 3.925196217022483e-06, "loss": 0.9297, "step": 17370 }, { "epoch": 0.33, "learning_rate": 3.925070703690333e-06, "loss": 0.9031, "step": 17371 }, { "epoch": 0.33, "learning_rate": 3.924945185037012e-06, "loss": 0.8445, "step": 17372 }, { "epoch": 0.33, "learning_rate": 3.92481966106299e-06, "loss": 0.8475, "step": 17373 }, { "epoch": 0.33, "learning_rate": 3.924694131768735e-06, "loss": 0.9647, "step": 17374 }, { "epoch": 0.33, "learning_rate": 3.924568597154716e-06, "loss": 1.2187, "step": 17375 }, { "epoch": 0.33, "learning_rate": 3.924443057221401e-06, "loss": 0.9391, "step": 17376 }, { "epoch": 0.33, "learning_rate": 3.924317511969259e-06, "loss": 0.9724, "step": 17377 }, { "epoch": 0.33, "learning_rate": 3.92419196139876e-06, "loss": 0.8203, "step": 17378 }, { "epoch": 0.33, "learning_rate": 3.924066405510371e-06, "loss": 0.921, "step": 17379 }, { "epoch": 0.33, "learning_rate": 3.923940844304563e-06, "loss": 0.972, "step": 17380 }, { "epoch": 0.33, "learning_rate": 3.923815277781802e-06, "loss": 0.9708, "step": 17381 }, { "epoch": 0.33, "learning_rate": 3.923689705942558e-06, "loss": 0.9675, "step": 17382 }, { "epoch": 0.33, "learning_rate": 3.923564128787302e-06, "loss": 0.8824, "step": 17383 }, { "epoch": 0.33, "learning_rate": 3.9234385463165e-06, "loss": 1.0894, "step": 17384 }, { "epoch": 0.33, "learning_rate": 3.923312958530624e-06, "loss": 1.0023, "step": 17385 }, { "epoch": 0.33, "learning_rate": 3.923187365430139e-06, "loss": 0.8029, "step": 17386 }, { "epoch": 0.33, "learning_rate": 3.923061767015517e-06, "loss": 0.9425, "step": 17387 }, { "epoch": 0.33, "learning_rate": 3.922936163287226e-06, "loss": 0.9675, "step": 17388 }, { "epoch": 0.33, "learning_rate": 3.922810554245734e-06, "loss": 0.7281, "step": 17389 }, { "epoch": 0.33, "learning_rate": 3.922684939891513e-06, "loss": 1.0798, "step": 17390 }, { "epoch": 0.33, "learning_rate": 3.922559320225028e-06, "loss": 0.9233, "step": 17391 }, { "epoch": 0.33, "learning_rate": 3.9224336952467516e-06, "loss": 0.7968, "step": 17392 }, { "epoch": 0.33, "learning_rate": 3.92230806495715e-06, "loss": 1.2145, "step": 17393 }, { "epoch": 0.33, "learning_rate": 3.922182429356695e-06, "loss": 1.3778, "step": 17394 }, { "epoch": 0.33, "learning_rate": 3.922056788445854e-06, "loss": 1.01, "step": 17395 }, { "epoch": 0.33, "learning_rate": 3.921931142225096e-06, "loss": 0.8304, "step": 17396 }, { "epoch": 0.33, "learning_rate": 3.921805490694891e-06, "loss": 0.9481, "step": 17397 }, { "epoch": 0.33, "learning_rate": 3.921679833855708e-06, "loss": 0.8926, "step": 17398 }, { "epoch": 0.33, "learning_rate": 3.921554171708016e-06, "loss": 1.0814, "step": 17399 }, { "epoch": 0.33, "learning_rate": 3.921428504252285e-06, "loss": 1.1561, "step": 17400 }, { "epoch": 0.33, "learning_rate": 3.921302831488983e-06, "loss": 1.0428, "step": 17401 }, { "epoch": 0.33, "learning_rate": 3.9211771534185785e-06, "loss": 0.8321, "step": 17402 }, { "epoch": 0.33, "learning_rate": 3.9210514700415435e-06, "loss": 0.8851, "step": 17403 }, { "epoch": 0.33, "learning_rate": 3.920925781358346e-06, "loss": 0.6765, "step": 17404 }, { "epoch": 0.33, "learning_rate": 3.920800087369455e-06, "loss": 0.8666, "step": 17405 }, { "epoch": 0.33, "learning_rate": 3.9206743880753405e-06, "loss": 0.9525, "step": 17406 }, { "epoch": 0.33, "learning_rate": 3.920548683476471e-06, "loss": 1.0488, "step": 17407 }, { "epoch": 0.33, "learning_rate": 3.920422973573315e-06, "loss": 0.8394, "step": 17408 }, { "epoch": 0.33, "learning_rate": 3.920297258366345e-06, "loss": 0.8635, "step": 17409 }, { "epoch": 0.33, "learning_rate": 3.920171537856028e-06, "loss": 0.9603, "step": 17410 }, { "epoch": 0.33, "learning_rate": 3.920045812042833e-06, "loss": 0.965, "step": 17411 }, { "epoch": 0.33, "learning_rate": 3.919920080927232e-06, "loss": 0.9335, "step": 17412 }, { "epoch": 0.33, "learning_rate": 3.919794344509692e-06, "loss": 0.9716, "step": 17413 }, { "epoch": 0.33, "learning_rate": 3.919668602790684e-06, "loss": 0.8355, "step": 17414 }, { "epoch": 0.33, "learning_rate": 3.919542855770677e-06, "loss": 0.9509, "step": 17415 }, { "epoch": 0.33, "learning_rate": 3.9194171034501396e-06, "loss": 1.0151, "step": 17416 }, { "epoch": 0.33, "learning_rate": 3.9192913458295436e-06, "loss": 0.9842, "step": 17417 }, { "epoch": 0.33, "learning_rate": 3.919165582909356e-06, "loss": 1.1154, "step": 17418 }, { "epoch": 0.33, "learning_rate": 3.919039814690048e-06, "loss": 1.0557, "step": 17419 }, { "epoch": 0.33, "learning_rate": 3.9189140411720894e-06, "loss": 0.8386, "step": 17420 }, { "epoch": 0.33, "learning_rate": 3.918788262355948e-06, "loss": 0.7253, "step": 17421 }, { "epoch": 0.33, "learning_rate": 3.918662478242096e-06, "loss": 1.1487, "step": 17422 }, { "epoch": 0.33, "learning_rate": 3.918536688831002e-06, "loss": 0.8544, "step": 17423 }, { "epoch": 0.33, "learning_rate": 3.918410894123134e-06, "loss": 0.9606, "step": 17424 }, { "epoch": 0.33, "learning_rate": 3.918285094118965e-06, "loss": 0.9861, "step": 17425 }, { "epoch": 0.33, "learning_rate": 3.918159288818962e-06, "loss": 0.6381, "step": 17426 }, { "epoch": 0.33, "learning_rate": 3.918033478223596e-06, "loss": 0.9014, "step": 17427 }, { "epoch": 0.33, "learning_rate": 3.917907662333336e-06, "loss": 1.0145, "step": 17428 }, { "epoch": 0.33, "learning_rate": 3.917781841148652e-06, "loss": 0.7744, "step": 17429 }, { "epoch": 0.33, "learning_rate": 3.917656014670015e-06, "loss": 1.1931, "step": 17430 }, { "epoch": 0.33, "learning_rate": 3.917530182897893e-06, "loss": 1.1857, "step": 17431 }, { "epoch": 0.33, "learning_rate": 3.917404345832758e-06, "loss": 0.6917, "step": 17432 }, { "epoch": 0.33, "learning_rate": 3.917278503475077e-06, "loss": 0.9573, "step": 17433 }, { "epoch": 0.33, "learning_rate": 3.917152655825323e-06, "loss": 0.9988, "step": 17434 }, { "epoch": 0.33, "learning_rate": 3.917026802883964e-06, "loss": 0.9645, "step": 17435 }, { "epoch": 0.33, "learning_rate": 3.91690094465147e-06, "loss": 1.0454, "step": 17436 }, { "epoch": 0.33, "learning_rate": 3.916775081128311e-06, "loss": 0.9853, "step": 17437 }, { "epoch": 0.33, "learning_rate": 3.916649212314958e-06, "loss": 0.9377, "step": 17438 }, { "epoch": 0.33, "learning_rate": 3.91652333821188e-06, "loss": 1.0096, "step": 17439 }, { "epoch": 0.33, "learning_rate": 3.916397458819548e-06, "loss": 0.9719, "step": 17440 }, { "epoch": 0.33, "learning_rate": 3.91627157413843e-06, "loss": 0.8507, "step": 17441 }, { "epoch": 0.33, "learning_rate": 3.916145684168998e-06, "loss": 0.8845, "step": 17442 }, { "epoch": 0.33, "learning_rate": 3.916019788911721e-06, "loss": 1.0977, "step": 17443 }, { "epoch": 0.33, "learning_rate": 3.91589388836707e-06, "loss": 1.1291, "step": 17444 }, { "epoch": 0.33, "learning_rate": 3.9157679825355145e-06, "loss": 0.8597, "step": 17445 }, { "epoch": 0.33, "learning_rate": 3.915642071417525e-06, "loss": 0.8671, "step": 17446 }, { "epoch": 0.33, "learning_rate": 3.9155161550135715e-06, "loss": 0.8546, "step": 17447 }, { "epoch": 0.33, "learning_rate": 3.915390233324124e-06, "loss": 1.0115, "step": 17448 }, { "epoch": 0.33, "learning_rate": 3.915264306349652e-06, "loss": 1.2163, "step": 17449 }, { "epoch": 0.33, "learning_rate": 3.915138374090628e-06, "loss": 1.0499, "step": 17450 }, { "epoch": 0.33, "learning_rate": 3.915012436547519e-06, "loss": 0.8726, "step": 17451 }, { "epoch": 0.33, "learning_rate": 3.914886493720798e-06, "loss": 0.7817, "step": 17452 }, { "epoch": 0.33, "learning_rate": 3.914760545610934e-06, "loss": 1.0471, "step": 17453 }, { "epoch": 0.33, "learning_rate": 3.914634592218398e-06, "loss": 0.8605, "step": 17454 }, { "epoch": 0.33, "learning_rate": 3.914508633543659e-06, "loss": 1.0324, "step": 17455 }, { "epoch": 0.33, "learning_rate": 3.9143826695871885e-06, "loss": 1.2353, "step": 17456 }, { "epoch": 0.33, "learning_rate": 3.914256700349456e-06, "loss": 1.1699, "step": 17457 }, { "epoch": 0.33, "learning_rate": 3.9141307258309324e-06, "loss": 0.8655, "step": 17458 }, { "epoch": 0.33, "learning_rate": 3.914004746032088e-06, "loss": 0.8988, "step": 17459 }, { "epoch": 0.33, "learning_rate": 3.913878760953395e-06, "loss": 0.9476, "step": 17460 }, { "epoch": 0.33, "learning_rate": 3.91375277059532e-06, "loss": 0.9439, "step": 17461 }, { "epoch": 0.33, "learning_rate": 3.9136267749583365e-06, "loss": 1.0569, "step": 17462 }, { "epoch": 0.33, "learning_rate": 3.913500774042914e-06, "loss": 0.9387, "step": 17463 }, { "epoch": 0.33, "learning_rate": 3.913374767849522e-06, "loss": 0.9684, "step": 17464 }, { "epoch": 0.33, "learning_rate": 3.9132487563786325e-06, "loss": 0.9427, "step": 17465 }, { "epoch": 0.33, "learning_rate": 3.913122739630715e-06, "loss": 1.0716, "step": 17466 }, { "epoch": 0.33, "learning_rate": 3.912996717606241e-06, "loss": 0.8748, "step": 17467 }, { "epoch": 0.33, "learning_rate": 3.912870690305681e-06, "loss": 0.9236, "step": 17468 }, { "epoch": 0.33, "learning_rate": 3.912744657729505e-06, "loss": 1.0482, "step": 17469 }, { "epoch": 0.33, "learning_rate": 3.912618619878183e-06, "loss": 0.9901, "step": 17470 }, { "epoch": 0.33, "learning_rate": 3.912492576752187e-06, "loss": 0.8227, "step": 17471 }, { "epoch": 0.33, "learning_rate": 3.912366528351987e-06, "loss": 0.7718, "step": 17472 }, { "epoch": 0.33, "learning_rate": 3.912240474678054e-06, "loss": 0.8979, "step": 17473 }, { "epoch": 0.33, "learning_rate": 3.912114415730858e-06, "loss": 1.0347, "step": 17474 }, { "epoch": 0.33, "learning_rate": 3.911988351510869e-06, "loss": 1.237, "step": 17475 }, { "epoch": 0.33, "learning_rate": 3.91186228201856e-06, "loss": 0.9575, "step": 17476 }, { "epoch": 0.33, "learning_rate": 3.9117362072544e-06, "loss": 0.8391, "step": 17477 }, { "epoch": 0.33, "learning_rate": 3.911610127218861e-06, "loss": 0.8223, "step": 17478 }, { "epoch": 0.33, "learning_rate": 3.911484041912413e-06, "loss": 0.9272, "step": 17479 }, { "epoch": 0.33, "learning_rate": 3.911357951335527e-06, "loss": 0.7464, "step": 17480 }, { "epoch": 0.33, "learning_rate": 3.911231855488673e-06, "loss": 0.698, "step": 17481 }, { "epoch": 0.33, "learning_rate": 3.911105754372323e-06, "loss": 0.9294, "step": 17482 }, { "epoch": 0.33, "learning_rate": 3.9109796479869466e-06, "loss": 0.8862, "step": 17483 }, { "epoch": 0.33, "learning_rate": 3.910853536333016e-06, "loss": 0.9755, "step": 17484 }, { "epoch": 0.33, "learning_rate": 3.910727419411001e-06, "loss": 1.1091, "step": 17485 }, { "epoch": 0.33, "learning_rate": 3.910601297221375e-06, "loss": 0.9427, "step": 17486 }, { "epoch": 0.33, "learning_rate": 3.910475169764605e-06, "loss": 0.8583, "step": 17487 }, { "epoch": 0.33, "learning_rate": 3.9103490370411645e-06, "loss": 1.0186, "step": 17488 }, { "epoch": 0.33, "learning_rate": 3.910222899051525e-06, "loss": 0.9308, "step": 17489 }, { "epoch": 0.33, "learning_rate": 3.9100967557961545e-06, "loss": 0.8246, "step": 17490 }, { "epoch": 0.33, "learning_rate": 3.909970607275527e-06, "loss": 0.6796, "step": 17491 }, { "epoch": 0.33, "learning_rate": 3.909844453490112e-06, "loss": 0.8121, "step": 17492 }, { "epoch": 0.33, "learning_rate": 3.909718294440382e-06, "loss": 0.8571, "step": 17493 }, { "epoch": 0.33, "learning_rate": 3.909592130126807e-06, "loss": 0.8561, "step": 17494 }, { "epoch": 0.33, "learning_rate": 3.909465960549857e-06, "loss": 0.8542, "step": 17495 }, { "epoch": 0.33, "learning_rate": 3.909339785710005e-06, "loss": 0.9212, "step": 17496 }, { "epoch": 0.33, "learning_rate": 3.9092136056077215e-06, "loss": 0.778, "step": 17497 }, { "epoch": 0.33, "learning_rate": 3.909087420243478e-06, "loss": 0.6478, "step": 17498 }, { "epoch": 0.33, "learning_rate": 3.9089612296177446e-06, "loss": 0.9354, "step": 17499 }, { "epoch": 0.33, "learning_rate": 3.908835033730993e-06, "loss": 1.1589, "step": 17500 }, { "epoch": 0.33, "learning_rate": 3.908708832583696e-06, "loss": 0.9631, "step": 17501 }, { "epoch": 0.33, "learning_rate": 3.908582626176322e-06, "loss": 0.8596, "step": 17502 }, { "epoch": 0.33, "learning_rate": 3.908456414509344e-06, "loss": 0.921, "step": 17503 }, { "epoch": 0.33, "learning_rate": 3.9083301975832335e-06, "loss": 1.0777, "step": 17504 }, { "epoch": 0.33, "learning_rate": 3.90820397539846e-06, "loss": 1.0779, "step": 17505 }, { "epoch": 0.33, "learning_rate": 3.908077747955498e-06, "loss": 1.0963, "step": 17506 }, { "epoch": 0.33, "learning_rate": 3.9079515152548156e-06, "loss": 0.8794, "step": 17507 }, { "epoch": 0.33, "learning_rate": 3.907825277296885e-06, "loss": 1.0926, "step": 17508 }, { "epoch": 0.33, "learning_rate": 3.907699034082179e-06, "loss": 0.9696, "step": 17509 }, { "epoch": 0.33, "learning_rate": 3.907572785611167e-06, "loss": 0.9241, "step": 17510 }, { "epoch": 0.33, "learning_rate": 3.907446531884322e-06, "loss": 0.8844, "step": 17511 }, { "epoch": 0.33, "learning_rate": 3.907320272902114e-06, "loss": 1.1652, "step": 17512 }, { "epoch": 0.33, "learning_rate": 3.9071940086650165e-06, "loss": 0.9673, "step": 17513 }, { "epoch": 0.33, "learning_rate": 3.907067739173499e-06, "loss": 0.8655, "step": 17514 }, { "epoch": 0.33, "learning_rate": 3.906941464428033e-06, "loss": 1.1337, "step": 17515 }, { "epoch": 0.33, "learning_rate": 3.906815184429092e-06, "loss": 0.7691, "step": 17516 }, { "epoch": 0.33, "learning_rate": 3.906688899177146e-06, "loss": 1.1055, "step": 17517 }, { "epoch": 0.33, "learning_rate": 3.906562608672666e-06, "loss": 1.0187, "step": 17518 }, { "epoch": 0.33, "learning_rate": 3.906436312916125e-06, "loss": 1.1385, "step": 17519 }, { "epoch": 0.33, "learning_rate": 3.906310011907994e-06, "loss": 0.9701, "step": 17520 }, { "epoch": 0.33, "learning_rate": 3.906183705648744e-06, "loss": 0.963, "step": 17521 }, { "epoch": 0.33, "learning_rate": 3.906057394138848e-06, "loss": 0.9567, "step": 17522 }, { "epoch": 0.33, "learning_rate": 3.905931077378776e-06, "loss": 1.1192, "step": 17523 }, { "epoch": 0.33, "learning_rate": 3.905804755369e-06, "loss": 1.1891, "step": 17524 }, { "epoch": 0.33, "learning_rate": 3.905678428109994e-06, "loss": 1.2181, "step": 17525 }, { "epoch": 0.33, "learning_rate": 3.905552095602227e-06, "loss": 0.8104, "step": 17526 }, { "epoch": 0.33, "learning_rate": 3.905425757846171e-06, "loss": 0.9324, "step": 17527 }, { "epoch": 0.33, "learning_rate": 3.905299414842298e-06, "loss": 1.0417, "step": 17528 }, { "epoch": 0.33, "learning_rate": 3.905173066591081e-06, "loss": 0.7052, "step": 17529 }, { "epoch": 0.33, "learning_rate": 3.90504671309299e-06, "loss": 0.8046, "step": 17530 }, { "epoch": 0.33, "learning_rate": 3.904920354348499e-06, "loss": 1.1272, "step": 17531 }, { "epoch": 0.33, "learning_rate": 3.904793990358077e-06, "loss": 1.0489, "step": 17532 }, { "epoch": 0.33, "learning_rate": 3.904667621122198e-06, "loss": 1.076, "step": 17533 }, { "epoch": 0.33, "learning_rate": 3.904541246641333e-06, "loss": 0.9319, "step": 17534 }, { "epoch": 0.33, "learning_rate": 3.904414866915954e-06, "loss": 0.8101, "step": 17535 }, { "epoch": 0.33, "learning_rate": 3.904288481946534e-06, "loss": 0.9581, "step": 17536 }, { "epoch": 0.33, "learning_rate": 3.904162091733543e-06, "loss": 1.244, "step": 17537 }, { "epoch": 0.33, "learning_rate": 3.904035696277454e-06, "loss": 1.1998, "step": 17538 }, { "epoch": 0.33, "learning_rate": 3.903909295578738e-06, "loss": 0.7318, "step": 17539 }, { "epoch": 0.33, "learning_rate": 3.903782889637868e-06, "loss": 0.9611, "step": 17540 }, { "epoch": 0.33, "learning_rate": 3.903656478455317e-06, "loss": 0.7045, "step": 17541 }, { "epoch": 0.33, "learning_rate": 3.9035300620315545e-06, "loss": 0.9318, "step": 17542 }, { "epoch": 0.33, "learning_rate": 3.9034036403670535e-06, "loss": 0.939, "step": 17543 }, { "epoch": 0.33, "learning_rate": 3.9032772134622875e-06, "loss": 1.1242, "step": 17544 }, { "epoch": 0.33, "learning_rate": 3.903150781317727e-06, "loss": 1.0394, "step": 17545 }, { "epoch": 0.33, "learning_rate": 3.903024343933844e-06, "loss": 0.766, "step": 17546 }, { "epoch": 0.33, "learning_rate": 3.902897901311111e-06, "loss": 0.8459, "step": 17547 }, { "epoch": 0.33, "learning_rate": 3.902771453450001e-06, "loss": 1.0114, "step": 17548 }, { "epoch": 0.33, "learning_rate": 3.902645000350985e-06, "loss": 0.8203, "step": 17549 }, { "epoch": 0.33, "learning_rate": 3.902518542014536e-06, "loss": 1.2693, "step": 17550 }, { "epoch": 0.33, "learning_rate": 3.902392078441125e-06, "loss": 1.0963, "step": 17551 }, { "epoch": 0.33, "learning_rate": 3.902265609631226e-06, "loss": 0.8456, "step": 17552 }, { "epoch": 0.33, "learning_rate": 3.902139135585309e-06, "loss": 1.0807, "step": 17553 }, { "epoch": 0.33, "learning_rate": 3.902012656303849e-06, "loss": 1.064, "step": 17554 }, { "epoch": 0.33, "learning_rate": 3.901886171787315e-06, "loss": 1.0065, "step": 17555 }, { "epoch": 0.33, "learning_rate": 3.9017596820361816e-06, "loss": 0.9226, "step": 17556 }, { "epoch": 0.33, "learning_rate": 3.901633187050921e-06, "loss": 0.8643, "step": 17557 }, { "epoch": 0.33, "learning_rate": 3.9015066868320055e-06, "loss": 0.8913, "step": 17558 }, { "epoch": 0.33, "learning_rate": 3.901380181379906e-06, "loss": 1.0493, "step": 17559 }, { "epoch": 0.33, "learning_rate": 3.901253670695096e-06, "loss": 0.8089, "step": 17560 }, { "epoch": 0.33, "learning_rate": 3.901127154778048e-06, "loss": 0.8439, "step": 17561 }, { "epoch": 0.33, "learning_rate": 3.901000633629234e-06, "loss": 1.1619, "step": 17562 }, { "epoch": 0.33, "learning_rate": 3.900874107249126e-06, "loss": 0.9847, "step": 17563 }, { "epoch": 0.33, "learning_rate": 3.900747575638199e-06, "loss": 0.9538, "step": 17564 }, { "epoch": 0.33, "learning_rate": 3.9006210387969215e-06, "loss": 0.8836, "step": 17565 }, { "epoch": 0.33, "learning_rate": 3.900494496725769e-06, "loss": 0.8961, "step": 17566 }, { "epoch": 0.33, "learning_rate": 3.900367949425212e-06, "loss": 1.0104, "step": 17567 }, { "epoch": 0.33, "learning_rate": 3.900241396895726e-06, "loss": 1.0498, "step": 17568 }, { "epoch": 0.33, "learning_rate": 3.9001148391377795e-06, "loss": 0.9984, "step": 17569 }, { "epoch": 0.33, "learning_rate": 3.899988276151848e-06, "loss": 0.9023, "step": 17570 }, { "epoch": 0.33, "learning_rate": 3.899861707938403e-06, "loss": 0.8925, "step": 17571 }, { "epoch": 0.33, "learning_rate": 3.899735134497917e-06, "loss": 0.9049, "step": 17572 }, { "epoch": 0.33, "learning_rate": 3.899608555830864e-06, "loss": 1.0032, "step": 17573 }, { "epoch": 0.33, "learning_rate": 3.899481971937714e-06, "loss": 0.8564, "step": 17574 }, { "epoch": 0.33, "learning_rate": 3.899355382818942e-06, "loss": 1.0289, "step": 17575 }, { "epoch": 0.33, "learning_rate": 3.89922878847502e-06, "loss": 0.9128, "step": 17576 }, { "epoch": 0.33, "learning_rate": 3.8991021889064205e-06, "loss": 0.8986, "step": 17577 }, { "epoch": 0.33, "learning_rate": 3.8989755841136166e-06, "loss": 0.9423, "step": 17578 }, { "epoch": 0.33, "learning_rate": 3.898848974097082e-06, "loss": 0.981, "step": 17579 }, { "epoch": 0.33, "learning_rate": 3.898722358857286e-06, "loss": 1.1093, "step": 17580 }, { "epoch": 0.33, "learning_rate": 3.8985957383947045e-06, "loss": 1.1735, "step": 17581 }, { "epoch": 0.33, "learning_rate": 3.898469112709809e-06, "loss": 0.9732, "step": 17582 }, { "epoch": 0.33, "learning_rate": 3.898342481803073e-06, "loss": 0.8687, "step": 17583 }, { "epoch": 0.33, "learning_rate": 3.898215845674969e-06, "loss": 0.9268, "step": 17584 }, { "epoch": 0.33, "learning_rate": 3.89808920432597e-06, "loss": 0.8598, "step": 17585 }, { "epoch": 0.33, "learning_rate": 3.897962557756549e-06, "loss": 0.7441, "step": 17586 }, { "epoch": 0.33, "learning_rate": 3.897835905967179e-06, "loss": 1.0576, "step": 17587 }, { "epoch": 0.33, "learning_rate": 3.897709248958331e-06, "loss": 0.6853, "step": 17588 }, { "epoch": 0.33, "learning_rate": 3.89758258673048e-06, "loss": 1.1134, "step": 17589 }, { "epoch": 0.33, "learning_rate": 3.8974559192841e-06, "loss": 0.9104, "step": 17590 }, { "epoch": 0.33, "learning_rate": 3.897329246619661e-06, "loss": 0.9102, "step": 17591 }, { "epoch": 0.33, "learning_rate": 3.897202568737638e-06, "loss": 0.8426, "step": 17592 }, { "epoch": 0.33, "learning_rate": 3.897075885638504e-06, "loss": 0.9636, "step": 17593 }, { "epoch": 0.33, "learning_rate": 3.89694919732273e-06, "loss": 1.0645, "step": 17594 }, { "epoch": 0.33, "learning_rate": 3.896822503790791e-06, "loss": 0.9656, "step": 17595 }, { "epoch": 0.33, "learning_rate": 3.89669580504316e-06, "loss": 0.9058, "step": 17596 }, { "epoch": 0.33, "learning_rate": 3.89656910108031e-06, "loss": 0.7726, "step": 17597 }, { "epoch": 0.33, "learning_rate": 3.896442391902714e-06, "loss": 0.9279, "step": 17598 }, { "epoch": 0.33, "learning_rate": 3.896315677510844e-06, "loss": 0.8632, "step": 17599 }, { "epoch": 0.33, "learning_rate": 3.896188957905174e-06, "loss": 1.0393, "step": 17600 }, { "epoch": 0.33, "learning_rate": 3.8960622330861775e-06, "loss": 0.9199, "step": 17601 }, { "epoch": 0.33, "learning_rate": 3.895935503054328e-06, "loss": 0.8694, "step": 17602 }, { "epoch": 0.33, "learning_rate": 3.895808767810097e-06, "loss": 0.7635, "step": 17603 }, { "epoch": 0.33, "learning_rate": 3.895682027353961e-06, "loss": 0.8539, "step": 17604 }, { "epoch": 0.33, "learning_rate": 3.895555281686389e-06, "loss": 1.1652, "step": 17605 }, { "epoch": 0.33, "learning_rate": 3.895428530807857e-06, "loss": 1.0157, "step": 17606 }, { "epoch": 0.33, "learning_rate": 3.8953017747188376e-06, "loss": 0.8723, "step": 17607 }, { "epoch": 0.33, "learning_rate": 3.895175013419804e-06, "loss": 0.7643, "step": 17608 }, { "epoch": 0.33, "learning_rate": 3.89504824691123e-06, "loss": 0.7825, "step": 17609 }, { "epoch": 0.33, "learning_rate": 3.894921475193588e-06, "loss": 0.9462, "step": 17610 }, { "epoch": 0.33, "learning_rate": 3.894794698267354e-06, "loss": 0.8649, "step": 17611 }, { "epoch": 0.33, "learning_rate": 3.894667916132997e-06, "loss": 1.215, "step": 17612 }, { "epoch": 0.33, "learning_rate": 3.894541128790993e-06, "loss": 0.9886, "step": 17613 }, { "epoch": 0.33, "learning_rate": 3.894414336241817e-06, "loss": 0.8315, "step": 17614 }, { "epoch": 0.33, "learning_rate": 3.894287538485939e-06, "loss": 0.9624, "step": 17615 }, { "epoch": 0.33, "learning_rate": 3.894160735523834e-06, "loss": 0.8281, "step": 17616 }, { "epoch": 0.33, "learning_rate": 3.894033927355977e-06, "loss": 0.9602, "step": 17617 }, { "epoch": 0.33, "learning_rate": 3.8939071139828386e-06, "loss": 1.2554, "step": 17618 }, { "epoch": 0.33, "learning_rate": 3.8937802954048945e-06, "loss": 1.2491, "step": 17619 }, { "epoch": 0.33, "learning_rate": 3.8936534716226175e-06, "loss": 0.9448, "step": 17620 }, { "epoch": 0.33, "learning_rate": 3.893526642636481e-06, "loss": 0.9432, "step": 17621 }, { "epoch": 0.33, "learning_rate": 3.893399808446958e-06, "loss": 0.8773, "step": 17622 }, { "epoch": 0.33, "learning_rate": 3.8932729690545245e-06, "loss": 0.7443, "step": 17623 }, { "epoch": 0.33, "learning_rate": 3.893146124459651e-06, "loss": 1.0961, "step": 17624 }, { "epoch": 0.33, "learning_rate": 3.8930192746628135e-06, "loss": 1.0898, "step": 17625 }, { "epoch": 0.33, "learning_rate": 3.892892419664484e-06, "loss": 1.1608, "step": 17626 }, { "epoch": 0.33, "learning_rate": 3.892765559465137e-06, "loss": 0.7441, "step": 17627 }, { "epoch": 0.33, "learning_rate": 3.892638694065247e-06, "loss": 1.0994, "step": 17628 }, { "epoch": 0.33, "learning_rate": 3.892511823465286e-06, "loss": 0.9625, "step": 17629 }, { "epoch": 0.33, "learning_rate": 3.892384947665728e-06, "loss": 1.0858, "step": 17630 }, { "epoch": 0.33, "learning_rate": 3.892258066667049e-06, "loss": 1.1181, "step": 17631 }, { "epoch": 0.33, "learning_rate": 3.89213118046972e-06, "loss": 1.0294, "step": 17632 }, { "epoch": 0.33, "learning_rate": 3.892004289074216e-06, "loss": 1.0215, "step": 17633 }, { "epoch": 0.33, "learning_rate": 3.891877392481011e-06, "loss": 0.9214, "step": 17634 }, { "epoch": 0.33, "learning_rate": 3.891750490690578e-06, "loss": 0.8541, "step": 17635 }, { "epoch": 0.33, "learning_rate": 3.891623583703391e-06, "loss": 0.9543, "step": 17636 }, { "epoch": 0.33, "learning_rate": 3.891496671519924e-06, "loss": 1.087, "step": 17637 }, { "epoch": 0.33, "learning_rate": 3.891369754140652e-06, "loss": 1.0585, "step": 17638 }, { "epoch": 0.33, "learning_rate": 3.891242831566048e-06, "loss": 1.11, "step": 17639 }, { "epoch": 0.33, "learning_rate": 3.891115903796586e-06, "loss": 0.9055, "step": 17640 }, { "epoch": 0.33, "learning_rate": 3.890988970832739e-06, "loss": 0.8388, "step": 17641 }, { "epoch": 0.33, "learning_rate": 3.8908620326749826e-06, "loss": 0.854, "step": 17642 }, { "epoch": 0.33, "learning_rate": 3.89073508932379e-06, "loss": 1.0343, "step": 17643 }, { "epoch": 0.33, "learning_rate": 3.8906081407796345e-06, "loss": 1.1178, "step": 17644 }, { "epoch": 0.33, "learning_rate": 3.890481187042992e-06, "loss": 0.9106, "step": 17645 }, { "epoch": 0.33, "learning_rate": 3.890354228114334e-06, "loss": 0.8017, "step": 17646 }, { "epoch": 0.33, "learning_rate": 3.890227263994137e-06, "loss": 0.8961, "step": 17647 }, { "epoch": 0.33, "learning_rate": 3.8901002946828736e-06, "loss": 1.0756, "step": 17648 }, { "epoch": 0.33, "learning_rate": 3.889973320181018e-06, "loss": 1.1463, "step": 17649 }, { "epoch": 0.33, "learning_rate": 3.889846340489046e-06, "loss": 1.1984, "step": 17650 }, { "epoch": 0.33, "learning_rate": 3.889719355607429e-06, "loss": 0.9555, "step": 17651 }, { "epoch": 0.33, "learning_rate": 3.889592365536643e-06, "loss": 0.9502, "step": 17652 }, { "epoch": 0.33, "learning_rate": 3.889465370277162e-06, "loss": 1.0386, "step": 17653 }, { "epoch": 0.33, "learning_rate": 3.8893383698294595e-06, "loss": 0.8742, "step": 17654 }, { "epoch": 0.33, "learning_rate": 3.88921136419401e-06, "loss": 0.9673, "step": 17655 }, { "epoch": 0.33, "learning_rate": 3.8890843533712885e-06, "loss": 0.9182, "step": 17656 }, { "epoch": 0.33, "learning_rate": 3.888957337361768e-06, "loss": 0.8688, "step": 17657 }, { "epoch": 0.33, "learning_rate": 3.888830316165924e-06, "loss": 0.9105, "step": 17658 }, { "epoch": 0.33, "learning_rate": 3.888703289784229e-06, "loss": 0.8762, "step": 17659 }, { "epoch": 0.33, "learning_rate": 3.888576258217159e-06, "loss": 1.0888, "step": 17660 }, { "epoch": 0.33, "learning_rate": 3.8884492214651884e-06, "loss": 0.7621, "step": 17661 }, { "epoch": 0.33, "learning_rate": 3.888322179528791e-06, "loss": 0.9383, "step": 17662 }, { "epoch": 0.33, "learning_rate": 3.88819513240844e-06, "loss": 1.0966, "step": 17663 }, { "epoch": 0.33, "learning_rate": 3.888068080104612e-06, "loss": 1.0081, "step": 17664 }, { "epoch": 0.33, "learning_rate": 3.8879410226177805e-06, "loss": 0.9427, "step": 17665 }, { "epoch": 0.33, "learning_rate": 3.887813959948419e-06, "loss": 0.8318, "step": 17666 }, { "epoch": 0.33, "learning_rate": 3.8876868920970034e-06, "loss": 0.8808, "step": 17667 }, { "epoch": 0.33, "learning_rate": 3.887559819064007e-06, "loss": 1.0819, "step": 17668 }, { "epoch": 0.33, "learning_rate": 3.887432740849904e-06, "loss": 0.9968, "step": 17669 }, { "epoch": 0.33, "learning_rate": 3.8873056574551715e-06, "loss": 0.9939, "step": 17670 }, { "epoch": 0.33, "learning_rate": 3.887178568880281e-06, "loss": 0.9679, "step": 17671 }, { "epoch": 0.33, "learning_rate": 3.887051475125709e-06, "loss": 0.8015, "step": 17672 }, { "epoch": 0.33, "learning_rate": 3.8869243761919295e-06, "loss": 0.7572, "step": 17673 }, { "epoch": 0.33, "learning_rate": 3.886797272079415e-06, "loss": 0.9159, "step": 17674 }, { "epoch": 0.33, "learning_rate": 3.886670162788644e-06, "loss": 1.1201, "step": 17675 }, { "epoch": 0.33, "learning_rate": 3.886543048320089e-06, "loss": 1.0459, "step": 17676 }, { "epoch": 0.33, "learning_rate": 3.886415928674225e-06, "loss": 1.0275, "step": 17677 }, { "epoch": 0.33, "learning_rate": 3.8862888038515244e-06, "loss": 1.0986, "step": 17678 }, { "epoch": 0.33, "learning_rate": 3.886161673852465e-06, "loss": 0.792, "step": 17679 }, { "epoch": 0.33, "learning_rate": 3.886034538677521e-06, "loss": 0.9231, "step": 17680 }, { "epoch": 0.33, "learning_rate": 3.885907398327166e-06, "loss": 1.0339, "step": 17681 }, { "epoch": 0.33, "learning_rate": 3.885780252801875e-06, "loss": 0.7106, "step": 17682 }, { "epoch": 0.33, "learning_rate": 3.885653102102124e-06, "loss": 1.0499, "step": 17683 }, { "epoch": 0.33, "learning_rate": 3.885525946228386e-06, "loss": 0.8804, "step": 17684 }, { "epoch": 0.33, "learning_rate": 3.885398785181137e-06, "loss": 1.0667, "step": 17685 }, { "epoch": 0.33, "learning_rate": 3.8852716189608505e-06, "loss": 0.957, "step": 17686 }, { "epoch": 0.33, "learning_rate": 3.885144447568004e-06, "loss": 1.0853, "step": 17687 }, { "epoch": 0.33, "learning_rate": 3.8850172710030685e-06, "loss": 1.0287, "step": 17688 }, { "epoch": 0.33, "learning_rate": 3.884890089266523e-06, "loss": 0.8422, "step": 17689 }, { "epoch": 0.33, "learning_rate": 3.884762902358839e-06, "loss": 0.8907, "step": 17690 }, { "epoch": 0.33, "learning_rate": 3.8846357102804935e-06, "loss": 0.7572, "step": 17691 }, { "epoch": 0.33, "learning_rate": 3.884508513031961e-06, "loss": 0.8117, "step": 17692 }, { "epoch": 0.33, "learning_rate": 3.884381310613715e-06, "loss": 0.9264, "step": 17693 }, { "epoch": 0.33, "learning_rate": 3.884254103026232e-06, "loss": 1.2071, "step": 17694 }, { "epoch": 0.33, "learning_rate": 3.884126890269987e-06, "loss": 0.7895, "step": 17695 }, { "epoch": 0.33, "learning_rate": 3.883999672345454e-06, "loss": 0.7085, "step": 17696 }, { "epoch": 0.33, "learning_rate": 3.883872449253109e-06, "loss": 0.8692, "step": 17697 }, { "epoch": 0.33, "learning_rate": 3.883745220993427e-06, "loss": 0.9177, "step": 17698 }, { "epoch": 0.33, "learning_rate": 3.883617987566882e-06, "loss": 1.1764, "step": 17699 }, { "epoch": 0.33, "learning_rate": 3.883490748973952e-06, "loss": 1.1215, "step": 17700 }, { "epoch": 0.33, "learning_rate": 3.8833635052151074e-06, "loss": 0.9378, "step": 17701 }, { "epoch": 0.33, "learning_rate": 3.883236256290827e-06, "loss": 0.7198, "step": 17702 }, { "epoch": 0.33, "learning_rate": 3.883109002201585e-06, "loss": 0.8638, "step": 17703 }, { "epoch": 0.33, "learning_rate": 3.882981742947855e-06, "loss": 0.8636, "step": 17704 }, { "epoch": 0.33, "learning_rate": 3.8828544785301155e-06, "loss": 0.9387, "step": 17705 }, { "epoch": 0.33, "learning_rate": 3.882727208948838e-06, "loss": 1.1392, "step": 17706 }, { "epoch": 0.33, "learning_rate": 3.8825999342045016e-06, "loss": 0.9879, "step": 17707 }, { "epoch": 0.33, "learning_rate": 3.8824726542975786e-06, "loss": 0.9084, "step": 17708 }, { "epoch": 0.33, "learning_rate": 3.8823453692285445e-06, "loss": 0.7982, "step": 17709 }, { "epoch": 0.33, "learning_rate": 3.8822180789978755e-06, "loss": 0.7758, "step": 17710 }, { "epoch": 0.33, "learning_rate": 3.882090783606046e-06, "loss": 0.8337, "step": 17711 }, { "epoch": 0.33, "learning_rate": 3.881963483053533e-06, "loss": 1.045, "step": 17712 }, { "epoch": 0.33, "learning_rate": 3.88183617734081e-06, "loss": 1.0101, "step": 17713 }, { "epoch": 0.33, "learning_rate": 3.8817088664683535e-06, "loss": 0.9954, "step": 17714 }, { "epoch": 0.33, "learning_rate": 3.881581550436638e-06, "loss": 0.9497, "step": 17715 }, { "epoch": 0.33, "learning_rate": 3.88145422924614e-06, "loss": 0.847, "step": 17716 }, { "epoch": 0.33, "learning_rate": 3.881326902897333e-06, "loss": 0.9077, "step": 17717 }, { "epoch": 0.33, "learning_rate": 3.881199571390694e-06, "loss": 1.0789, "step": 17718 }, { "epoch": 0.33, "learning_rate": 3.881072234726699e-06, "loss": 1.1548, "step": 17719 }, { "epoch": 0.33, "learning_rate": 3.880944892905822e-06, "loss": 0.9636, "step": 17720 }, { "epoch": 0.33, "learning_rate": 3.88081754592854e-06, "loss": 1.0256, "step": 17721 }, { "epoch": 0.33, "learning_rate": 3.880690193795327e-06, "loss": 0.7795, "step": 17722 }, { "epoch": 0.33, "learning_rate": 3.8805628365066596e-06, "loss": 0.9099, "step": 17723 }, { "epoch": 0.33, "learning_rate": 3.880435474063012e-06, "loss": 1.0453, "step": 17724 }, { "epoch": 0.33, "learning_rate": 3.880308106464862e-06, "loss": 1.0595, "step": 17725 }, { "epoch": 0.33, "learning_rate": 3.8801807337126825e-06, "loss": 1.1716, "step": 17726 }, { "epoch": 0.33, "learning_rate": 3.880053355806951e-06, "loss": 0.8461, "step": 17727 }, { "epoch": 0.33, "learning_rate": 3.879925972748142e-06, "loss": 0.8107, "step": 17728 }, { "epoch": 0.33, "learning_rate": 3.879798584536732e-06, "loss": 1.0837, "step": 17729 }, { "epoch": 0.33, "learning_rate": 3.879671191173197e-06, "loss": 0.8218, "step": 17730 }, { "epoch": 0.33, "learning_rate": 3.879543792658011e-06, "loss": 1.2092, "step": 17731 }, { "epoch": 0.33, "learning_rate": 3.879416388991652e-06, "loss": 0.6579, "step": 17732 }, { "epoch": 0.33, "learning_rate": 3.879288980174594e-06, "loss": 0.6856, "step": 17733 }, { "epoch": 0.33, "learning_rate": 3.879161566207314e-06, "loss": 0.9217, "step": 17734 }, { "epoch": 0.33, "learning_rate": 3.879034147090286e-06, "loss": 1.0228, "step": 17735 }, { "epoch": 0.33, "learning_rate": 3.878906722823988e-06, "loss": 0.9517, "step": 17736 }, { "epoch": 0.33, "learning_rate": 3.878779293408893e-06, "loss": 1.0197, "step": 17737 }, { "epoch": 0.33, "learning_rate": 3.878651858845478e-06, "loss": 1.0003, "step": 17738 }, { "epoch": 0.33, "learning_rate": 3.878524419134221e-06, "loss": 1.0517, "step": 17739 }, { "epoch": 0.33, "learning_rate": 3.878396974275595e-06, "loss": 0.8987, "step": 17740 }, { "epoch": 0.33, "learning_rate": 3.878269524270077e-06, "loss": 0.9529, "step": 17741 }, { "epoch": 0.33, "learning_rate": 3.8781420691181435e-06, "loss": 0.9354, "step": 17742 }, { "epoch": 0.33, "learning_rate": 3.878014608820269e-06, "loss": 0.9485, "step": 17743 }, { "epoch": 0.33, "learning_rate": 3.877887143376931e-06, "loss": 0.8581, "step": 17744 }, { "epoch": 0.33, "learning_rate": 3.8777596727886035e-06, "loss": 0.957, "step": 17745 }, { "epoch": 0.33, "learning_rate": 3.877632197055764e-06, "loss": 0.9041, "step": 17746 }, { "epoch": 0.33, "learning_rate": 3.8775047161788894e-06, "loss": 1.0305, "step": 17747 }, { "epoch": 0.33, "learning_rate": 3.877377230158454e-06, "loss": 0.8712, "step": 17748 }, { "epoch": 0.33, "learning_rate": 3.877249738994932e-06, "loss": 0.8964, "step": 17749 }, { "epoch": 0.33, "learning_rate": 3.877122242688804e-06, "loss": 0.7941, "step": 17750 }, { "epoch": 0.33, "learning_rate": 3.8769947412405436e-06, "loss": 0.8934, "step": 17751 }, { "epoch": 0.33, "learning_rate": 3.876867234650627e-06, "loss": 0.9389, "step": 17752 }, { "epoch": 0.33, "learning_rate": 3.876739722919529e-06, "loss": 0.9131, "step": 17753 }, { "epoch": 0.33, "learning_rate": 3.876612206047729e-06, "loss": 0.8343, "step": 17754 }, { "epoch": 0.33, "learning_rate": 3.8764846840357e-06, "loss": 0.9294, "step": 17755 }, { "epoch": 0.33, "learning_rate": 3.876357156883919e-06, "loss": 0.991, "step": 17756 }, { "epoch": 0.34, "learning_rate": 3.876229624592864e-06, "loss": 1.0607, "step": 17757 }, { "epoch": 0.34, "learning_rate": 3.8761020871630095e-06, "loss": 0.974, "step": 17758 }, { "epoch": 0.34, "learning_rate": 3.875974544594831e-06, "loss": 0.929, "step": 17759 }, { "epoch": 0.34, "learning_rate": 3.875846996888807e-06, "loss": 0.7546, "step": 17760 }, { "epoch": 0.34, "learning_rate": 3.875719444045412e-06, "loss": 0.7603, "step": 17761 }, { "epoch": 0.34, "learning_rate": 3.875591886065122e-06, "loss": 0.9904, "step": 17762 }, { "epoch": 0.34, "learning_rate": 3.875464322948415e-06, "loss": 0.9744, "step": 17763 }, { "epoch": 0.34, "learning_rate": 3.875336754695766e-06, "loss": 0.9517, "step": 17764 }, { "epoch": 0.34, "learning_rate": 3.875209181307652e-06, "loss": 1.0503, "step": 17765 }, { "epoch": 0.34, "learning_rate": 3.8750816027845485e-06, "loss": 0.9437, "step": 17766 }, { "epoch": 0.34, "learning_rate": 3.874954019126933e-06, "loss": 0.8868, "step": 17767 }, { "epoch": 0.34, "learning_rate": 3.874826430335281e-06, "loss": 1.0172, "step": 17768 }, { "epoch": 0.34, "learning_rate": 3.87469883641007e-06, "loss": 1.0371, "step": 17769 }, { "epoch": 0.34, "learning_rate": 3.874571237351774e-06, "loss": 1.0441, "step": 17770 }, { "epoch": 0.34, "learning_rate": 3.874443633160873e-06, "loss": 0.91, "step": 17771 }, { "epoch": 0.34, "learning_rate": 3.874316023837841e-06, "loss": 0.8698, "step": 17772 }, { "epoch": 0.34, "learning_rate": 3.874188409383155e-06, "loss": 0.8953, "step": 17773 }, { "epoch": 0.34, "learning_rate": 3.874060789797292e-06, "loss": 1.2322, "step": 17774 }, { "epoch": 0.34, "learning_rate": 3.8739331650807275e-06, "loss": 1.1407, "step": 17775 }, { "epoch": 0.34, "learning_rate": 3.873805535233939e-06, "loss": 0.9805, "step": 17776 }, { "epoch": 0.34, "learning_rate": 3.873677900257403e-06, "loss": 0.9274, "step": 17777 }, { "epoch": 0.34, "learning_rate": 3.873550260151595e-06, "loss": 0.9578, "step": 17778 }, { "epoch": 0.34, "learning_rate": 3.873422614916993e-06, "loss": 0.8376, "step": 17779 }, { "epoch": 0.34, "learning_rate": 3.873294964554073e-06, "loss": 1.0132, "step": 17780 }, { "epoch": 0.34, "learning_rate": 3.873167309063312e-06, "loss": 1.1602, "step": 17781 }, { "epoch": 0.34, "learning_rate": 3.873039648445186e-06, "loss": 1.2044, "step": 17782 }, { "epoch": 0.34, "learning_rate": 3.872911982700172e-06, "loss": 0.8145, "step": 17783 }, { "epoch": 0.34, "learning_rate": 3.872784311828746e-06, "loss": 0.8409, "step": 17784 }, { "epoch": 0.34, "learning_rate": 3.872656635831387e-06, "loss": 0.8752, "step": 17785 }, { "epoch": 0.34, "learning_rate": 3.87252895470857e-06, "loss": 0.8655, "step": 17786 }, { "epoch": 0.34, "learning_rate": 3.872401268460772e-06, "loss": 1.1485, "step": 17787 }, { "epoch": 0.34, "learning_rate": 3.872273577088469e-06, "loss": 0.8848, "step": 17788 }, { "epoch": 0.34, "learning_rate": 3.872145880592139e-06, "loss": 1.054, "step": 17789 }, { "epoch": 0.34, "learning_rate": 3.8720181789722575e-06, "loss": 0.8093, "step": 17790 }, { "epoch": 0.34, "learning_rate": 3.871890472229303e-06, "loss": 0.8368, "step": 17791 }, { "epoch": 0.34, "learning_rate": 3.871762760363752e-06, "loss": 0.9711, "step": 17792 }, { "epoch": 0.34, "learning_rate": 3.87163504337608e-06, "loss": 1.2104, "step": 17793 }, { "epoch": 0.34, "learning_rate": 3.871507321266765e-06, "loss": 1.0856, "step": 17794 }, { "epoch": 0.34, "learning_rate": 3.8713795940362846e-06, "loss": 1.0169, "step": 17795 }, { "epoch": 0.34, "learning_rate": 3.8712518616851136e-06, "loss": 0.9192, "step": 17796 }, { "epoch": 0.34, "learning_rate": 3.87112412421373e-06, "loss": 1.2195, "step": 17797 }, { "epoch": 0.34, "learning_rate": 3.870996381622613e-06, "loss": 0.813, "step": 17798 }, { "epoch": 0.34, "learning_rate": 3.8708686339122355e-06, "loss": 0.9794, "step": 17799 }, { "epoch": 0.34, "learning_rate": 3.8707408810830774e-06, "loss": 1.0906, "step": 17800 }, { "epoch": 0.34, "learning_rate": 3.870613123135615e-06, "loss": 1.0155, "step": 17801 }, { "epoch": 0.34, "learning_rate": 3.870485360070325e-06, "loss": 0.8108, "step": 17802 }, { "epoch": 0.34, "learning_rate": 3.870357591887684e-06, "loss": 0.8859, "step": 17803 }, { "epoch": 0.34, "learning_rate": 3.8702298185881705e-06, "loss": 0.8936, "step": 17804 }, { "epoch": 0.34, "learning_rate": 3.870102040172261e-06, "loss": 0.7854, "step": 17805 }, { "epoch": 0.34, "learning_rate": 3.869974256640432e-06, "loss": 1.0536, "step": 17806 }, { "epoch": 0.34, "learning_rate": 3.869846467993161e-06, "loss": 0.7903, "step": 17807 }, { "epoch": 0.34, "learning_rate": 3.869718674230926e-06, "loss": 1.0623, "step": 17808 }, { "epoch": 0.34, "learning_rate": 3.869590875354203e-06, "loss": 0.7112, "step": 17809 }, { "epoch": 0.34, "learning_rate": 3.86946307136347e-06, "loss": 0.7753, "step": 17810 }, { "epoch": 0.34, "learning_rate": 3.869335262259204e-06, "loss": 1.0401, "step": 17811 }, { "epoch": 0.34, "learning_rate": 3.869207448041882e-06, "loss": 0.8806, "step": 17812 }, { "epoch": 0.34, "learning_rate": 3.869079628711981e-06, "loss": 0.9911, "step": 17813 }, { "epoch": 0.34, "learning_rate": 3.868951804269979e-06, "loss": 0.8266, "step": 17814 }, { "epoch": 0.34, "learning_rate": 3.868823974716353e-06, "loss": 0.7817, "step": 17815 }, { "epoch": 0.34, "learning_rate": 3.86869614005158e-06, "loss": 0.8557, "step": 17816 }, { "epoch": 0.34, "learning_rate": 3.868568300276137e-06, "loss": 0.9025, "step": 17817 }, { "epoch": 0.34, "learning_rate": 3.868440455390502e-06, "loss": 1.1159, "step": 17818 }, { "epoch": 0.34, "learning_rate": 3.868312605395153e-06, "loss": 1.1379, "step": 17819 }, { "epoch": 0.34, "learning_rate": 3.868184750290567e-06, "loss": 1.0081, "step": 17820 }, { "epoch": 0.34, "learning_rate": 3.86805689007722e-06, "loss": 0.861, "step": 17821 }, { "epoch": 0.34, "learning_rate": 3.867929024755592e-06, "loss": 0.9407, "step": 17822 }, { "epoch": 0.34, "learning_rate": 3.867801154326157e-06, "loss": 0.7637, "step": 17823 }, { "epoch": 0.34, "learning_rate": 3.867673278789396e-06, "loss": 0.996, "step": 17824 }, { "epoch": 0.34, "learning_rate": 3.867545398145784e-06, "loss": 1.0405, "step": 17825 }, { "epoch": 0.34, "learning_rate": 3.8674175123958e-06, "loss": 1.0312, "step": 17826 }, { "epoch": 0.34, "learning_rate": 3.8672896215399206e-06, "loss": 0.9055, "step": 17827 }, { "epoch": 0.34, "learning_rate": 3.867161725578624e-06, "loss": 0.9916, "step": 17828 }, { "epoch": 0.34, "learning_rate": 3.8670338245123875e-06, "loss": 0.9623, "step": 17829 }, { "epoch": 0.34, "learning_rate": 3.866905918341688e-06, "loss": 1.0875, "step": 17830 }, { "epoch": 0.34, "learning_rate": 3.866778007067005e-06, "loss": 1.002, "step": 17831 }, { "epoch": 0.34, "learning_rate": 3.866650090688813e-06, "loss": 1.1314, "step": 17832 }, { "epoch": 0.34, "learning_rate": 3.866522169207593e-06, "loss": 0.7208, "step": 17833 }, { "epoch": 0.34, "learning_rate": 3.86639424262382e-06, "loss": 0.9115, "step": 17834 }, { "epoch": 0.34, "learning_rate": 3.8662663109379735e-06, "loss": 0.9231, "step": 17835 }, { "epoch": 0.34, "learning_rate": 3.86613837415053e-06, "loss": 0.7113, "step": 17836 }, { "epoch": 0.34, "learning_rate": 3.866010432261968e-06, "loss": 0.9274, "step": 17837 }, { "epoch": 0.34, "learning_rate": 3.865882485272765e-06, "loss": 0.8452, "step": 17838 }, { "epoch": 0.34, "learning_rate": 3.865754533183398e-06, "loss": 1.0298, "step": 17839 }, { "epoch": 0.34, "learning_rate": 3.865626575994347e-06, "loss": 0.9206, "step": 17840 }, { "epoch": 0.34, "learning_rate": 3.865498613706087e-06, "loss": 0.8404, "step": 17841 }, { "epoch": 0.34, "learning_rate": 3.8653706463190975e-06, "loss": 0.949, "step": 17842 }, { "epoch": 0.34, "learning_rate": 3.865242673833856e-06, "loss": 0.8941, "step": 17843 }, { "epoch": 0.34, "learning_rate": 3.86511469625084e-06, "loss": 1.1087, "step": 17844 }, { "epoch": 0.34, "learning_rate": 3.8649867135705265e-06, "loss": 1.0704, "step": 17845 }, { "epoch": 0.34, "learning_rate": 3.8648587257933956e-06, "loss": 0.6168, "step": 17846 }, { "epoch": 0.34, "learning_rate": 3.864730732919924e-06, "loss": 1.0445, "step": 17847 }, { "epoch": 0.34, "learning_rate": 3.86460273495059e-06, "loss": 0.8459, "step": 17848 }, { "epoch": 0.34, "learning_rate": 3.86447473188587e-06, "loss": 1.0015, "step": 17849 }, { "epoch": 0.34, "learning_rate": 3.864346723726244e-06, "loss": 1.0019, "step": 17850 }, { "epoch": 0.34, "learning_rate": 3.864218710472189e-06, "loss": 0.937, "step": 17851 }, { "epoch": 0.34, "learning_rate": 3.864090692124184e-06, "loss": 1.0082, "step": 17852 }, { "epoch": 0.34, "learning_rate": 3.8639626686827055e-06, "loss": 0.9168, "step": 17853 }, { "epoch": 0.34, "learning_rate": 3.863834640148232e-06, "loss": 0.8558, "step": 17854 }, { "epoch": 0.34, "learning_rate": 3.8637066065212425e-06, "loss": 0.748, "step": 17855 }, { "epoch": 0.34, "learning_rate": 3.8635785678022135e-06, "loss": 0.9745, "step": 17856 }, { "epoch": 0.34, "learning_rate": 3.8634505239916246e-06, "loss": 1.0267, "step": 17857 }, { "epoch": 0.34, "learning_rate": 3.863322475089953e-06, "loss": 0.925, "step": 17858 }, { "epoch": 0.34, "learning_rate": 3.863194421097677e-06, "loss": 0.9628, "step": 17859 }, { "epoch": 0.34, "learning_rate": 3.863066362015274e-06, "loss": 0.8503, "step": 17860 }, { "epoch": 0.34, "learning_rate": 3.862938297843225e-06, "loss": 0.8242, "step": 17861 }, { "epoch": 0.34, "learning_rate": 3.862810228582005e-06, "loss": 0.9702, "step": 17862 }, { "epoch": 0.34, "learning_rate": 3.862682154232093e-06, "loss": 1.0432, "step": 17863 }, { "epoch": 0.34, "learning_rate": 3.862554074793968e-06, "loss": 0.9007, "step": 17864 }, { "epoch": 0.34, "learning_rate": 3.862425990268108e-06, "loss": 0.823, "step": 17865 }, { "epoch": 0.34, "learning_rate": 3.862297900654991e-06, "loss": 0.7808, "step": 17866 }, { "epoch": 0.34, "learning_rate": 3.8621698059550946e-06, "loss": 0.9243, "step": 17867 }, { "epoch": 0.34, "learning_rate": 3.862041706168899e-06, "loss": 1.1269, "step": 17868 }, { "epoch": 0.34, "learning_rate": 3.861913601296882e-06, "loss": 0.9047, "step": 17869 }, { "epoch": 0.34, "learning_rate": 3.8617854913395205e-06, "loss": 0.8743, "step": 17870 }, { "epoch": 0.34, "learning_rate": 3.8616573762972935e-06, "loss": 0.9345, "step": 17871 }, { "epoch": 0.34, "learning_rate": 3.861529256170679e-06, "loss": 0.959, "step": 17872 }, { "epoch": 0.34, "learning_rate": 3.861401130960157e-06, "loss": 1.0092, "step": 17873 }, { "epoch": 0.34, "learning_rate": 3.861273000666205e-06, "loss": 1.1904, "step": 17874 }, { "epoch": 0.34, "learning_rate": 3.861144865289301e-06, "loss": 1.2737, "step": 17875 }, { "epoch": 0.34, "learning_rate": 3.861016724829925e-06, "loss": 0.9262, "step": 17876 }, { "epoch": 0.34, "learning_rate": 3.860888579288552e-06, "loss": 0.7701, "step": 17877 }, { "epoch": 0.34, "learning_rate": 3.860760428665664e-06, "loss": 0.7971, "step": 17878 }, { "epoch": 0.34, "learning_rate": 3.860632272961739e-06, "loss": 0.8733, "step": 17879 }, { "epoch": 0.34, "learning_rate": 3.860504112177254e-06, "loss": 1.0566, "step": 17880 }, { "epoch": 0.34, "learning_rate": 3.860375946312687e-06, "loss": 1.0359, "step": 17881 }, { "epoch": 0.34, "learning_rate": 3.86024777536852e-06, "loss": 0.9978, "step": 17882 }, { "epoch": 0.34, "learning_rate": 3.86011959934523e-06, "loss": 0.994, "step": 17883 }, { "epoch": 0.34, "learning_rate": 3.859991418243294e-06, "loss": 0.9148, "step": 17884 }, { "epoch": 0.34, "learning_rate": 3.859863232063191e-06, "loss": 0.985, "step": 17885 }, { "epoch": 0.34, "learning_rate": 3.859735040805401e-06, "loss": 0.7263, "step": 17886 }, { "epoch": 0.34, "learning_rate": 3.859606844470402e-06, "loss": 1.2274, "step": 17887 }, { "epoch": 0.34, "learning_rate": 3.859478643058674e-06, "loss": 0.8704, "step": 17888 }, { "epoch": 0.34, "learning_rate": 3.859350436570693e-06, "loss": 0.9861, "step": 17889 }, { "epoch": 0.34, "learning_rate": 3.859222225006939e-06, "loss": 0.8522, "step": 17890 }, { "epoch": 0.34, "learning_rate": 3.859094008367892e-06, "loss": 0.8953, "step": 17891 }, { "epoch": 0.34, "learning_rate": 3.858965786654029e-06, "loss": 0.8453, "step": 17892 }, { "epoch": 0.34, "learning_rate": 3.858837559865829e-06, "loss": 0.9797, "step": 17893 }, { "epoch": 0.34, "learning_rate": 3.858709328003771e-06, "loss": 0.8637, "step": 17894 }, { "epoch": 0.34, "learning_rate": 3.858581091068335e-06, "loss": 1.1254, "step": 17895 }, { "epoch": 0.34, "learning_rate": 3.8584528490599995e-06, "loss": 0.8762, "step": 17896 }, { "epoch": 0.34, "learning_rate": 3.858324601979242e-06, "loss": 0.9724, "step": 17897 }, { "epoch": 0.34, "learning_rate": 3.858196349826541e-06, "loss": 0.8018, "step": 17898 }, { "epoch": 0.34, "learning_rate": 3.858068092602377e-06, "loss": 0.8844, "step": 17899 }, { "epoch": 0.34, "learning_rate": 3.857939830307229e-06, "loss": 1.0744, "step": 17900 }, { "epoch": 0.34, "learning_rate": 3.8578115629415745e-06, "loss": 0.8376, "step": 17901 }, { "epoch": 0.34, "learning_rate": 3.857683290505894e-06, "loss": 1.0956, "step": 17902 }, { "epoch": 0.34, "learning_rate": 3.857555013000665e-06, "loss": 0.7577, "step": 17903 }, { "epoch": 0.34, "learning_rate": 3.857426730426368e-06, "loss": 0.7599, "step": 17904 }, { "epoch": 0.34, "learning_rate": 3.857298442783481e-06, "loss": 0.9993, "step": 17905 }, { "epoch": 0.34, "learning_rate": 3.857170150072484e-06, "loss": 1.1685, "step": 17906 }, { "epoch": 0.34, "learning_rate": 3.857041852293854e-06, "loss": 0.8853, "step": 17907 }, { "epoch": 0.34, "learning_rate": 3.856913549448071e-06, "loss": 0.9099, "step": 17908 }, { "epoch": 0.34, "learning_rate": 3.8567852415356156e-06, "loss": 0.7383, "step": 17909 }, { "epoch": 0.34, "learning_rate": 3.856656928556965e-06, "loss": 0.7668, "step": 17910 }, { "epoch": 0.34, "learning_rate": 3.8565286105126e-06, "loss": 1.0001, "step": 17911 }, { "epoch": 0.34, "learning_rate": 3.856400287402997e-06, "loss": 1.0199, "step": 17912 }, { "epoch": 0.34, "learning_rate": 3.856271959228638e-06, "loss": 1.1061, "step": 17913 }, { "epoch": 0.34, "learning_rate": 3.856143625990002e-06, "loss": 0.9815, "step": 17914 }, { "epoch": 0.34, "learning_rate": 3.8560152876875655e-06, "loss": 0.8415, "step": 17915 }, { "epoch": 0.34, "learning_rate": 3.8558869443218106e-06, "loss": 0.9378, "step": 17916 }, { "epoch": 0.34, "learning_rate": 3.855758595893215e-06, "loss": 0.7539, "step": 17917 }, { "epoch": 0.34, "learning_rate": 3.855630242402259e-06, "loss": 0.9195, "step": 17918 }, { "epoch": 0.34, "learning_rate": 3.85550188384942e-06, "loss": 1.2023, "step": 17919 }, { "epoch": 0.34, "learning_rate": 3.85537352023518e-06, "loss": 0.8426, "step": 17920 }, { "epoch": 0.34, "learning_rate": 3.855245151560016e-06, "loss": 0.86, "step": 17921 }, { "epoch": 0.34, "learning_rate": 3.855116777824408e-06, "loss": 0.918, "step": 17922 }, { "epoch": 0.34, "learning_rate": 3.854988399028836e-06, "loss": 0.8676, "step": 17923 }, { "epoch": 0.34, "learning_rate": 3.854860015173778e-06, "loss": 0.9845, "step": 17924 }, { "epoch": 0.34, "learning_rate": 3.854731626259715e-06, "loss": 0.8214, "step": 17925 }, { "epoch": 0.34, "learning_rate": 3.854603232287126e-06, "loss": 0.9953, "step": 17926 }, { "epoch": 0.34, "learning_rate": 3.854474833256489e-06, "loss": 1.0251, "step": 17927 }, { "epoch": 0.34, "learning_rate": 3.854346429168285e-06, "loss": 0.917, "step": 17928 }, { "epoch": 0.34, "learning_rate": 3.854218020022994e-06, "loss": 0.769, "step": 17929 }, { "epoch": 0.34, "learning_rate": 3.854089605821093e-06, "loss": 0.7247, "step": 17930 }, { "epoch": 0.34, "learning_rate": 3.853961186563063e-06, "loss": 1.16, "step": 17931 }, { "epoch": 0.34, "learning_rate": 3.853832762249385e-06, "loss": 0.9977, "step": 17932 }, { "epoch": 0.34, "learning_rate": 3.853704332880535e-06, "loss": 0.9763, "step": 17933 }, { "epoch": 0.34, "learning_rate": 3.853575898456995e-06, "loss": 0.8222, "step": 17934 }, { "epoch": 0.34, "learning_rate": 3.853447458979245e-06, "loss": 0.9224, "step": 17935 }, { "epoch": 0.34, "learning_rate": 3.8533190144477625e-06, "loss": 1.1552, "step": 17936 }, { "epoch": 0.34, "learning_rate": 3.853190564863028e-06, "loss": 1.0032, "step": 17937 }, { "epoch": 0.34, "learning_rate": 3.853062110225524e-06, "loss": 0.8899, "step": 17938 }, { "epoch": 0.34, "learning_rate": 3.852933650535725e-06, "loss": 0.7987, "step": 17939 }, { "epoch": 0.34, "learning_rate": 3.852805185794114e-06, "loss": 0.9977, "step": 17940 }, { "epoch": 0.34, "learning_rate": 3.85267671600117e-06, "loss": 0.7683, "step": 17941 }, { "epoch": 0.34, "learning_rate": 3.8525482411573736e-06, "loss": 0.7726, "step": 17942 }, { "epoch": 0.34, "learning_rate": 3.852419761263202e-06, "loss": 0.8781, "step": 17943 }, { "epoch": 0.34, "learning_rate": 3.852291276319137e-06, "loss": 1.1476, "step": 17944 }, { "epoch": 0.34, "learning_rate": 3.852162786325658e-06, "loss": 1.0304, "step": 17945 }, { "epoch": 0.34, "learning_rate": 3.852034291283244e-06, "loss": 0.859, "step": 17946 }, { "epoch": 0.34, "learning_rate": 3.851905791192376e-06, "loss": 0.8904, "step": 17947 }, { "epoch": 0.34, "learning_rate": 3.8517772860535334e-06, "loss": 0.8674, "step": 17948 }, { "epoch": 0.34, "learning_rate": 3.851648775867196e-06, "loss": 1.1436, "step": 17949 }, { "epoch": 0.34, "learning_rate": 3.851520260633843e-06, "loss": 1.187, "step": 17950 }, { "epoch": 0.34, "learning_rate": 3.851391740353955e-06, "loss": 1.0555, "step": 17951 }, { "epoch": 0.34, "learning_rate": 3.851263215028011e-06, "loss": 0.7501, "step": 17952 }, { "epoch": 0.34, "learning_rate": 3.851134684656492e-06, "loss": 0.9465, "step": 17953 }, { "epoch": 0.34, "learning_rate": 3.851006149239878e-06, "loss": 0.8596, "step": 17954 }, { "epoch": 0.34, "learning_rate": 3.8508776087786485e-06, "loss": 1.014, "step": 17955 }, { "epoch": 0.34, "learning_rate": 3.850749063273283e-06, "loss": 1.0117, "step": 17956 }, { "epoch": 0.34, "learning_rate": 3.850620512724262e-06, "loss": 0.9212, "step": 17957 }, { "epoch": 0.34, "learning_rate": 3.850491957132065e-06, "loss": 0.9023, "step": 17958 }, { "epoch": 0.34, "learning_rate": 3.850363396497173e-06, "loss": 0.7023, "step": 17959 }, { "epoch": 0.34, "learning_rate": 3.8502348308200655e-06, "loss": 0.8958, "step": 17960 }, { "epoch": 0.34, "learning_rate": 3.850106260101222e-06, "loss": 1.1477, "step": 17961 }, { "epoch": 0.34, "learning_rate": 3.849977684341124e-06, "loss": 0.9789, "step": 17962 }, { "epoch": 0.34, "learning_rate": 3.849849103540249e-06, "loss": 0.83, "step": 17963 }, { "epoch": 0.34, "learning_rate": 3.849720517699081e-06, "loss": 0.81, "step": 17964 }, { "epoch": 0.34, "learning_rate": 3.849591926818097e-06, "loss": 0.7658, "step": 17965 }, { "epoch": 0.34, "learning_rate": 3.849463330897778e-06, "loss": 1.1246, "step": 17966 }, { "epoch": 0.34, "learning_rate": 3.849334729938605e-06, "loss": 0.9313, "step": 17967 }, { "epoch": 0.34, "learning_rate": 3.849206123941057e-06, "loss": 0.8741, "step": 17968 }, { "epoch": 0.34, "learning_rate": 3.8490775129056145e-06, "loss": 1.1525, "step": 17969 }, { "epoch": 0.34, "learning_rate": 3.848948896832757e-06, "loss": 0.8895, "step": 17970 }, { "epoch": 0.34, "learning_rate": 3.8488202757229675e-06, "loss": 0.8833, "step": 17971 }, { "epoch": 0.34, "learning_rate": 3.848691649576723e-06, "loss": 0.9828, "step": 17972 }, { "epoch": 0.34, "learning_rate": 3.848563018394507e-06, "loss": 1.0277, "step": 17973 }, { "epoch": 0.34, "learning_rate": 3.848434382176797e-06, "loss": 0.9207, "step": 17974 }, { "epoch": 0.34, "learning_rate": 3.848305740924074e-06, "loss": 1.1649, "step": 17975 }, { "epoch": 0.34, "learning_rate": 3.848177094636819e-06, "loss": 0.8082, "step": 17976 }, { "epoch": 0.34, "learning_rate": 3.848048443315512e-06, "loss": 0.9436, "step": 17977 }, { "epoch": 0.34, "learning_rate": 3.847919786960633e-06, "loss": 0.9739, "step": 17978 }, { "epoch": 0.34, "learning_rate": 3.8477911255726634e-06, "loss": 0.8226, "step": 17979 }, { "epoch": 0.34, "learning_rate": 3.847662459152084e-06, "loss": 0.8837, "step": 17980 }, { "epoch": 0.34, "learning_rate": 3.847533787699373e-06, "loss": 0.9486, "step": 17981 }, { "epoch": 0.34, "learning_rate": 3.847405111215013e-06, "loss": 1.0524, "step": 17982 }, { "epoch": 0.34, "learning_rate": 3.847276429699483e-06, "loss": 0.7425, "step": 17983 }, { "epoch": 0.34, "learning_rate": 3.847147743153263e-06, "loss": 0.8766, "step": 17984 }, { "epoch": 0.34, "learning_rate": 3.8470190515768366e-06, "loss": 0.9216, "step": 17985 }, { "epoch": 0.34, "learning_rate": 3.846890354970682e-06, "loss": 1.0099, "step": 17986 }, { "epoch": 0.34, "learning_rate": 3.846761653335279e-06, "loss": 0.9719, "step": 17987 }, { "epoch": 0.34, "learning_rate": 3.846632946671111e-06, "loss": 1.1323, "step": 17988 }, { "epoch": 0.34, "learning_rate": 3.846504234978655e-06, "loss": 1.0712, "step": 17989 }, { "epoch": 0.34, "learning_rate": 3.846375518258394e-06, "loss": 1.0088, "step": 17990 }, { "epoch": 0.34, "learning_rate": 3.846246796510809e-06, "loss": 0.7974, "step": 17991 }, { "epoch": 0.34, "learning_rate": 3.84611806973638e-06, "loss": 0.9701, "step": 17992 }, { "epoch": 0.34, "learning_rate": 3.845989337935586e-06, "loss": 1.2633, "step": 17993 }, { "epoch": 0.34, "learning_rate": 3.845860601108909e-06, "loss": 1.1606, "step": 17994 }, { "epoch": 0.34, "learning_rate": 3.845731859256831e-06, "loss": 0.9304, "step": 17995 }, { "epoch": 0.34, "learning_rate": 3.845603112379831e-06, "loss": 0.9612, "step": 17996 }, { "epoch": 0.34, "learning_rate": 3.84547436047839e-06, "loss": 0.886, "step": 17997 }, { "epoch": 0.34, "learning_rate": 3.845345603552989e-06, "loss": 0.827, "step": 17998 }, { "epoch": 0.34, "learning_rate": 3.8452168416041094e-06, "loss": 0.8576, "step": 17999 }, { "epoch": 0.34, "learning_rate": 3.845088074632231e-06, "loss": 1.0361, "step": 18000 }, { "epoch": 0.34, "learning_rate": 3.844959302637835e-06, "loss": 0.7347, "step": 18001 }, { "epoch": 0.34, "learning_rate": 3.844830525621402e-06, "loss": 0.8906, "step": 18002 }, { "epoch": 0.34, "learning_rate": 3.8447017435834125e-06, "loss": 1.091, "step": 18003 }, { "epoch": 0.34, "learning_rate": 3.844572956524348e-06, "loss": 0.8749, "step": 18004 }, { "epoch": 0.34, "learning_rate": 3.84444416444469e-06, "loss": 0.9284, "step": 18005 }, { "epoch": 0.34, "learning_rate": 3.844315367344919e-06, "loss": 1.3192, "step": 18006 }, { "epoch": 0.34, "learning_rate": 3.844186565225515e-06, "loss": 0.8546, "step": 18007 }, { "epoch": 0.34, "learning_rate": 3.844057758086959e-06, "loss": 0.7766, "step": 18008 }, { "epoch": 0.34, "learning_rate": 3.843928945929735e-06, "loss": 0.7968, "step": 18009 }, { "epoch": 0.34, "learning_rate": 3.843800128754319e-06, "loss": 0.8355, "step": 18010 }, { "epoch": 0.34, "learning_rate": 3.843671306561195e-06, "loss": 1.0153, "step": 18011 }, { "epoch": 0.34, "learning_rate": 3.843542479350845e-06, "loss": 1.0081, "step": 18012 }, { "epoch": 0.34, "learning_rate": 3.843413647123747e-06, "loss": 1.1465, "step": 18013 }, { "epoch": 0.34, "learning_rate": 3.8432848098803836e-06, "loss": 0.9083, "step": 18014 }, { "epoch": 0.34, "learning_rate": 3.843155967621237e-06, "loss": 0.9514, "step": 18015 }, { "epoch": 0.34, "learning_rate": 3.843027120346786e-06, "loss": 0.9062, "step": 18016 }, { "epoch": 0.34, "learning_rate": 3.842898268057514e-06, "loss": 0.8736, "step": 18017 }, { "epoch": 0.34, "learning_rate": 3.8427694107539005e-06, "loss": 1.0096, "step": 18018 }, { "epoch": 0.34, "learning_rate": 3.842640548436427e-06, "loss": 1.1863, "step": 18019 }, { "epoch": 0.34, "learning_rate": 3.8425116811055754e-06, "loss": 0.6433, "step": 18020 }, { "epoch": 0.34, "learning_rate": 3.842382808761826e-06, "loss": 0.6657, "step": 18021 }, { "epoch": 0.34, "learning_rate": 3.8422539314056605e-06, "loss": 0.9697, "step": 18022 }, { "epoch": 0.34, "learning_rate": 3.84212504903756e-06, "loss": 0.7254, "step": 18023 }, { "epoch": 0.34, "learning_rate": 3.841996161658005e-06, "loss": 1.0214, "step": 18024 }, { "epoch": 0.34, "learning_rate": 3.841867269267478e-06, "loss": 1.0375, "step": 18025 }, { "epoch": 0.34, "learning_rate": 3.84173837186646e-06, "loss": 0.8658, "step": 18026 }, { "epoch": 0.34, "learning_rate": 3.841609469455432e-06, "loss": 1.0436, "step": 18027 }, { "epoch": 0.34, "learning_rate": 3.841480562034875e-06, "loss": 0.9351, "step": 18028 }, { "epoch": 0.34, "learning_rate": 3.841351649605271e-06, "loss": 0.8859, "step": 18029 }, { "epoch": 0.34, "learning_rate": 3.8412227321671014e-06, "loss": 0.8328, "step": 18030 }, { "epoch": 0.34, "learning_rate": 3.841093809720847e-06, "loss": 0.9933, "step": 18031 }, { "epoch": 0.34, "learning_rate": 3.840964882266989e-06, "loss": 0.9538, "step": 18032 }, { "epoch": 0.34, "learning_rate": 3.84083594980601e-06, "loss": 0.9139, "step": 18033 }, { "epoch": 0.34, "learning_rate": 3.84070701233839e-06, "loss": 0.9685, "step": 18034 }, { "epoch": 0.34, "learning_rate": 3.8405780698646115e-06, "loss": 0.9759, "step": 18035 }, { "epoch": 0.34, "learning_rate": 3.840449122385155e-06, "loss": 0.9596, "step": 18036 }, { "epoch": 0.34, "learning_rate": 3.840320169900503e-06, "loss": 1.175, "step": 18037 }, { "epoch": 0.34, "learning_rate": 3.840191212411137e-06, "loss": 0.9714, "step": 18038 }, { "epoch": 0.34, "learning_rate": 3.840062249917538e-06, "loss": 1.067, "step": 18039 }, { "epoch": 0.34, "learning_rate": 3.8399332824201865e-06, "loss": 0.8555, "step": 18040 }, { "epoch": 0.34, "learning_rate": 3.8398043099195656e-06, "loss": 0.9105, "step": 18041 }, { "epoch": 0.34, "learning_rate": 3.839675332416158e-06, "loss": 0.9199, "step": 18042 }, { "epoch": 0.34, "learning_rate": 3.839546349910442e-06, "loss": 0.9879, "step": 18043 }, { "epoch": 0.34, "learning_rate": 3.8394173624029015e-06, "loss": 1.0568, "step": 18044 }, { "epoch": 0.34, "learning_rate": 3.839288369894019e-06, "loss": 1.0087, "step": 18045 }, { "epoch": 0.34, "learning_rate": 3.839159372384273e-06, "loss": 1.0258, "step": 18046 }, { "epoch": 0.34, "learning_rate": 3.839030369874147e-06, "loss": 1.0043, "step": 18047 }, { "epoch": 0.34, "learning_rate": 3.8389013623641245e-06, "loss": 0.8757, "step": 18048 }, { "epoch": 0.34, "learning_rate": 3.838772349854683e-06, "loss": 1.2073, "step": 18049 }, { "epoch": 0.34, "learning_rate": 3.838643332346308e-06, "loss": 1.1608, "step": 18050 }, { "epoch": 0.34, "learning_rate": 3.838514309839481e-06, "loss": 0.9474, "step": 18051 }, { "epoch": 0.34, "learning_rate": 3.83838528233468e-06, "loss": 1.0461, "step": 18052 }, { "epoch": 0.34, "learning_rate": 3.8382562498323905e-06, "loss": 1.0057, "step": 18053 }, { "epoch": 0.34, "learning_rate": 3.838127212333094e-06, "loss": 0.883, "step": 18054 }, { "epoch": 0.34, "learning_rate": 3.83799816983727e-06, "loss": 1.0578, "step": 18055 }, { "epoch": 0.34, "learning_rate": 3.837869122345403e-06, "loss": 1.3144, "step": 18056 }, { "epoch": 0.34, "learning_rate": 3.837740069857973e-06, "loss": 1.0595, "step": 18057 }, { "epoch": 0.34, "learning_rate": 3.8376110123754635e-06, "loss": 0.8399, "step": 18058 }, { "epoch": 0.34, "learning_rate": 3.837481949898355e-06, "loss": 1.0251, "step": 18059 }, { "epoch": 0.34, "learning_rate": 3.83735288242713e-06, "loss": 0.837, "step": 18060 }, { "epoch": 0.34, "learning_rate": 3.83722380996227e-06, "loss": 1.0444, "step": 18061 }, { "epoch": 0.34, "learning_rate": 3.837094732504257e-06, "loss": 0.8934, "step": 18062 }, { "epoch": 0.34, "learning_rate": 3.836965650053574e-06, "loss": 0.9788, "step": 18063 }, { "epoch": 0.34, "learning_rate": 3.836836562610702e-06, "loss": 0.9256, "step": 18064 }, { "epoch": 0.34, "learning_rate": 3.836707470176123e-06, "loss": 1.0289, "step": 18065 }, { "epoch": 0.34, "learning_rate": 3.83657837275032e-06, "loss": 0.9048, "step": 18066 }, { "epoch": 0.34, "learning_rate": 3.836449270333774e-06, "loss": 0.9927, "step": 18067 }, { "epoch": 0.34, "learning_rate": 3.836320162926967e-06, "loss": 1.1131, "step": 18068 }, { "epoch": 0.34, "learning_rate": 3.836191050530382e-06, "loss": 1.032, "step": 18069 }, { "epoch": 0.34, "learning_rate": 3.836061933144501e-06, "loss": 0.9879, "step": 18070 }, { "epoch": 0.34, "learning_rate": 3.835932810769804e-06, "loss": 0.8571, "step": 18071 }, { "epoch": 0.34, "learning_rate": 3.835803683406776e-06, "loss": 0.8778, "step": 18072 }, { "epoch": 0.34, "learning_rate": 3.835674551055898e-06, "loss": 0.8246, "step": 18073 }, { "epoch": 0.34, "learning_rate": 3.8355454137176515e-06, "loss": 1.1674, "step": 18074 }, { "epoch": 0.34, "learning_rate": 3.83541627139252e-06, "loss": 1.045, "step": 18075 }, { "epoch": 0.34, "learning_rate": 3.8352871240809855e-06, "loss": 0.8532, "step": 18076 }, { "epoch": 0.34, "learning_rate": 3.8351579717835294e-06, "loss": 0.8229, "step": 18077 }, { "epoch": 0.34, "learning_rate": 3.835028814500635e-06, "loss": 1.1003, "step": 18078 }, { "epoch": 0.34, "learning_rate": 3.834899652232783e-06, "loss": 0.6977, "step": 18079 }, { "epoch": 0.34, "learning_rate": 3.834770484980457e-06, "loss": 0.8068, "step": 18080 }, { "epoch": 0.34, "learning_rate": 3.834641312744138e-06, "loss": 1.1344, "step": 18081 }, { "epoch": 0.34, "learning_rate": 3.834512135524311e-06, "loss": 1.0565, "step": 18082 }, { "epoch": 0.34, "learning_rate": 3.834382953321455e-06, "loss": 0.8999, "step": 18083 }, { "epoch": 0.34, "learning_rate": 3.834253766136055e-06, "loss": 0.903, "step": 18084 }, { "epoch": 0.34, "learning_rate": 3.834124573968592e-06, "loss": 1.0118, "step": 18085 }, { "epoch": 0.34, "learning_rate": 3.833995376819549e-06, "loss": 0.8941, "step": 18086 }, { "epoch": 0.34, "learning_rate": 3.833866174689408e-06, "loss": 1.0375, "step": 18087 }, { "epoch": 0.34, "learning_rate": 3.833736967578652e-06, "loss": 0.8913, "step": 18088 }, { "epoch": 0.34, "learning_rate": 3.833607755487762e-06, "loss": 0.9868, "step": 18089 }, { "epoch": 0.34, "learning_rate": 3.833478538417223e-06, "loss": 0.897, "step": 18090 }, { "epoch": 0.34, "learning_rate": 3.833349316367514e-06, "loss": 0.7741, "step": 18091 }, { "epoch": 0.34, "learning_rate": 3.833220089339121e-06, "loss": 0.7945, "step": 18092 }, { "epoch": 0.34, "learning_rate": 3.833090857332525e-06, "loss": 1.1646, "step": 18093 }, { "epoch": 0.34, "learning_rate": 3.832961620348208e-06, "loss": 0.9722, "step": 18094 }, { "epoch": 0.34, "learning_rate": 3.832832378386653e-06, "loss": 0.7379, "step": 18095 }, { "epoch": 0.34, "learning_rate": 3.832703131448344e-06, "loss": 1.0966, "step": 18096 }, { "epoch": 0.34, "learning_rate": 3.832573879533761e-06, "loss": 0.8345, "step": 18097 }, { "epoch": 0.34, "learning_rate": 3.832444622643389e-06, "loss": 0.7418, "step": 18098 }, { "epoch": 0.34, "learning_rate": 3.83231536077771e-06, "loss": 0.8011, "step": 18099 }, { "epoch": 0.34, "learning_rate": 3.832186093937205e-06, "loss": 1.2184, "step": 18100 }, { "epoch": 0.34, "learning_rate": 3.8320568221223586e-06, "loss": 0.9583, "step": 18101 }, { "epoch": 0.34, "learning_rate": 3.831927545333652e-06, "loss": 0.805, "step": 18102 }, { "epoch": 0.34, "learning_rate": 3.83179826357157e-06, "loss": 0.9293, "step": 18103 }, { "epoch": 0.34, "learning_rate": 3.8316689768365935e-06, "loss": 0.9337, "step": 18104 }, { "epoch": 0.34, "learning_rate": 3.831539685129207e-06, "loss": 1.0492, "step": 18105 }, { "epoch": 0.34, "learning_rate": 3.831410388449891e-06, "loss": 1.1408, "step": 18106 }, { "epoch": 0.34, "learning_rate": 3.831281086799129e-06, "loss": 0.9394, "step": 18107 }, { "epoch": 0.34, "learning_rate": 3.831151780177406e-06, "loss": 0.9656, "step": 18108 }, { "epoch": 0.34, "learning_rate": 3.8310224685852015e-06, "loss": 1.0296, "step": 18109 }, { "epoch": 0.34, "learning_rate": 3.830893152023e-06, "loss": 0.8821, "step": 18110 }, { "epoch": 0.34, "learning_rate": 3.830763830491285e-06, "loss": 1.0089, "step": 18111 }, { "epoch": 0.34, "learning_rate": 3.830634503990539e-06, "loss": 1.0054, "step": 18112 }, { "epoch": 0.34, "learning_rate": 3.8305051725212435e-06, "loss": 1.14, "step": 18113 }, { "epoch": 0.34, "learning_rate": 3.830375836083883e-06, "loss": 0.9, "step": 18114 }, { "epoch": 0.34, "learning_rate": 3.83024649467894e-06, "loss": 0.8772, "step": 18115 }, { "epoch": 0.34, "learning_rate": 3.830117148306897e-06, "loss": 0.9216, "step": 18116 }, { "epoch": 0.34, "learning_rate": 3.829987796968237e-06, "loss": 0.7792, "step": 18117 }, { "epoch": 0.34, "learning_rate": 3.829858440663444e-06, "loss": 1.119, "step": 18118 }, { "epoch": 0.34, "learning_rate": 3.829729079393e-06, "loss": 1.0728, "step": 18119 }, { "epoch": 0.34, "learning_rate": 3.82959971315739e-06, "loss": 1.0098, "step": 18120 }, { "epoch": 0.34, "learning_rate": 3.829470341957092e-06, "loss": 0.8506, "step": 18121 }, { "epoch": 0.34, "learning_rate": 3.829340965792595e-06, "loss": 0.86, "step": 18122 }, { "epoch": 0.34, "learning_rate": 3.82921158466438e-06, "loss": 1.0542, "step": 18123 }, { "epoch": 0.34, "learning_rate": 3.829082198572928e-06, "loss": 1.1245, "step": 18124 }, { "epoch": 0.34, "learning_rate": 3.828952807518725e-06, "loss": 1.2166, "step": 18125 }, { "epoch": 0.34, "learning_rate": 3.828823411502252e-06, "loss": 1.1163, "step": 18126 }, { "epoch": 0.34, "learning_rate": 3.8286940105239944e-06, "loss": 0.9624, "step": 18127 }, { "epoch": 0.34, "learning_rate": 3.828564604584433e-06, "loss": 0.8432, "step": 18128 }, { "epoch": 0.34, "learning_rate": 3.8284351936840525e-06, "loss": 0.7845, "step": 18129 }, { "epoch": 0.34, "learning_rate": 3.828305777823336e-06, "loss": 1.0762, "step": 18130 }, { "epoch": 0.34, "learning_rate": 3.828176357002766e-06, "loss": 1.2299, "step": 18131 }, { "epoch": 0.34, "learning_rate": 3.828046931222827e-06, "loss": 1.0884, "step": 18132 }, { "epoch": 0.34, "learning_rate": 3.827917500484001e-06, "loss": 0.8965, "step": 18133 }, { "epoch": 0.34, "learning_rate": 3.8277880647867715e-06, "loss": 0.7286, "step": 18134 }, { "epoch": 0.34, "learning_rate": 3.827658624131623e-06, "loss": 0.8359, "step": 18135 }, { "epoch": 0.34, "learning_rate": 3.827529178519036e-06, "loss": 0.9382, "step": 18136 }, { "epoch": 0.34, "learning_rate": 3.827399727949497e-06, "loss": 1.0335, "step": 18137 }, { "epoch": 0.34, "learning_rate": 3.827270272423488e-06, "loss": 1.1307, "step": 18138 }, { "epoch": 0.34, "learning_rate": 3.8271408119414925e-06, "loss": 0.7706, "step": 18139 }, { "epoch": 0.34, "learning_rate": 3.827011346503994e-06, "loss": 0.8159, "step": 18140 }, { "epoch": 0.34, "learning_rate": 3.826881876111476e-06, "loss": 1.1418, "step": 18141 }, { "epoch": 0.34, "learning_rate": 3.8267524007644215e-06, "loss": 0.7863, "step": 18142 }, { "epoch": 0.34, "learning_rate": 3.826622920463314e-06, "loss": 0.9076, "step": 18143 }, { "epoch": 0.34, "learning_rate": 3.826493435208637e-06, "loss": 1.0004, "step": 18144 }, { "epoch": 0.34, "learning_rate": 3.826363945000875e-06, "loss": 0.9731, "step": 18145 }, { "epoch": 0.34, "learning_rate": 3.82623444984051e-06, "loss": 0.9703, "step": 18146 }, { "epoch": 0.34, "learning_rate": 3.826104949728027e-06, "loss": 0.9584, "step": 18147 }, { "epoch": 0.34, "learning_rate": 3.825975444663908e-06, "loss": 0.8657, "step": 18148 }, { "epoch": 0.34, "learning_rate": 3.825845934648637e-06, "loss": 0.8405, "step": 18149 }, { "epoch": 0.34, "learning_rate": 3.825716419682699e-06, "loss": 1.0627, "step": 18150 }, { "epoch": 0.34, "learning_rate": 3.825586899766576e-06, "loss": 0.7943, "step": 18151 }, { "epoch": 0.34, "learning_rate": 3.825457374900753e-06, "loss": 1.0057, "step": 18152 }, { "epoch": 0.34, "learning_rate": 3.825327845085711e-06, "loss": 0.7255, "step": 18153 }, { "epoch": 0.34, "learning_rate": 3.825198310321937e-06, "loss": 0.9042, "step": 18154 }, { "epoch": 0.34, "learning_rate": 3.825068770609913e-06, "loss": 0.9417, "step": 18155 }, { "epoch": 0.34, "learning_rate": 3.824939225950123e-06, "loss": 1.0596, "step": 18156 }, { "epoch": 0.34, "learning_rate": 3.8248096763430485e-06, "loss": 0.9189, "step": 18157 }, { "epoch": 0.34, "learning_rate": 3.824680121789177e-06, "loss": 0.8405, "step": 18158 }, { "epoch": 0.34, "learning_rate": 3.824550562288991e-06, "loss": 0.8976, "step": 18159 }, { "epoch": 0.34, "learning_rate": 3.824420997842973e-06, "loss": 0.8755, "step": 18160 }, { "epoch": 0.34, "learning_rate": 3.824291428451608e-06, "loss": 0.9148, "step": 18161 }, { "epoch": 0.34, "learning_rate": 3.824161854115379e-06, "loss": 0.9709, "step": 18162 }, { "epoch": 0.34, "learning_rate": 3.8240322748347706e-06, "loss": 0.9051, "step": 18163 }, { "epoch": 0.34, "learning_rate": 3.823902690610266e-06, "loss": 0.863, "step": 18164 }, { "epoch": 0.34, "learning_rate": 3.82377310144235e-06, "loss": 0.9678, "step": 18165 }, { "epoch": 0.34, "learning_rate": 3.823643507331505e-06, "loss": 0.77, "step": 18166 }, { "epoch": 0.34, "learning_rate": 3.8235139082782155e-06, "loss": 0.9299, "step": 18167 }, { "epoch": 0.34, "learning_rate": 3.823384304282967e-06, "loss": 1.1458, "step": 18168 }, { "epoch": 0.34, "learning_rate": 3.823254695346241e-06, "loss": 1.0482, "step": 18169 }, { "epoch": 0.34, "learning_rate": 3.823125081468522e-06, "loss": 1.0555, "step": 18170 }, { "epoch": 0.34, "learning_rate": 3.8229954626502955e-06, "loss": 0.8951, "step": 18171 }, { "epoch": 0.34, "learning_rate": 3.8228658388920445e-06, "loss": 0.9545, "step": 18172 }, { "epoch": 0.34, "learning_rate": 3.822736210194253e-06, "loss": 0.9155, "step": 18173 }, { "epoch": 0.34, "learning_rate": 3.822606576557405e-06, "loss": 0.8277, "step": 18174 }, { "epoch": 0.34, "learning_rate": 3.822476937981985e-06, "loss": 1.1314, "step": 18175 }, { "epoch": 0.34, "learning_rate": 3.822347294468476e-06, "loss": 1.1698, "step": 18176 }, { "epoch": 0.34, "learning_rate": 3.822217646017362e-06, "loss": 0.9738, "step": 18177 }, { "epoch": 0.34, "learning_rate": 3.8220879926291285e-06, "loss": 0.9966, "step": 18178 }, { "epoch": 0.34, "learning_rate": 3.82195833430426e-06, "loss": 0.7255, "step": 18179 }, { "epoch": 0.34, "learning_rate": 3.821828671043238e-06, "loss": 0.9583, "step": 18180 }, { "epoch": 0.34, "learning_rate": 3.82169900284655e-06, "loss": 0.9102, "step": 18181 }, { "epoch": 0.34, "learning_rate": 3.821569329714677e-06, "loss": 1.0558, "step": 18182 }, { "epoch": 0.34, "learning_rate": 3.821439651648106e-06, "loss": 1.0595, "step": 18183 }, { "epoch": 0.34, "learning_rate": 3.8213099686473186e-06, "loss": 0.8572, "step": 18184 }, { "epoch": 0.34, "learning_rate": 3.821180280712801e-06, "loss": 0.8446, "step": 18185 }, { "epoch": 0.34, "learning_rate": 3.821050587845036e-06, "loss": 0.9694, "step": 18186 }, { "epoch": 0.34, "learning_rate": 3.8209208900445085e-06, "loss": 0.9486, "step": 18187 }, { "epoch": 0.34, "learning_rate": 3.820791187311704e-06, "loss": 0.8648, "step": 18188 }, { "epoch": 0.34, "learning_rate": 3.8206614796471055e-06, "loss": 0.9537, "step": 18189 }, { "epoch": 0.34, "learning_rate": 3.820531767051196e-06, "loss": 0.8372, "step": 18190 }, { "epoch": 0.34, "learning_rate": 3.820402049524463e-06, "loss": 1.02, "step": 18191 }, { "epoch": 0.34, "learning_rate": 3.820272327067389e-06, "loss": 0.8162, "step": 18192 }, { "epoch": 0.34, "learning_rate": 3.820142599680458e-06, "loss": 0.9208, "step": 18193 }, { "epoch": 0.34, "learning_rate": 3.820012867364156e-06, "loss": 0.9933, "step": 18194 }, { "epoch": 0.34, "learning_rate": 3.819883130118965e-06, "loss": 1.0389, "step": 18195 }, { "epoch": 0.34, "learning_rate": 3.819753387945372e-06, "loss": 0.9341, "step": 18196 }, { "epoch": 0.34, "learning_rate": 3.81962364084386e-06, "loss": 0.9608, "step": 18197 }, { "epoch": 0.34, "learning_rate": 3.819493888814915e-06, "loss": 0.7591, "step": 18198 }, { "epoch": 0.34, "learning_rate": 3.819364131859018e-06, "loss": 0.8153, "step": 18199 }, { "epoch": 0.34, "learning_rate": 3.819234369976657e-06, "loss": 1.0863, "step": 18200 }, { "epoch": 0.34, "learning_rate": 3.819104603168315e-06, "loss": 0.9871, "step": 18201 }, { "epoch": 0.34, "learning_rate": 3.818974831434477e-06, "loss": 0.7653, "step": 18202 }, { "epoch": 0.34, "learning_rate": 3.818845054775628e-06, "loss": 0.825, "step": 18203 }, { "epoch": 0.34, "learning_rate": 3.818715273192251e-06, "loss": 0.9144, "step": 18204 }, { "epoch": 0.34, "learning_rate": 3.818585486684832e-06, "loss": 0.81, "step": 18205 }, { "epoch": 0.34, "learning_rate": 3.818455695253856e-06, "loss": 1.0825, "step": 18206 }, { "epoch": 0.34, "learning_rate": 3.818325898899805e-06, "loss": 0.8122, "step": 18207 }, { "epoch": 0.34, "learning_rate": 3.818196097623167e-06, "loss": 0.9957, "step": 18208 }, { "epoch": 0.34, "learning_rate": 3.818066291424425e-06, "loss": 0.8115, "step": 18209 }, { "epoch": 0.34, "learning_rate": 3.817936480304064e-06, "loss": 0.7945, "step": 18210 }, { "epoch": 0.34, "learning_rate": 3.817806664262568e-06, "loss": 0.9926, "step": 18211 }, { "epoch": 0.34, "learning_rate": 3.817676843300422e-06, "loss": 1.0356, "step": 18212 }, { "epoch": 0.34, "learning_rate": 3.8175470174181125e-06, "loss": 1.017, "step": 18213 }, { "epoch": 0.34, "learning_rate": 3.817417186616121e-06, "loss": 0.9454, "step": 18214 }, { "epoch": 0.34, "learning_rate": 3.817287350894936e-06, "loss": 1.0317, "step": 18215 }, { "epoch": 0.34, "learning_rate": 3.81715751025504e-06, "loss": 1.016, "step": 18216 }, { "epoch": 0.34, "learning_rate": 3.817027664696917e-06, "loss": 0.8301, "step": 18217 }, { "epoch": 0.34, "learning_rate": 3.816897814221054e-06, "loss": 0.8896, "step": 18218 }, { "epoch": 0.34, "learning_rate": 3.8167679588279345e-06, "loss": 1.246, "step": 18219 }, { "epoch": 0.34, "learning_rate": 3.816638098518044e-06, "loss": 0.9196, "step": 18220 }, { "epoch": 0.34, "learning_rate": 3.8165082332918676e-06, "loss": 0.8605, "step": 18221 }, { "epoch": 0.34, "learning_rate": 3.816378363149889e-06, "loss": 1.0341, "step": 18222 }, { "epoch": 0.34, "learning_rate": 3.816248488092596e-06, "loss": 0.775, "step": 18223 }, { "epoch": 0.34, "learning_rate": 3.81611860812047e-06, "loss": 1.2519, "step": 18224 }, { "epoch": 0.34, "learning_rate": 3.815988723233997e-06, "loss": 1.1877, "step": 18225 }, { "epoch": 0.34, "learning_rate": 3.815858833433663e-06, "loss": 0.9254, "step": 18226 }, { "epoch": 0.34, "learning_rate": 3.815728938719953e-06, "loss": 0.9238, "step": 18227 }, { "epoch": 0.34, "learning_rate": 3.815599039093351e-06, "loss": 0.8788, "step": 18228 }, { "epoch": 0.34, "learning_rate": 3.815469134554342e-06, "loss": 0.8327, "step": 18229 }, { "epoch": 0.34, "learning_rate": 3.815339225103412e-06, "loss": 0.7287, "step": 18230 }, { "epoch": 0.34, "learning_rate": 3.815209310741045e-06, "loss": 1.0148, "step": 18231 }, { "epoch": 0.34, "learning_rate": 3.815079391467728e-06, "loss": 0.9467, "step": 18232 }, { "epoch": 0.34, "learning_rate": 3.814949467283944e-06, "loss": 0.9716, "step": 18233 }, { "epoch": 0.34, "learning_rate": 3.814819538190179e-06, "loss": 0.768, "step": 18234 }, { "epoch": 0.34, "learning_rate": 3.8146896041869186e-06, "loss": 0.7701, "step": 18235 }, { "epoch": 0.34, "learning_rate": 3.8145596652746475e-06, "loss": 0.8513, "step": 18236 }, { "epoch": 0.34, "learning_rate": 3.8144297214538512e-06, "loss": 0.9769, "step": 18237 }, { "epoch": 0.34, "learning_rate": 3.814299772725014e-06, "loss": 0.8939, "step": 18238 }, { "epoch": 0.34, "learning_rate": 3.8141698190886222e-06, "loss": 0.9021, "step": 18239 }, { "epoch": 0.34, "learning_rate": 3.81403986054516e-06, "loss": 0.8376, "step": 18240 }, { "epoch": 0.34, "learning_rate": 3.813909897095114e-06, "loss": 0.9571, "step": 18241 }, { "epoch": 0.34, "learning_rate": 3.8137799287389683e-06, "loss": 1.1541, "step": 18242 }, { "epoch": 0.34, "learning_rate": 3.813649955477209e-06, "loss": 0.9459, "step": 18243 }, { "epoch": 0.34, "learning_rate": 3.8135199773103206e-06, "loss": 1.0605, "step": 18244 }, { "epoch": 0.34, "learning_rate": 3.8133899942387884e-06, "loss": 0.9597, "step": 18245 }, { "epoch": 0.34, "learning_rate": 3.8132600062630994e-06, "loss": 0.9516, "step": 18246 }, { "epoch": 0.34, "learning_rate": 3.8131300133837367e-06, "loss": 0.728, "step": 18247 }, { "epoch": 0.34, "learning_rate": 3.8130000156011875e-06, "loss": 0.9185, "step": 18248 }, { "epoch": 0.34, "learning_rate": 3.812870012915936e-06, "loss": 1.0734, "step": 18249 }, { "epoch": 0.34, "learning_rate": 3.8127400053284693e-06, "loss": 1.0551, "step": 18250 }, { "epoch": 0.34, "learning_rate": 3.8126099928392703e-06, "loss": 0.7187, "step": 18251 }, { "epoch": 0.34, "learning_rate": 3.812479975448826e-06, "loss": 0.7416, "step": 18252 }, { "epoch": 0.34, "learning_rate": 3.8123499531576224e-06, "loss": 0.809, "step": 18253 }, { "epoch": 0.34, "learning_rate": 3.8122199259661443e-06, "loss": 0.9062, "step": 18254 }, { "epoch": 0.34, "learning_rate": 3.812089893874876e-06, "loss": 0.9205, "step": 18255 }, { "epoch": 0.34, "learning_rate": 3.811959856884306e-06, "loss": 1.1931, "step": 18256 }, { "epoch": 0.34, "learning_rate": 3.8118298149949173e-06, "loss": 0.9555, "step": 18257 }, { "epoch": 0.34, "learning_rate": 3.811699768207196e-06, "loss": 0.7611, "step": 18258 }, { "epoch": 0.34, "learning_rate": 3.8115697165216286e-06, "loss": 0.9378, "step": 18259 }, { "epoch": 0.34, "learning_rate": 3.8114396599386993e-06, "loss": 0.884, "step": 18260 }, { "epoch": 0.34, "learning_rate": 3.8113095984588955e-06, "loss": 0.9502, "step": 18261 }, { "epoch": 0.34, "learning_rate": 3.8111795320827012e-06, "loss": 1.0762, "step": 18262 }, { "epoch": 0.34, "learning_rate": 3.811049460810603e-06, "loss": 1.171, "step": 18263 }, { "epoch": 0.34, "learning_rate": 3.810919384643086e-06, "loss": 0.9797, "step": 18264 }, { "epoch": 0.34, "learning_rate": 3.8107893035806363e-06, "loss": 0.6762, "step": 18265 }, { "epoch": 0.34, "learning_rate": 3.81065921762374e-06, "loss": 0.9312, "step": 18266 }, { "epoch": 0.34, "learning_rate": 3.8105291267728817e-06, "loss": 0.8131, "step": 18267 }, { "epoch": 0.34, "learning_rate": 3.8103990310285475e-06, "loss": 1.0447, "step": 18268 }, { "epoch": 0.34, "learning_rate": 3.8102689303912245e-06, "loss": 0.8152, "step": 18269 }, { "epoch": 0.34, "learning_rate": 3.810138824861397e-06, "loss": 0.9102, "step": 18270 }, { "epoch": 0.34, "learning_rate": 3.8100087144395517e-06, "loss": 1.0266, "step": 18271 }, { "epoch": 0.34, "learning_rate": 3.8098785991261733e-06, "loss": 0.9823, "step": 18272 }, { "epoch": 0.34, "learning_rate": 3.809748478921749e-06, "loss": 0.8704, "step": 18273 }, { "epoch": 0.34, "learning_rate": 3.8096183538267638e-06, "loss": 1.0898, "step": 18274 }, { "epoch": 0.34, "learning_rate": 3.8094882238417037e-06, "loss": 1.0818, "step": 18275 }, { "epoch": 0.34, "learning_rate": 3.8093580889670545e-06, "loss": 1.0547, "step": 18276 }, { "epoch": 0.34, "learning_rate": 3.8092279492033035e-06, "loss": 0.8821, "step": 18277 }, { "epoch": 0.34, "learning_rate": 3.809097804550934e-06, "loss": 0.9229, "step": 18278 }, { "epoch": 0.34, "learning_rate": 3.808967655010435e-06, "loss": 0.9037, "step": 18279 }, { "epoch": 0.34, "learning_rate": 3.8088375005822898e-06, "loss": 0.9391, "step": 18280 }, { "epoch": 0.34, "learning_rate": 3.808707341266986e-06, "loss": 1.2322, "step": 18281 }, { "epoch": 0.34, "learning_rate": 3.808577177065008e-06, "loss": 1.0474, "step": 18282 }, { "epoch": 0.34, "learning_rate": 3.8084470079768443e-06, "loss": 0.8871, "step": 18283 }, { "epoch": 0.34, "learning_rate": 3.8083168340029785e-06, "loss": 0.9047, "step": 18284 }, { "epoch": 0.34, "learning_rate": 3.8081866551438984e-06, "loss": 0.8646, "step": 18285 }, { "epoch": 0.34, "learning_rate": 3.80805647140009e-06, "loss": 0.9015, "step": 18286 }, { "epoch": 0.35, "learning_rate": 3.807926282772038e-06, "loss": 1.0209, "step": 18287 }, { "epoch": 0.35, "learning_rate": 3.8077960892602296e-06, "loss": 0.9774, "step": 18288 }, { "epoch": 0.35, "learning_rate": 3.807665890865151e-06, "loss": 0.9388, "step": 18289 }, { "epoch": 0.35, "learning_rate": 3.8075356875872873e-06, "loss": 0.9578, "step": 18290 }, { "epoch": 0.35, "learning_rate": 3.807405479427126e-06, "loss": 1.1773, "step": 18291 }, { "epoch": 0.35, "learning_rate": 3.8072752663851533e-06, "loss": 0.8954, "step": 18292 }, { "epoch": 0.35, "learning_rate": 3.8071450484618535e-06, "loss": 1.0433, "step": 18293 }, { "epoch": 0.35, "learning_rate": 3.8070148256577143e-06, "loss": 1.0255, "step": 18294 }, { "epoch": 0.35, "learning_rate": 3.806884597973223e-06, "loss": 1.0738, "step": 18295 }, { "epoch": 0.35, "learning_rate": 3.8067543654088633e-06, "loss": 0.845, "step": 18296 }, { "epoch": 0.35, "learning_rate": 3.806624127965124e-06, "loss": 0.6967, "step": 18297 }, { "epoch": 0.35, "learning_rate": 3.80649388564249e-06, "loss": 0.8593, "step": 18298 }, { "epoch": 0.35, "learning_rate": 3.8063636384414474e-06, "loss": 1.0139, "step": 18299 }, { "epoch": 0.35, "learning_rate": 3.8062333863624834e-06, "loss": 1.0648, "step": 18300 }, { "epoch": 0.35, "learning_rate": 3.8061031294060846e-06, "loss": 0.8999, "step": 18301 }, { "epoch": 0.35, "learning_rate": 3.8059728675727357e-06, "loss": 0.8763, "step": 18302 }, { "epoch": 0.35, "learning_rate": 3.8058426008629246e-06, "loss": 0.9686, "step": 18303 }, { "epoch": 0.35, "learning_rate": 3.805712329277137e-06, "loss": 0.7881, "step": 18304 }, { "epoch": 0.35, "learning_rate": 3.8055820528158593e-06, "loss": 0.8209, "step": 18305 }, { "epoch": 0.35, "learning_rate": 3.805451771479579e-06, "loss": 1.0286, "step": 18306 }, { "epoch": 0.35, "learning_rate": 3.805321485268782e-06, "loss": 0.8712, "step": 18307 }, { "epoch": 0.35, "learning_rate": 3.8051911941839544e-06, "loss": 0.868, "step": 18308 }, { "epoch": 0.35, "learning_rate": 3.8050608982255823e-06, "loss": 0.9474, "step": 18309 }, { "epoch": 0.35, "learning_rate": 3.804930597394153e-06, "loss": 0.7838, "step": 18310 }, { "epoch": 0.35, "learning_rate": 3.8048002916901526e-06, "loss": 0.8907, "step": 18311 }, { "epoch": 0.35, "learning_rate": 3.8046699811140687e-06, "loss": 1.0568, "step": 18312 }, { "epoch": 0.35, "learning_rate": 3.804539665666387e-06, "loss": 0.8161, "step": 18313 }, { "epoch": 0.35, "learning_rate": 3.804409345347594e-06, "loss": 0.9342, "step": 18314 }, { "epoch": 0.35, "learning_rate": 3.8042790201581765e-06, "loss": 0.8957, "step": 18315 }, { "epoch": 0.35, "learning_rate": 3.8041486900986213e-06, "loss": 0.9464, "step": 18316 }, { "epoch": 0.35, "learning_rate": 3.8040183551694143e-06, "loss": 0.8753, "step": 18317 }, { "epoch": 0.35, "learning_rate": 3.8038880153710427e-06, "loss": 1.1265, "step": 18318 }, { "epoch": 0.35, "learning_rate": 3.803757670703994e-06, "loss": 1.0259, "step": 18319 }, { "epoch": 0.35, "learning_rate": 3.8036273211687537e-06, "loss": 0.8644, "step": 18320 }, { "epoch": 0.35, "learning_rate": 3.8034969667658087e-06, "loss": 0.8555, "step": 18321 }, { "epoch": 0.35, "learning_rate": 3.8033666074956464e-06, "loss": 0.8075, "step": 18322 }, { "epoch": 0.35, "learning_rate": 3.8032362433587533e-06, "loss": 0.7267, "step": 18323 }, { "epoch": 0.35, "learning_rate": 3.8031058743556158e-06, "loss": 0.955, "step": 18324 }, { "epoch": 0.35, "learning_rate": 3.8029755004867207e-06, "loss": 0.9191, "step": 18325 }, { "epoch": 0.35, "learning_rate": 3.8028451217525552e-06, "loss": 1.1101, "step": 18326 }, { "epoch": 0.35, "learning_rate": 3.8027147381536055e-06, "loss": 1.0617, "step": 18327 }, { "epoch": 0.35, "learning_rate": 3.8025843496903603e-06, "loss": 1.044, "step": 18328 }, { "epoch": 0.35, "learning_rate": 3.802453956363304e-06, "loss": 0.8698, "step": 18329 }, { "epoch": 0.35, "learning_rate": 3.8023235581729244e-06, "loss": 1.0729, "step": 18330 }, { "epoch": 0.35, "learning_rate": 3.8021931551197087e-06, "loss": 0.988, "step": 18331 }, { "epoch": 0.35, "learning_rate": 3.802062747204144e-06, "loss": 0.8138, "step": 18332 }, { "epoch": 0.35, "learning_rate": 3.8019323344267167e-06, "loss": 0.9623, "step": 18333 }, { "epoch": 0.35, "learning_rate": 3.801801916787915e-06, "loss": 1.1096, "step": 18334 }, { "epoch": 0.35, "learning_rate": 3.801671494288224e-06, "loss": 0.7004, "step": 18335 }, { "epoch": 0.35, "learning_rate": 3.8015410669281305e-06, "loss": 0.7267, "step": 18336 }, { "epoch": 0.35, "learning_rate": 3.801410634708124e-06, "loss": 1.0514, "step": 18337 }, { "epoch": 0.35, "learning_rate": 3.8012801976286894e-06, "loss": 0.972, "step": 18338 }, { "epoch": 0.35, "learning_rate": 3.801149755690314e-06, "loss": 0.9488, "step": 18339 }, { "epoch": 0.35, "learning_rate": 3.8010193088934866e-06, "loss": 0.8044, "step": 18340 }, { "epoch": 0.35, "learning_rate": 3.8008888572386926e-06, "loss": 0.7693, "step": 18341 }, { "epoch": 0.35, "learning_rate": 3.8007584007264192e-06, "loss": 0.741, "step": 18342 }, { "epoch": 0.35, "learning_rate": 3.8006279393571543e-06, "loss": 0.9718, "step": 18343 }, { "epoch": 0.35, "learning_rate": 3.8004974731313836e-06, "loss": 0.8913, "step": 18344 }, { "epoch": 0.35, "learning_rate": 3.8003670020495963e-06, "loss": 0.9723, "step": 18345 }, { "epoch": 0.35, "learning_rate": 3.8002365261122774e-06, "loss": 1.0092, "step": 18346 }, { "epoch": 0.35, "learning_rate": 3.8001060453199155e-06, "loss": 0.8755, "step": 18347 }, { "epoch": 0.35, "learning_rate": 3.799975559672998e-06, "loss": 0.8265, "step": 18348 }, { "epoch": 0.35, "learning_rate": 3.799845069172012e-06, "loss": 1.2231, "step": 18349 }, { "epoch": 0.35, "learning_rate": 3.7997145738174436e-06, "loss": 0.8533, "step": 18350 }, { "epoch": 0.35, "learning_rate": 3.7995840736097804e-06, "loss": 0.8191, "step": 18351 }, { "epoch": 0.35, "learning_rate": 3.7994535685495104e-06, "loss": 0.9146, "step": 18352 }, { "epoch": 0.35, "learning_rate": 3.799323058637121e-06, "loss": 1.0735, "step": 18353 }, { "epoch": 0.35, "learning_rate": 3.7991925438730993e-06, "loss": 1.0381, "step": 18354 }, { "epoch": 0.35, "learning_rate": 3.799062024257932e-06, "loss": 1.1745, "step": 18355 }, { "epoch": 0.35, "learning_rate": 3.7989314997921073e-06, "loss": 1.1184, "step": 18356 }, { "epoch": 0.35, "learning_rate": 3.798800970476112e-06, "loss": 1.0505, "step": 18357 }, { "epoch": 0.35, "learning_rate": 3.798670436310434e-06, "loss": 0.9164, "step": 18358 }, { "epoch": 0.35, "learning_rate": 3.7985398972955594e-06, "loss": 0.9132, "step": 18359 }, { "epoch": 0.35, "learning_rate": 3.7984093534319778e-06, "loss": 0.9061, "step": 18360 }, { "epoch": 0.35, "learning_rate": 3.798278804720175e-06, "loss": 1.0668, "step": 18361 }, { "epoch": 0.35, "learning_rate": 3.798148251160639e-06, "loss": 0.966, "step": 18362 }, { "epoch": 0.35, "learning_rate": 3.798017692753857e-06, "loss": 1.1274, "step": 18363 }, { "epoch": 0.35, "learning_rate": 3.7978871295003173e-06, "loss": 0.9384, "step": 18364 }, { "epoch": 0.35, "learning_rate": 3.797756561400506e-06, "loss": 0.886, "step": 18365 }, { "epoch": 0.35, "learning_rate": 3.7976259884549123e-06, "loss": 0.8246, "step": 18366 }, { "epoch": 0.35, "learning_rate": 3.7974954106640227e-06, "loss": 0.9058, "step": 18367 }, { "epoch": 0.35, "learning_rate": 3.797364828028325e-06, "loss": 1.0784, "step": 18368 }, { "epoch": 0.35, "learning_rate": 3.7972342405483064e-06, "loss": 1.0381, "step": 18369 }, { "epoch": 0.35, "learning_rate": 3.7971036482244554e-06, "loss": 0.9067, "step": 18370 }, { "epoch": 0.35, "learning_rate": 3.796973051057259e-06, "loss": 0.8921, "step": 18371 }, { "epoch": 0.35, "learning_rate": 3.796842449047205e-06, "loss": 0.6945, "step": 18372 }, { "epoch": 0.35, "learning_rate": 3.796711842194781e-06, "loss": 0.8471, "step": 18373 }, { "epoch": 0.35, "learning_rate": 3.7965812305004746e-06, "loss": 0.9184, "step": 18374 }, { "epoch": 0.35, "learning_rate": 3.7964506139647746e-06, "loss": 1.1794, "step": 18375 }, { "epoch": 0.35, "learning_rate": 3.7963199925881666e-06, "loss": 0.838, "step": 18376 }, { "epoch": 0.35, "learning_rate": 3.79618936637114e-06, "loss": 1.0463, "step": 18377 }, { "epoch": 0.35, "learning_rate": 3.796058735314182e-06, "loss": 0.9343, "step": 18378 }, { "epoch": 0.35, "learning_rate": 3.7959280994177807e-06, "loss": 0.821, "step": 18379 }, { "epoch": 0.35, "learning_rate": 3.7957974586824227e-06, "loss": 0.9735, "step": 18380 }, { "epoch": 0.35, "learning_rate": 3.7956668131085974e-06, "loss": 1.1315, "step": 18381 }, { "epoch": 0.35, "learning_rate": 3.7955361626967918e-06, "loss": 0.8602, "step": 18382 }, { "epoch": 0.35, "learning_rate": 3.7954055074474937e-06, "loss": 0.7116, "step": 18383 }, { "epoch": 0.35, "learning_rate": 3.795274847361192e-06, "loss": 1.0423, "step": 18384 }, { "epoch": 0.35, "learning_rate": 3.795144182438373e-06, "loss": 0.8306, "step": 18385 }, { "epoch": 0.35, "learning_rate": 3.795013512679525e-06, "loss": 0.706, "step": 18386 }, { "epoch": 0.35, "learning_rate": 3.794882838085137e-06, "loss": 1.0431, "step": 18387 }, { "epoch": 0.35, "learning_rate": 3.7947521586556958e-06, "loss": 1.0353, "step": 18388 }, { "epoch": 0.35, "learning_rate": 3.79462147439169e-06, "loss": 0.8216, "step": 18389 }, { "epoch": 0.35, "learning_rate": 3.7944907852936076e-06, "loss": 0.9491, "step": 18390 }, { "epoch": 0.35, "learning_rate": 3.7943600913619357e-06, "loss": 0.8071, "step": 18391 }, { "epoch": 0.35, "learning_rate": 3.794229392597163e-06, "loss": 0.8542, "step": 18392 }, { "epoch": 0.35, "learning_rate": 3.7940986889997773e-06, "loss": 1.0891, "step": 18393 }, { "epoch": 0.35, "learning_rate": 3.7939679805702665e-06, "loss": 1.0251, "step": 18394 }, { "epoch": 0.35, "learning_rate": 3.7938372673091194e-06, "loss": 0.6955, "step": 18395 }, { "epoch": 0.35, "learning_rate": 3.793706549216824e-06, "loss": 1.0483, "step": 18396 }, { "epoch": 0.35, "learning_rate": 3.7935758262938672e-06, "loss": 0.8494, "step": 18397 }, { "epoch": 0.35, "learning_rate": 3.793445098540739e-06, "loss": 0.9573, "step": 18398 }, { "epoch": 0.35, "learning_rate": 3.7933143659579257e-06, "loss": 0.9585, "step": 18399 }, { "epoch": 0.35, "learning_rate": 3.793183628545916e-06, "loss": 1.108, "step": 18400 }, { "epoch": 0.35, "learning_rate": 3.7930528863051984e-06, "loss": 1.0005, "step": 18401 }, { "epoch": 0.35, "learning_rate": 3.7929221392362613e-06, "loss": 1.0406, "step": 18402 }, { "epoch": 0.35, "learning_rate": 3.7927913873395926e-06, "loss": 0.9835, "step": 18403 }, { "epoch": 0.35, "learning_rate": 3.7926606306156797e-06, "loss": 0.7694, "step": 18404 }, { "epoch": 0.35, "learning_rate": 3.792529869065013e-06, "loss": 1.0623, "step": 18405 }, { "epoch": 0.35, "learning_rate": 3.7923991026880786e-06, "loss": 1.0761, "step": 18406 }, { "epoch": 0.35, "learning_rate": 3.792268331485366e-06, "loss": 1.1622, "step": 18407 }, { "epoch": 0.35, "learning_rate": 3.7921375554573627e-06, "loss": 0.8153, "step": 18408 }, { "epoch": 0.35, "learning_rate": 3.7920067746045567e-06, "loss": 0.8425, "step": 18409 }, { "epoch": 0.35, "learning_rate": 3.7918759889274378e-06, "loss": 0.9403, "step": 18410 }, { "epoch": 0.35, "learning_rate": 3.791745198426494e-06, "loss": 0.8539, "step": 18411 }, { "epoch": 0.35, "learning_rate": 3.7916144031022124e-06, "loss": 0.8847, "step": 18412 }, { "epoch": 0.35, "learning_rate": 3.7914836029550826e-06, "loss": 0.8843, "step": 18413 }, { "epoch": 0.35, "learning_rate": 3.7913527979855923e-06, "loss": 0.8119, "step": 18414 }, { "epoch": 0.35, "learning_rate": 3.79122198819423e-06, "loss": 0.744, "step": 18415 }, { "epoch": 0.35, "learning_rate": 3.791091173581485e-06, "loss": 0.9041, "step": 18416 }, { "epoch": 0.35, "learning_rate": 3.7909603541478455e-06, "loss": 0.7934, "step": 18417 }, { "epoch": 0.35, "learning_rate": 3.790829529893799e-06, "loss": 1.0864, "step": 18418 }, { "epoch": 0.35, "learning_rate": 3.7906987008198346e-06, "loss": 1.1574, "step": 18419 }, { "epoch": 0.35, "learning_rate": 3.7905678669264417e-06, "loss": 0.8023, "step": 18420 }, { "epoch": 0.35, "learning_rate": 3.790437028214107e-06, "loss": 1.0779, "step": 18421 }, { "epoch": 0.35, "learning_rate": 3.79030618468332e-06, "loss": 0.861, "step": 18422 }, { "epoch": 0.35, "learning_rate": 3.7901753363345696e-06, "loss": 0.7827, "step": 18423 }, { "epoch": 0.35, "learning_rate": 3.790044483168344e-06, "loss": 0.8715, "step": 18424 }, { "epoch": 0.35, "learning_rate": 3.789913625185132e-06, "loss": 0.9714, "step": 18425 }, { "epoch": 0.35, "learning_rate": 3.789782762385422e-06, "loss": 0.7558, "step": 18426 }, { "epoch": 0.35, "learning_rate": 3.7896518947697023e-06, "loss": 0.9889, "step": 18427 }, { "epoch": 0.35, "learning_rate": 3.7895210223384626e-06, "loss": 1.0125, "step": 18428 }, { "epoch": 0.35, "learning_rate": 3.78939014509219e-06, "loss": 0.8793, "step": 18429 }, { "epoch": 0.35, "learning_rate": 3.789259263031375e-06, "loss": 0.9852, "step": 18430 }, { "epoch": 0.35, "learning_rate": 3.789128376156505e-06, "loss": 1.0936, "step": 18431 }, { "epoch": 0.35, "learning_rate": 3.78899748446807e-06, "loss": 1.0346, "step": 18432 }, { "epoch": 0.35, "learning_rate": 3.788866587966557e-06, "loss": 0.8635, "step": 18433 }, { "epoch": 0.35, "learning_rate": 3.7887356866524562e-06, "loss": 0.8622, "step": 18434 }, { "epoch": 0.35, "learning_rate": 3.788604780526255e-06, "loss": 0.7599, "step": 18435 }, { "epoch": 0.35, "learning_rate": 3.7884738695884437e-06, "loss": 0.8788, "step": 18436 }, { "epoch": 0.35, "learning_rate": 3.7883429538395105e-06, "loss": 1.1235, "step": 18437 }, { "epoch": 0.35, "learning_rate": 3.7882120332799443e-06, "loss": 1.1722, "step": 18438 }, { "epoch": 0.35, "learning_rate": 3.7880811079102343e-06, "loss": 1.1068, "step": 18439 }, { "epoch": 0.35, "learning_rate": 3.787950177730868e-06, "loss": 0.7729, "step": 18440 }, { "epoch": 0.35, "learning_rate": 3.7878192427423355e-06, "loss": 1.1042, "step": 18441 }, { "epoch": 0.35, "learning_rate": 3.787688302945125e-06, "loss": 0.88, "step": 18442 }, { "epoch": 0.35, "learning_rate": 3.7875573583397263e-06, "loss": 0.9294, "step": 18443 }, { "epoch": 0.35, "learning_rate": 3.7874264089266287e-06, "loss": 1.1592, "step": 18444 }, { "epoch": 0.35, "learning_rate": 3.787295454706319e-06, "loss": 0.9279, "step": 18445 }, { "epoch": 0.35, "learning_rate": 3.7871644956792886e-06, "loss": 0.9894, "step": 18446 }, { "epoch": 0.35, "learning_rate": 3.787033531846025e-06, "loss": 0.8348, "step": 18447 }, { "epoch": 0.35, "learning_rate": 3.7869025632070176e-06, "loss": 0.7698, "step": 18448 }, { "epoch": 0.35, "learning_rate": 3.7867715897627554e-06, "loss": 0.9874, "step": 18449 }, { "epoch": 0.35, "learning_rate": 3.786640611513728e-06, "loss": 1.0571, "step": 18450 }, { "epoch": 0.35, "learning_rate": 3.7865096284604237e-06, "loss": 1.0055, "step": 18451 }, { "epoch": 0.35, "learning_rate": 3.786378640603332e-06, "loss": 0.8796, "step": 18452 }, { "epoch": 0.35, "learning_rate": 3.786247647942942e-06, "loss": 0.9008, "step": 18453 }, { "epoch": 0.35, "learning_rate": 3.7861166504797418e-06, "loss": 0.9195, "step": 18454 }, { "epoch": 0.35, "learning_rate": 3.785985648214222e-06, "loss": 0.9529, "step": 18455 }, { "epoch": 0.35, "learning_rate": 3.7858546411468723e-06, "loss": 1.0182, "step": 18456 }, { "epoch": 0.35, "learning_rate": 3.7857236292781797e-06, "loss": 0.9276, "step": 18457 }, { "epoch": 0.35, "learning_rate": 3.785592612608634e-06, "loss": 0.7324, "step": 18458 }, { "epoch": 0.35, "learning_rate": 3.785461591138726e-06, "loss": 0.9776, "step": 18459 }, { "epoch": 0.35, "learning_rate": 3.785330564868943e-06, "loss": 0.9094, "step": 18460 }, { "epoch": 0.35, "learning_rate": 3.785199533799776e-06, "loss": 0.7159, "step": 18461 }, { "epoch": 0.35, "learning_rate": 3.7850684979317133e-06, "loss": 0.9376, "step": 18462 }, { "epoch": 0.35, "learning_rate": 3.784937457265243e-06, "loss": 0.9988, "step": 18463 }, { "epoch": 0.35, "learning_rate": 3.7848064118008563e-06, "loss": 0.7631, "step": 18464 }, { "epoch": 0.35, "learning_rate": 3.784675361539042e-06, "loss": 0.8416, "step": 18465 }, { "epoch": 0.35, "learning_rate": 3.7845443064802896e-06, "loss": 0.7949, "step": 18466 }, { "epoch": 0.35, "learning_rate": 3.784413246625087e-06, "loss": 0.807, "step": 18467 }, { "epoch": 0.35, "learning_rate": 3.784282181973926e-06, "loss": 1.0587, "step": 18468 }, { "epoch": 0.35, "learning_rate": 3.7841511125272943e-06, "loss": 0.8663, "step": 18469 }, { "epoch": 0.35, "learning_rate": 3.784020038285682e-06, "loss": 0.9564, "step": 18470 }, { "epoch": 0.35, "learning_rate": 3.7838889592495776e-06, "loss": 0.7757, "step": 18471 }, { "epoch": 0.35, "learning_rate": 3.7837578754194713e-06, "loss": 0.8547, "step": 18472 }, { "epoch": 0.35, "learning_rate": 3.7836267867958527e-06, "loss": 0.9996, "step": 18473 }, { "epoch": 0.35, "learning_rate": 3.783495693379211e-06, "loss": 0.9189, "step": 18474 }, { "epoch": 0.35, "learning_rate": 3.783364595170036e-06, "loss": 0.929, "step": 18475 }, { "epoch": 0.35, "learning_rate": 3.783233492168816e-06, "loss": 0.9183, "step": 18476 }, { "epoch": 0.35, "learning_rate": 3.7831023843760424e-06, "loss": 0.8781, "step": 18477 }, { "epoch": 0.35, "learning_rate": 3.7829712717922033e-06, "loss": 0.8989, "step": 18478 }, { "epoch": 0.35, "learning_rate": 3.7828401544177895e-06, "loss": 0.8906, "step": 18479 }, { "epoch": 0.35, "learning_rate": 3.7827090322532895e-06, "loss": 0.9254, "step": 18480 }, { "epoch": 0.35, "learning_rate": 3.782577905299193e-06, "loss": 1.1802, "step": 18481 }, { "epoch": 0.35, "learning_rate": 3.7824467735559913e-06, "loss": 0.8078, "step": 18482 }, { "epoch": 0.35, "learning_rate": 3.782315637024171e-06, "loss": 0.9006, "step": 18483 }, { "epoch": 0.35, "learning_rate": 3.782184495704223e-06, "loss": 0.9149, "step": 18484 }, { "epoch": 0.35, "learning_rate": 3.7820533495966392e-06, "loss": 0.9414, "step": 18485 }, { "epoch": 0.35, "learning_rate": 3.781922198701906e-06, "loss": 0.8488, "step": 18486 }, { "epoch": 0.35, "learning_rate": 3.7817910430205157e-06, "loss": 1.0575, "step": 18487 }, { "epoch": 0.35, "learning_rate": 3.781659882552957e-06, "loss": 0.8863, "step": 18488 }, { "epoch": 0.35, "learning_rate": 3.781528717299719e-06, "loss": 0.8365, "step": 18489 }, { "epoch": 0.35, "learning_rate": 3.781397547261292e-06, "loss": 0.9847, "step": 18490 }, { "epoch": 0.35, "learning_rate": 3.781266372438166e-06, "loss": 0.8175, "step": 18491 }, { "epoch": 0.35, "learning_rate": 3.7811351928308303e-06, "loss": 0.9358, "step": 18492 }, { "epoch": 0.35, "learning_rate": 3.7810040084397757e-06, "loss": 0.9371, "step": 18493 }, { "epoch": 0.35, "learning_rate": 3.780872819265492e-06, "loss": 0.9702, "step": 18494 }, { "epoch": 0.35, "learning_rate": 3.780741625308467e-06, "loss": 0.8035, "step": 18495 }, { "epoch": 0.35, "learning_rate": 3.7806104265691928e-06, "loss": 0.9061, "step": 18496 }, { "epoch": 0.35, "learning_rate": 3.7804792230481587e-06, "loss": 1.0162, "step": 18497 }, { "epoch": 0.35, "learning_rate": 3.780348014745854e-06, "loss": 0.97, "step": 18498 }, { "epoch": 0.35, "learning_rate": 3.7802168016627687e-06, "loss": 0.8828, "step": 18499 }, { "epoch": 0.35, "learning_rate": 3.7800855837993945e-06, "loss": 0.9774, "step": 18500 }, { "epoch": 0.35, "learning_rate": 3.7799543611562185e-06, "loss": 0.7765, "step": 18501 }, { "epoch": 0.35, "learning_rate": 3.779823133733733e-06, "loss": 0.9158, "step": 18502 }, { "epoch": 0.35, "learning_rate": 3.7796919015324273e-06, "loss": 0.9119, "step": 18503 }, { "epoch": 0.35, "learning_rate": 3.7795606645527905e-06, "loss": 0.856, "step": 18504 }, { "epoch": 0.35, "learning_rate": 3.779429422795313e-06, "loss": 0.9424, "step": 18505 }, { "epoch": 0.35, "learning_rate": 3.7792981762604873e-06, "loss": 1.1179, "step": 18506 }, { "epoch": 0.35, "learning_rate": 3.7791669249488e-06, "loss": 1.089, "step": 18507 }, { "epoch": 0.35, "learning_rate": 3.7790356688607425e-06, "loss": 0.8272, "step": 18508 }, { "epoch": 0.35, "learning_rate": 3.778904407996806e-06, "loss": 0.8968, "step": 18509 }, { "epoch": 0.35, "learning_rate": 3.778773142357479e-06, "loss": 0.9959, "step": 18510 }, { "epoch": 0.35, "learning_rate": 3.778641871943252e-06, "loss": 0.9677, "step": 18511 }, { "epoch": 0.35, "learning_rate": 3.778510596754616e-06, "loss": 0.9572, "step": 18512 }, { "epoch": 0.35, "learning_rate": 3.77837931679206e-06, "loss": 1.0322, "step": 18513 }, { "epoch": 0.35, "learning_rate": 3.7782480320560755e-06, "loss": 0.8877, "step": 18514 }, { "epoch": 0.35, "learning_rate": 3.778116742547152e-06, "loss": 0.7497, "step": 18515 }, { "epoch": 0.35, "learning_rate": 3.7779854482657797e-06, "loss": 1.0156, "step": 18516 }, { "epoch": 0.35, "learning_rate": 3.777854149212449e-06, "loss": 0.9393, "step": 18517 }, { "epoch": 0.35, "learning_rate": 3.7777228453876493e-06, "loss": 1.1792, "step": 18518 }, { "epoch": 0.35, "learning_rate": 3.777591536791872e-06, "loss": 1.0541, "step": 18519 }, { "epoch": 0.35, "learning_rate": 3.7774602234256074e-06, "loss": 0.8752, "step": 18520 }, { "epoch": 0.35, "learning_rate": 3.777328905289346e-06, "loss": 0.9524, "step": 18521 }, { "epoch": 0.35, "learning_rate": 3.7771975823835767e-06, "loss": 0.9082, "step": 18522 }, { "epoch": 0.35, "learning_rate": 3.7770662547087912e-06, "loss": 0.8822, "step": 18523 }, { "epoch": 0.35, "learning_rate": 3.7769349222654792e-06, "loss": 0.9744, "step": 18524 }, { "epoch": 0.35, "learning_rate": 3.776803585054132e-06, "loss": 1.0577, "step": 18525 }, { "epoch": 0.35, "learning_rate": 3.7766722430752377e-06, "loss": 0.9734, "step": 18526 }, { "epoch": 0.35, "learning_rate": 3.7765408963292903e-06, "loss": 0.9786, "step": 18527 }, { "epoch": 0.35, "learning_rate": 3.7764095448167776e-06, "loss": 0.9948, "step": 18528 }, { "epoch": 0.35, "learning_rate": 3.7762781885381906e-06, "loss": 0.9109, "step": 18529 }, { "epoch": 0.35, "learning_rate": 3.7761468274940204e-06, "loss": 1.0556, "step": 18530 }, { "epoch": 0.35, "learning_rate": 3.7760154616847567e-06, "loss": 1.1496, "step": 18531 }, { "epoch": 0.35, "learning_rate": 3.7758840911108907e-06, "loss": 1.0302, "step": 18532 }, { "epoch": 0.35, "learning_rate": 3.7757527157729125e-06, "loss": 0.9755, "step": 18533 }, { "epoch": 0.35, "learning_rate": 3.7756213356713125e-06, "loss": 1.0207, "step": 18534 }, { "epoch": 0.35, "learning_rate": 3.775489950806582e-06, "loss": 0.931, "step": 18535 }, { "epoch": 0.35, "learning_rate": 3.775358561179211e-06, "loss": 0.9254, "step": 18536 }, { "epoch": 0.35, "learning_rate": 3.77522716678969e-06, "loss": 1.1559, "step": 18537 }, { "epoch": 0.35, "learning_rate": 3.7750957676385104e-06, "loss": 0.8458, "step": 18538 }, { "epoch": 0.35, "learning_rate": 3.774964363726161e-06, "loss": 1.139, "step": 18539 }, { "epoch": 0.35, "learning_rate": 3.774832955053135e-06, "loss": 0.8967, "step": 18540 }, { "epoch": 0.35, "learning_rate": 3.774701541619922e-06, "loss": 0.9376, "step": 18541 }, { "epoch": 0.35, "learning_rate": 3.7745701234270117e-06, "loss": 0.8438, "step": 18542 }, { "epoch": 0.35, "learning_rate": 3.7744387004748962e-06, "loss": 1.2748, "step": 18543 }, { "epoch": 0.35, "learning_rate": 3.774307272764065e-06, "loss": 1.0808, "step": 18544 }, { "epoch": 0.35, "learning_rate": 3.77417584029501e-06, "loss": 0.8636, "step": 18545 }, { "epoch": 0.35, "learning_rate": 3.774044403068222e-06, "loss": 0.9235, "step": 18546 }, { "epoch": 0.35, "learning_rate": 3.7739129610841895e-06, "loss": 0.8321, "step": 18547 }, { "epoch": 0.35, "learning_rate": 3.773781514343407e-06, "loss": 0.8683, "step": 18548 }, { "epoch": 0.35, "learning_rate": 3.7736500628463624e-06, "loss": 0.9667, "step": 18549 }, { "epoch": 0.35, "learning_rate": 3.773518606593548e-06, "loss": 0.8842, "step": 18550 }, { "epoch": 0.35, "learning_rate": 3.7733871455854544e-06, "loss": 1.0888, "step": 18551 }, { "epoch": 0.35, "learning_rate": 3.7732556798225717e-06, "loss": 1.1285, "step": 18552 }, { "epoch": 0.35, "learning_rate": 3.773124209305391e-06, "loss": 1.0338, "step": 18553 }, { "epoch": 0.35, "learning_rate": 3.772992734034404e-06, "loss": 0.773, "step": 18554 }, { "epoch": 0.35, "learning_rate": 3.7728612540101006e-06, "loss": 0.9486, "step": 18555 }, { "epoch": 0.35, "learning_rate": 3.7727297692329732e-06, "loss": 0.8163, "step": 18556 }, { "epoch": 0.35, "learning_rate": 3.7725982797035116e-06, "loss": 0.8636, "step": 18557 }, { "epoch": 0.35, "learning_rate": 3.772466785422207e-06, "loss": 0.9362, "step": 18558 }, { "epoch": 0.35, "learning_rate": 3.77233528638955e-06, "loss": 0.9017, "step": 18559 }, { "epoch": 0.35, "learning_rate": 3.772203782606032e-06, "loss": 0.8993, "step": 18560 }, { "epoch": 0.35, "learning_rate": 3.772072274072145e-06, "loss": 0.7935, "step": 18561 }, { "epoch": 0.35, "learning_rate": 3.7719407607883783e-06, "loss": 0.9026, "step": 18562 }, { "epoch": 0.35, "learning_rate": 3.771809242755224e-06, "loss": 0.8576, "step": 18563 }, { "epoch": 0.35, "learning_rate": 3.7716777199731735e-06, "loss": 0.938, "step": 18564 }, { "epoch": 0.35, "learning_rate": 3.7715461924427167e-06, "loss": 0.9138, "step": 18565 }, { "epoch": 0.35, "learning_rate": 3.7714146601643462e-06, "loss": 1.1001, "step": 18566 }, { "epoch": 0.35, "learning_rate": 3.771283123138552e-06, "loss": 0.7683, "step": 18567 }, { "epoch": 0.35, "learning_rate": 3.7711515813658246e-06, "loss": 1.0374, "step": 18568 }, { "epoch": 0.35, "learning_rate": 3.7710200348466573e-06, "loss": 0.9816, "step": 18569 }, { "epoch": 0.35, "learning_rate": 3.7708884835815394e-06, "loss": 1.0014, "step": 18570 }, { "epoch": 0.35, "learning_rate": 3.7707569275709634e-06, "loss": 1.0786, "step": 18571 }, { "epoch": 0.35, "learning_rate": 3.7706253668154203e-06, "loss": 0.8457, "step": 18572 }, { "epoch": 0.35, "learning_rate": 3.7704938013154008e-06, "loss": 0.975, "step": 18573 }, { "epoch": 0.35, "learning_rate": 3.7703622310713962e-06, "loss": 1.0121, "step": 18574 }, { "epoch": 0.35, "learning_rate": 3.7702306560838975e-06, "loss": 1.1425, "step": 18575 }, { "epoch": 0.35, "learning_rate": 3.770099076353397e-06, "loss": 0.9118, "step": 18576 }, { "epoch": 0.35, "learning_rate": 3.769967491880386e-06, "loss": 0.8904, "step": 18577 }, { "epoch": 0.35, "learning_rate": 3.7698359026653553e-06, "loss": 0.9294, "step": 18578 }, { "epoch": 0.35, "learning_rate": 3.7697043087087955e-06, "loss": 0.8558, "step": 18579 }, { "epoch": 0.35, "learning_rate": 3.769572710011199e-06, "loss": 0.8778, "step": 18580 }, { "epoch": 0.35, "learning_rate": 3.7694411065730564e-06, "loss": 1.0413, "step": 18581 }, { "epoch": 0.35, "learning_rate": 3.76930949839486e-06, "loss": 0.8615, "step": 18582 }, { "epoch": 0.35, "learning_rate": 3.769177885477101e-06, "loss": 0.9428, "step": 18583 }, { "epoch": 0.35, "learning_rate": 3.769046267820271e-06, "loss": 0.9855, "step": 18584 }, { "epoch": 0.35, "learning_rate": 3.768914645424861e-06, "loss": 0.8712, "step": 18585 }, { "epoch": 0.35, "learning_rate": 3.7687830182913622e-06, "loss": 1.0802, "step": 18586 }, { "epoch": 0.35, "learning_rate": 3.7686513864202677e-06, "loss": 1.2742, "step": 18587 }, { "epoch": 0.35, "learning_rate": 3.768519749812066e-06, "loss": 0.9981, "step": 18588 }, { "epoch": 0.35, "learning_rate": 3.768388108467251e-06, "loss": 1.0722, "step": 18589 }, { "epoch": 0.35, "learning_rate": 3.768256462386315e-06, "loss": 0.7811, "step": 18590 }, { "epoch": 0.35, "learning_rate": 3.7681248115697473e-06, "loss": 1.0189, "step": 18591 }, { "epoch": 0.35, "learning_rate": 3.7679931560180404e-06, "loss": 0.7132, "step": 18592 }, { "epoch": 0.35, "learning_rate": 3.7678614957316863e-06, "loss": 1.0778, "step": 18593 }, { "epoch": 0.35, "learning_rate": 3.7677298307111756e-06, "loss": 0.9734, "step": 18594 }, { "epoch": 0.35, "learning_rate": 3.767598160957001e-06, "loss": 1.0458, "step": 18595 }, { "epoch": 0.35, "learning_rate": 3.767466486469653e-06, "loss": 0.7499, "step": 18596 }, { "epoch": 0.35, "learning_rate": 3.7673348072496253e-06, "loss": 1.0142, "step": 18597 }, { "epoch": 0.35, "learning_rate": 3.7672031232974078e-06, "loss": 0.7102, "step": 18598 }, { "epoch": 0.35, "learning_rate": 3.7670714346134922e-06, "loss": 1.0179, "step": 18599 }, { "epoch": 0.35, "learning_rate": 3.766939741198371e-06, "loss": 1.0676, "step": 18600 }, { "epoch": 0.35, "learning_rate": 3.766808043052536e-06, "loss": 1.0781, "step": 18601 }, { "epoch": 0.35, "learning_rate": 3.7666763401764776e-06, "loss": 0.798, "step": 18602 }, { "epoch": 0.35, "learning_rate": 3.7665446325706893e-06, "loss": 0.9962, "step": 18603 }, { "epoch": 0.35, "learning_rate": 3.7664129202356627e-06, "loss": 0.9475, "step": 18604 }, { "epoch": 0.35, "learning_rate": 3.7662812031718888e-06, "loss": 1.0845, "step": 18605 }, { "epoch": 0.35, "learning_rate": 3.766149481379859e-06, "loss": 0.942, "step": 18606 }, { "epoch": 0.35, "learning_rate": 3.766017754860067e-06, "loss": 1.0832, "step": 18607 }, { "epoch": 0.35, "learning_rate": 3.7658860236130024e-06, "loss": 0.701, "step": 18608 }, { "epoch": 0.35, "learning_rate": 3.7657542876391582e-06, "loss": 0.9307, "step": 18609 }, { "epoch": 0.35, "learning_rate": 3.7656225469390273e-06, "loss": 0.972, "step": 18610 }, { "epoch": 0.35, "learning_rate": 3.7654908015130997e-06, "loss": 0.9554, "step": 18611 }, { "epoch": 0.35, "learning_rate": 3.7653590513618688e-06, "loss": 0.7508, "step": 18612 }, { "epoch": 0.35, "learning_rate": 3.7652272964858262e-06, "loss": 0.912, "step": 18613 }, { "epoch": 0.35, "learning_rate": 3.7650955368854625e-06, "loss": 0.9312, "step": 18614 }, { "epoch": 0.35, "learning_rate": 3.764963772561272e-06, "loss": 0.9457, "step": 18615 }, { "epoch": 0.35, "learning_rate": 3.7648320035137455e-06, "loss": 0.8096, "step": 18616 }, { "epoch": 0.35, "learning_rate": 3.7647002297433743e-06, "loss": 1.1836, "step": 18617 }, { "epoch": 0.35, "learning_rate": 3.7645684512506514e-06, "loss": 1.0673, "step": 18618 }, { "epoch": 0.35, "learning_rate": 3.7644366680360696e-06, "loss": 1.1351, "step": 18619 }, { "epoch": 0.35, "learning_rate": 3.7643048801001193e-06, "loss": 1.0411, "step": 18620 }, { "epoch": 0.35, "learning_rate": 3.764173087443293e-06, "loss": 0.9903, "step": 18621 }, { "epoch": 0.35, "learning_rate": 3.7640412900660838e-06, "loss": 0.972, "step": 18622 }, { "epoch": 0.35, "learning_rate": 3.763909487968983e-06, "loss": 0.9345, "step": 18623 }, { "epoch": 0.35, "learning_rate": 3.763777681152483e-06, "loss": 0.96, "step": 18624 }, { "epoch": 0.35, "learning_rate": 3.763645869617075e-06, "loss": 1.118, "step": 18625 }, { "epoch": 0.35, "learning_rate": 3.763514053363253e-06, "loss": 1.0401, "step": 18626 }, { "epoch": 0.35, "learning_rate": 3.763382232391508e-06, "loss": 0.901, "step": 18627 }, { "epoch": 0.35, "learning_rate": 3.7632504067023334e-06, "loss": 0.7128, "step": 18628 }, { "epoch": 0.35, "learning_rate": 3.7631185762962198e-06, "loss": 0.9067, "step": 18629 }, { "epoch": 0.35, "learning_rate": 3.76298674117366e-06, "loss": 0.9784, "step": 18630 }, { "epoch": 0.35, "learning_rate": 3.762854901335146e-06, "loss": 1.0071, "step": 18631 }, { "epoch": 0.35, "learning_rate": 3.7627230567811712e-06, "loss": 0.7799, "step": 18632 }, { "epoch": 0.35, "learning_rate": 3.7625912075122272e-06, "loss": 0.7439, "step": 18633 }, { "epoch": 0.35, "learning_rate": 3.7624593535288063e-06, "loss": 0.8148, "step": 18634 }, { "epoch": 0.35, "learning_rate": 3.7623274948314005e-06, "loss": 0.7712, "step": 18635 }, { "epoch": 0.35, "learning_rate": 3.762195631420503e-06, "loss": 0.9702, "step": 18636 }, { "epoch": 0.35, "learning_rate": 3.762063763296605e-06, "loss": 1.0827, "step": 18637 }, { "epoch": 0.35, "learning_rate": 3.7619318904602004e-06, "loss": 0.8681, "step": 18638 }, { "epoch": 0.35, "learning_rate": 3.7618000129117803e-06, "loss": 0.9738, "step": 18639 }, { "epoch": 0.35, "learning_rate": 3.761668130651838e-06, "loss": 0.9423, "step": 18640 }, { "epoch": 0.35, "learning_rate": 3.7615362436808656e-06, "loss": 0.8484, "step": 18641 }, { "epoch": 0.35, "learning_rate": 3.761404351999355e-06, "loss": 0.8244, "step": 18642 }, { "epoch": 0.35, "learning_rate": 3.761272455607801e-06, "loss": 1.1446, "step": 18643 }, { "epoch": 0.35, "learning_rate": 3.7611405545066915e-06, "loss": 0.9784, "step": 18644 }, { "epoch": 0.35, "learning_rate": 3.7610086486965238e-06, "loss": 0.8305, "step": 18645 }, { "epoch": 0.35, "learning_rate": 3.760876738177788e-06, "loss": 0.9111, "step": 18646 }, { "epoch": 0.35, "learning_rate": 3.760744822950977e-06, "loss": 0.7856, "step": 18647 }, { "epoch": 0.35, "learning_rate": 3.760612903016583e-06, "loss": 0.9514, "step": 18648 }, { "epoch": 0.35, "learning_rate": 3.7604809783751006e-06, "loss": 1.0883, "step": 18649 }, { "epoch": 0.35, "learning_rate": 3.76034904902702e-06, "loss": 1.1104, "step": 18650 }, { "epoch": 0.35, "learning_rate": 3.760217114972834e-06, "loss": 0.8751, "step": 18651 }, { "epoch": 0.35, "learning_rate": 3.7600851762130362e-06, "loss": 0.8337, "step": 18652 }, { "epoch": 0.35, "learning_rate": 3.7599532327481196e-06, "loss": 0.9361, "step": 18653 }, { "epoch": 0.35, "learning_rate": 3.7598212845785757e-06, "loss": 1.0346, "step": 18654 }, { "epoch": 0.35, "learning_rate": 3.759689331704899e-06, "loss": 0.9389, "step": 18655 }, { "epoch": 0.35, "learning_rate": 3.7595573741275794e-06, "loss": 1.1308, "step": 18656 }, { "epoch": 0.35, "learning_rate": 3.759425411847112e-06, "loss": 0.7726, "step": 18657 }, { "epoch": 0.35, "learning_rate": 3.7592934448639885e-06, "loss": 0.9924, "step": 18658 }, { "epoch": 0.35, "learning_rate": 3.7591614731787018e-06, "loss": 0.8103, "step": 18659 }, { "epoch": 0.35, "learning_rate": 3.7590294967917448e-06, "loss": 0.9819, "step": 18660 }, { "epoch": 0.35, "learning_rate": 3.75889751570361e-06, "loss": 0.9544, "step": 18661 }, { "epoch": 0.35, "learning_rate": 3.7587655299147906e-06, "loss": 1.1789, "step": 18662 }, { "epoch": 0.35, "learning_rate": 3.75863353942578e-06, "loss": 1.0117, "step": 18663 }, { "epoch": 0.35, "learning_rate": 3.75850154423707e-06, "loss": 1.0847, "step": 18664 }, { "epoch": 0.35, "learning_rate": 3.758369544349153e-06, "loss": 0.9637, "step": 18665 }, { "epoch": 0.35, "learning_rate": 3.758237539762524e-06, "loss": 0.7339, "step": 18666 }, { "epoch": 0.35, "learning_rate": 3.7581055304776737e-06, "loss": 0.874, "step": 18667 }, { "epoch": 0.35, "learning_rate": 3.7579735164950966e-06, "loss": 1.0749, "step": 18668 }, { "epoch": 0.35, "learning_rate": 3.7578414978152844e-06, "loss": 0.9657, "step": 18669 }, { "epoch": 0.35, "learning_rate": 3.757709474438731e-06, "loss": 0.8415, "step": 18670 }, { "epoch": 0.35, "learning_rate": 3.7575774463659288e-06, "loss": 0.9561, "step": 18671 }, { "epoch": 0.35, "learning_rate": 3.7574454135973705e-06, "loss": 0.8396, "step": 18672 }, { "epoch": 0.35, "learning_rate": 3.7573133761335502e-06, "loss": 0.8602, "step": 18673 }, { "epoch": 0.35, "learning_rate": 3.7571813339749596e-06, "loss": 0.8998, "step": 18674 }, { "epoch": 0.35, "learning_rate": 3.757049287122093e-06, "loss": 1.025, "step": 18675 }, { "epoch": 0.35, "learning_rate": 3.7569172355754436e-06, "loss": 0.8835, "step": 18676 }, { "epoch": 0.35, "learning_rate": 3.7567851793355024e-06, "loss": 0.879, "step": 18677 }, { "epoch": 0.35, "learning_rate": 3.756653118402765e-06, "loss": 0.843, "step": 18678 }, { "epoch": 0.35, "learning_rate": 3.756521052777723e-06, "loss": 0.8831, "step": 18679 }, { "epoch": 0.35, "learning_rate": 3.756388982460869e-06, "loss": 0.8314, "step": 18680 }, { "epoch": 0.35, "learning_rate": 3.7562569074526976e-06, "loss": 1.1101, "step": 18681 }, { "epoch": 0.35, "learning_rate": 3.7561248277537025e-06, "loss": 0.9501, "step": 18682 }, { "epoch": 0.35, "learning_rate": 3.755992743364375e-06, "loss": 0.9174, "step": 18683 }, { "epoch": 0.35, "learning_rate": 3.7558606542852092e-06, "loss": 0.9858, "step": 18684 }, { "epoch": 0.35, "learning_rate": 3.7557285605166983e-06, "loss": 0.8822, "step": 18685 }, { "epoch": 0.35, "learning_rate": 3.755596462059335e-06, "loss": 0.9038, "step": 18686 }, { "epoch": 0.35, "learning_rate": 3.755464358913613e-06, "loss": 1.1426, "step": 18687 }, { "epoch": 0.35, "learning_rate": 3.755332251080026e-06, "loss": 0.9138, "step": 18688 }, { "epoch": 0.35, "learning_rate": 3.755200138559067e-06, "loss": 0.886, "step": 18689 }, { "epoch": 0.35, "learning_rate": 3.755068021351229e-06, "loss": 0.9038, "step": 18690 }, { "epoch": 0.35, "learning_rate": 3.7549358994570058e-06, "loss": 0.9559, "step": 18691 }, { "epoch": 0.35, "learning_rate": 3.7548037728768893e-06, "loss": 0.8784, "step": 18692 }, { "epoch": 0.35, "learning_rate": 3.754671641611375e-06, "loss": 1.1298, "step": 18693 }, { "epoch": 0.35, "learning_rate": 3.7545395056609545e-06, "loss": 1.0976, "step": 18694 }, { "epoch": 0.35, "learning_rate": 3.7544073650261224e-06, "loss": 0.8281, "step": 18695 }, { "epoch": 0.35, "learning_rate": 3.754275219707372e-06, "loss": 0.8266, "step": 18696 }, { "epoch": 0.35, "learning_rate": 3.754143069705196e-06, "loss": 0.8881, "step": 18697 }, { "epoch": 0.35, "learning_rate": 3.754010915020089e-06, "loss": 0.8239, "step": 18698 }, { "epoch": 0.35, "learning_rate": 3.7538787556525426e-06, "loss": 0.8446, "step": 18699 }, { "epoch": 0.35, "learning_rate": 3.7537465916030513e-06, "loss": 1.1697, "step": 18700 }, { "epoch": 0.35, "learning_rate": 3.7536144228721093e-06, "loss": 1.1348, "step": 18701 }, { "epoch": 0.35, "learning_rate": 3.7534822494602095e-06, "loss": 0.9199, "step": 18702 }, { "epoch": 0.35, "learning_rate": 3.7533500713678454e-06, "loss": 0.9452, "step": 18703 }, { "epoch": 0.35, "learning_rate": 3.7532178885955108e-06, "loss": 0.8427, "step": 18704 }, { "epoch": 0.35, "learning_rate": 3.753085701143698e-06, "loss": 0.7397, "step": 18705 }, { "epoch": 0.35, "learning_rate": 3.7529535090129026e-06, "loss": 1.2284, "step": 18706 }, { "epoch": 0.35, "learning_rate": 3.7528213122036162e-06, "loss": 0.9799, "step": 18707 }, { "epoch": 0.35, "learning_rate": 3.7526891107163343e-06, "loss": 0.7911, "step": 18708 }, { "epoch": 0.35, "learning_rate": 3.7525569045515496e-06, "loss": 0.8452, "step": 18709 }, { "epoch": 0.35, "learning_rate": 3.752424693709756e-06, "loss": 0.836, "step": 18710 }, { "epoch": 0.35, "learning_rate": 3.7522924781914473e-06, "loss": 1.0038, "step": 18711 }, { "epoch": 0.35, "learning_rate": 3.7521602579971157e-06, "loss": 1.0425, "step": 18712 }, { "epoch": 0.35, "learning_rate": 3.7520280331272563e-06, "loss": 0.8918, "step": 18713 }, { "epoch": 0.35, "learning_rate": 3.751895803582363e-06, "loss": 0.7263, "step": 18714 }, { "epoch": 0.35, "learning_rate": 3.751763569362929e-06, "loss": 0.9249, "step": 18715 }, { "epoch": 0.35, "learning_rate": 3.7516313304694487e-06, "loss": 0.853, "step": 18716 }, { "epoch": 0.35, "learning_rate": 3.7514990869024148e-06, "loss": 0.9042, "step": 18717 }, { "epoch": 0.35, "learning_rate": 3.751366838662322e-06, "loss": 0.9104, "step": 18718 }, { "epoch": 0.35, "learning_rate": 3.7512345857496633e-06, "loss": 1.1193, "step": 18719 }, { "epoch": 0.35, "learning_rate": 3.7511023281649338e-06, "loss": 0.901, "step": 18720 }, { "epoch": 0.35, "learning_rate": 3.7509700659086257e-06, "loss": 0.8502, "step": 18721 }, { "epoch": 0.35, "learning_rate": 3.7508377989812337e-06, "loss": 0.9168, "step": 18722 }, { "epoch": 0.35, "learning_rate": 3.7507055273832534e-06, "loss": 0.7899, "step": 18723 }, { "epoch": 0.35, "learning_rate": 3.7505732511151755e-06, "loss": 1.0132, "step": 18724 }, { "epoch": 0.35, "learning_rate": 3.7504409701774956e-06, "loss": 0.8852, "step": 18725 }, { "epoch": 0.35, "learning_rate": 3.750308684570708e-06, "loss": 0.9472, "step": 18726 }, { "epoch": 0.35, "learning_rate": 3.7501763942953056e-06, "loss": 0.8942, "step": 18727 }, { "epoch": 0.35, "learning_rate": 3.750044099351782e-06, "loss": 0.9966, "step": 18728 }, { "epoch": 0.35, "learning_rate": 3.7499117997406338e-06, "loss": 1.0109, "step": 18729 }, { "epoch": 0.35, "learning_rate": 3.7497794954623524e-06, "loss": 1.1017, "step": 18730 }, { "epoch": 0.35, "learning_rate": 3.749647186517433e-06, "loss": 1.1183, "step": 18731 }, { "epoch": 0.35, "learning_rate": 3.749514872906369e-06, "loss": 0.9357, "step": 18732 }, { "epoch": 0.35, "learning_rate": 3.7493825546296547e-06, "loss": 1.0134, "step": 18733 }, { "epoch": 0.35, "learning_rate": 3.7492502316877842e-06, "loss": 0.9576, "step": 18734 }, { "epoch": 0.35, "learning_rate": 3.749117904081252e-06, "loss": 0.8781, "step": 18735 }, { "epoch": 0.35, "learning_rate": 3.7489855718105515e-06, "loss": 1.0497, "step": 18736 }, { "epoch": 0.35, "learning_rate": 3.7488532348761774e-06, "loss": 1.3163, "step": 18737 }, { "epoch": 0.35, "learning_rate": 3.748720893278624e-06, "loss": 1.081, "step": 18738 }, { "epoch": 0.35, "learning_rate": 3.748588547018385e-06, "loss": 0.843, "step": 18739 }, { "epoch": 0.35, "learning_rate": 3.7484561960959537e-06, "loss": 1.0465, "step": 18740 }, { "epoch": 0.35, "learning_rate": 3.7483238405118263e-06, "loss": 0.9043, "step": 18741 }, { "epoch": 0.35, "learning_rate": 3.748191480266495e-06, "loss": 0.6926, "step": 18742 }, { "epoch": 0.35, "learning_rate": 3.7480591153604555e-06, "loss": 1.2701, "step": 18743 }, { "epoch": 0.35, "learning_rate": 3.747926745794202e-06, "loss": 1.0682, "step": 18744 }, { "epoch": 0.35, "learning_rate": 3.7477943715682273e-06, "loss": 0.8865, "step": 18745 }, { "epoch": 0.35, "learning_rate": 3.747661992683027e-06, "loss": 0.8047, "step": 18746 }, { "epoch": 0.35, "learning_rate": 3.747529609139096e-06, "loss": 1.412, "step": 18747 }, { "epoch": 0.35, "learning_rate": 3.7473972209369264e-06, "loss": 0.8441, "step": 18748 }, { "epoch": 0.35, "learning_rate": 3.747264828077014e-06, "loss": 0.8876, "step": 18749 }, { "epoch": 0.35, "learning_rate": 3.747132430559854e-06, "loss": 1.1839, "step": 18750 }, { "epoch": 0.35, "learning_rate": 3.7470000283859387e-06, "loss": 0.9279, "step": 18751 }, { "epoch": 0.35, "learning_rate": 3.7468676215557644e-06, "loss": 0.8419, "step": 18752 }, { "epoch": 0.35, "learning_rate": 3.746735210069824e-06, "loss": 0.9505, "step": 18753 }, { "epoch": 0.35, "learning_rate": 3.7466027939286134e-06, "loss": 0.7003, "step": 18754 }, { "epoch": 0.35, "learning_rate": 3.7464703731326246e-06, "loss": 0.9186, "step": 18755 }, { "epoch": 0.35, "learning_rate": 3.7463379476823546e-06, "loss": 1.0885, "step": 18756 }, { "epoch": 0.35, "learning_rate": 3.7462055175782967e-06, "loss": 0.7996, "step": 18757 }, { "epoch": 0.35, "learning_rate": 3.7460730828209456e-06, "loss": 1.1241, "step": 18758 }, { "epoch": 0.35, "learning_rate": 3.7459406434107963e-06, "loss": 0.7695, "step": 18759 }, { "epoch": 0.35, "learning_rate": 3.7458081993483427e-06, "loss": 0.8705, "step": 18760 }, { "epoch": 0.35, "learning_rate": 3.745675750634079e-06, "loss": 1.0134, "step": 18761 }, { "epoch": 0.35, "learning_rate": 3.7455432972685008e-06, "loss": 1.1461, "step": 18762 }, { "epoch": 0.35, "learning_rate": 3.7454108392521018e-06, "loss": 0.9808, "step": 18763 }, { "epoch": 0.35, "learning_rate": 3.7452783765853767e-06, "loss": 0.8832, "step": 18764 }, { "epoch": 0.35, "learning_rate": 3.7451459092688207e-06, "loss": 0.9661, "step": 18765 }, { "epoch": 0.35, "learning_rate": 3.745013437302928e-06, "loss": 1.0161, "step": 18766 }, { "epoch": 0.35, "learning_rate": 3.744880960688193e-06, "loss": 0.8494, "step": 18767 }, { "epoch": 0.35, "learning_rate": 3.7447484794251115e-06, "loss": 1.0087, "step": 18768 }, { "epoch": 0.35, "learning_rate": 3.744615993514176e-06, "loss": 0.9188, "step": 18769 }, { "epoch": 0.35, "learning_rate": 3.7444835029558834e-06, "loss": 0.8914, "step": 18770 }, { "epoch": 0.35, "learning_rate": 3.7443510077507278e-06, "loss": 0.8293, "step": 18771 }, { "epoch": 0.35, "learning_rate": 3.7442185078992034e-06, "loss": 1.0369, "step": 18772 }, { "epoch": 0.35, "learning_rate": 3.7440860034018045e-06, "loss": 0.7888, "step": 18773 }, { "epoch": 0.35, "learning_rate": 3.743953494259028e-06, "loss": 1.0428, "step": 18774 }, { "epoch": 0.35, "learning_rate": 3.7438209804713666e-06, "loss": 1.0878, "step": 18775 }, { "epoch": 0.35, "learning_rate": 3.7436884620393156e-06, "loss": 0.9413, "step": 18776 }, { "epoch": 0.35, "learning_rate": 3.74355593896337e-06, "loss": 1.0208, "step": 18777 }, { "epoch": 0.35, "learning_rate": 3.743423411244025e-06, "loss": 0.8684, "step": 18778 }, { "epoch": 0.35, "learning_rate": 3.7432908788817744e-06, "loss": 0.8087, "step": 18779 }, { "epoch": 0.35, "learning_rate": 3.743158341877115e-06, "loss": 0.7869, "step": 18780 }, { "epoch": 0.35, "learning_rate": 3.74302580023054e-06, "loss": 1.0678, "step": 18781 }, { "epoch": 0.35, "learning_rate": 3.7428932539425437e-06, "loss": 1.0903, "step": 18782 }, { "epoch": 0.35, "learning_rate": 3.742760703013623e-06, "loss": 0.7253, "step": 18783 }, { "epoch": 0.35, "learning_rate": 3.7426281474442714e-06, "loss": 0.7633, "step": 18784 }, { "epoch": 0.35, "learning_rate": 3.7424955872349855e-06, "loss": 0.8555, "step": 18785 }, { "epoch": 0.35, "learning_rate": 3.7423630223862587e-06, "loss": 0.7692, "step": 18786 }, { "epoch": 0.35, "learning_rate": 3.7422304528985866e-06, "loss": 1.007, "step": 18787 }, { "epoch": 0.35, "learning_rate": 3.7420978787724634e-06, "loss": 0.9666, "step": 18788 }, { "epoch": 0.35, "learning_rate": 3.7419653000083855e-06, "loss": 0.8622, "step": 18789 }, { "epoch": 0.35, "learning_rate": 3.741832716606846e-06, "loss": 1.0317, "step": 18790 }, { "epoch": 0.35, "learning_rate": 3.7417001285683423e-06, "loss": 0.84, "step": 18791 }, { "epoch": 0.35, "learning_rate": 3.741567535893369e-06, "loss": 0.7963, "step": 18792 }, { "epoch": 0.35, "learning_rate": 3.7414349385824196e-06, "loss": 0.9578, "step": 18793 }, { "epoch": 0.35, "learning_rate": 3.74130233663599e-06, "loss": 0.9835, "step": 18794 }, { "epoch": 0.35, "learning_rate": 3.741169730054577e-06, "loss": 0.7635, "step": 18795 }, { "epoch": 0.35, "learning_rate": 3.7410371188386728e-06, "loss": 0.8008, "step": 18796 }, { "epoch": 0.35, "learning_rate": 3.7409045029887747e-06, "loss": 0.8527, "step": 18797 }, { "epoch": 0.35, "learning_rate": 3.740771882505377e-06, "loss": 0.7923, "step": 18798 }, { "epoch": 0.35, "learning_rate": 3.740639257388975e-06, "loss": 0.9474, "step": 18799 }, { "epoch": 0.35, "learning_rate": 3.7405066276400643e-06, "loss": 0.8572, "step": 18800 }, { "epoch": 0.35, "learning_rate": 3.7403739932591398e-06, "loss": 0.7317, "step": 18801 }, { "epoch": 0.35, "learning_rate": 3.740241354246697e-06, "loss": 0.7206, "step": 18802 }, { "epoch": 0.35, "learning_rate": 3.7401087106032306e-06, "loss": 0.9616, "step": 18803 }, { "epoch": 0.35, "learning_rate": 3.7399760623292366e-06, "loss": 0.7387, "step": 18804 }, { "epoch": 0.35, "learning_rate": 3.73984340942521e-06, "loss": 0.9619, "step": 18805 }, { "epoch": 0.35, "learning_rate": 3.739710751891646e-06, "loss": 1.197, "step": 18806 }, { "epoch": 0.35, "learning_rate": 3.73957808972904e-06, "loss": 1.0293, "step": 18807 }, { "epoch": 0.35, "learning_rate": 3.7394454229378878e-06, "loss": 1.0687, "step": 18808 }, { "epoch": 0.35, "learning_rate": 3.7393127515186846e-06, "loss": 0.9285, "step": 18809 }, { "epoch": 0.35, "learning_rate": 3.739180075471925e-06, "loss": 0.8896, "step": 18810 }, { "epoch": 0.35, "learning_rate": 3.739047394798105e-06, "loss": 0.9937, "step": 18811 }, { "epoch": 0.35, "learning_rate": 3.7389147094977197e-06, "loss": 1.0707, "step": 18812 }, { "epoch": 0.35, "learning_rate": 3.7387820195712655e-06, "loss": 0.8227, "step": 18813 }, { "epoch": 0.35, "learning_rate": 3.7386493250192376e-06, "loss": 1.0692, "step": 18814 }, { "epoch": 0.35, "learning_rate": 3.7385166258421302e-06, "loss": 0.9226, "step": 18815 }, { "epoch": 0.35, "learning_rate": 3.7383839220404407e-06, "loss": 0.993, "step": 18816 }, { "epoch": 0.36, "learning_rate": 3.7382512136146624e-06, "loss": 0.5912, "step": 18817 }, { "epoch": 0.36, "learning_rate": 3.7381185005652925e-06, "loss": 1.036, "step": 18818 }, { "epoch": 0.36, "learning_rate": 3.737985782892826e-06, "loss": 0.9304, "step": 18819 }, { "epoch": 0.36, "learning_rate": 3.7378530605977586e-06, "loss": 0.9295, "step": 18820 }, { "epoch": 0.36, "learning_rate": 3.7377203336805857e-06, "loss": 0.8871, "step": 18821 }, { "epoch": 0.36, "learning_rate": 3.737587602141804e-06, "loss": 0.8514, "step": 18822 }, { "epoch": 0.36, "learning_rate": 3.737454865981907e-06, "loss": 0.8525, "step": 18823 }, { "epoch": 0.36, "learning_rate": 3.737322125201392e-06, "loss": 1.0697, "step": 18824 }, { "epoch": 0.36, "learning_rate": 3.7371893798007537e-06, "loss": 0.9484, "step": 18825 }, { "epoch": 0.36, "learning_rate": 3.7370566297804882e-06, "loss": 0.8394, "step": 18826 }, { "epoch": 0.36, "learning_rate": 3.736923875141092e-06, "loss": 0.8091, "step": 18827 }, { "epoch": 0.36, "learning_rate": 3.7367911158830594e-06, "loss": 0.9353, "step": 18828 }, { "epoch": 0.36, "learning_rate": 3.7366583520068866e-06, "loss": 0.8388, "step": 18829 }, { "epoch": 0.36, "learning_rate": 3.7365255835130698e-06, "loss": 0.9538, "step": 18830 }, { "epoch": 0.36, "learning_rate": 3.7363928104021042e-06, "loss": 1.0372, "step": 18831 }, { "epoch": 0.36, "learning_rate": 3.736260032674485e-06, "loss": 1.0336, "step": 18832 }, { "epoch": 0.36, "learning_rate": 3.73612725033071e-06, "loss": 0.9665, "step": 18833 }, { "epoch": 0.36, "learning_rate": 3.735994463371273e-06, "loss": 0.8703, "step": 18834 }, { "epoch": 0.36, "learning_rate": 3.7358616717966706e-06, "loss": 1.0173, "step": 18835 }, { "epoch": 0.36, "learning_rate": 3.7357288756073988e-06, "loss": 0.8076, "step": 18836 }, { "epoch": 0.36, "learning_rate": 3.735596074803953e-06, "loss": 1.1868, "step": 18837 }, { "epoch": 0.36, "learning_rate": 3.73546326938683e-06, "loss": 1.0213, "step": 18838 }, { "epoch": 0.36, "learning_rate": 3.7353304593565243e-06, "loss": 0.9584, "step": 18839 }, { "epoch": 0.36, "learning_rate": 3.735197644713533e-06, "loss": 1.0028, "step": 18840 }, { "epoch": 0.36, "learning_rate": 3.735064825458351e-06, "loss": 0.998, "step": 18841 }, { "epoch": 0.36, "learning_rate": 3.734932001591476e-06, "loss": 1.017, "step": 18842 }, { "epoch": 0.36, "learning_rate": 3.7347991731134013e-06, "loss": 0.93, "step": 18843 }, { "epoch": 0.36, "learning_rate": 3.7346663400246252e-06, "loss": 1.0886, "step": 18844 }, { "epoch": 0.36, "learning_rate": 3.7345335023256424e-06, "loss": 0.928, "step": 18845 }, { "epoch": 0.36, "learning_rate": 3.7344006600169496e-06, "loss": 0.885, "step": 18846 }, { "epoch": 0.36, "learning_rate": 3.7342678130990427e-06, "loss": 0.8665, "step": 18847 }, { "epoch": 0.36, "learning_rate": 3.7341349615724177e-06, "loss": 0.9879, "step": 18848 }, { "epoch": 0.36, "learning_rate": 3.734002105437571e-06, "loss": 1.1323, "step": 18849 }, { "epoch": 0.36, "learning_rate": 3.733869244694997e-06, "loss": 0.904, "step": 18850 }, { "epoch": 0.36, "learning_rate": 3.733736379345194e-06, "loss": 0.815, "step": 18851 }, { "epoch": 0.36, "learning_rate": 3.733603509388657e-06, "loss": 0.8359, "step": 18852 }, { "epoch": 0.36, "learning_rate": 3.733470634825882e-06, "loss": 0.8651, "step": 18853 }, { "epoch": 0.36, "learning_rate": 3.733337755657366e-06, "loss": 0.8444, "step": 18854 }, { "epoch": 0.36, "learning_rate": 3.7332048718836045e-06, "loss": 1.0576, "step": 18855 }, { "epoch": 0.36, "learning_rate": 3.7330719835050934e-06, "loss": 1.1369, "step": 18856 }, { "epoch": 0.36, "learning_rate": 3.73293909052233e-06, "loss": 0.8235, "step": 18857 }, { "epoch": 0.36, "learning_rate": 3.7328061929358093e-06, "loss": 0.8283, "step": 18858 }, { "epoch": 0.36, "learning_rate": 3.7326732907460282e-06, "loss": 1.0319, "step": 18859 }, { "epoch": 0.36, "learning_rate": 3.7325403839534824e-06, "loss": 0.8359, "step": 18860 }, { "epoch": 0.36, "learning_rate": 3.732407472558669e-06, "loss": 0.946, "step": 18861 }, { "epoch": 0.36, "learning_rate": 3.7322745565620846e-06, "loss": 1.0095, "step": 18862 }, { "epoch": 0.36, "learning_rate": 3.732141635964224e-06, "loss": 0.9775, "step": 18863 }, { "epoch": 0.36, "learning_rate": 3.7320087107655844e-06, "loss": 0.8927, "step": 18864 }, { "epoch": 0.36, "learning_rate": 3.7318757809666616e-06, "loss": 0.9171, "step": 18865 }, { "epoch": 0.36, "learning_rate": 3.731742846567953e-06, "loss": 1.0182, "step": 18866 }, { "epoch": 0.36, "learning_rate": 3.731609907569954e-06, "loss": 1.0624, "step": 18867 }, { "epoch": 0.36, "learning_rate": 3.731476963973162e-06, "loss": 1.0533, "step": 18868 }, { "epoch": 0.36, "learning_rate": 3.731344015778073e-06, "loss": 1.1497, "step": 18869 }, { "epoch": 0.36, "learning_rate": 3.7312110629851824e-06, "loss": 0.7568, "step": 18870 }, { "epoch": 0.36, "learning_rate": 3.7310781055949875e-06, "loss": 0.9261, "step": 18871 }, { "epoch": 0.36, "learning_rate": 3.730945143607985e-06, "loss": 0.8533, "step": 18872 }, { "epoch": 0.36, "learning_rate": 3.7308121770246706e-06, "loss": 0.9496, "step": 18873 }, { "epoch": 0.36, "learning_rate": 3.730679205845541e-06, "loss": 1.0862, "step": 18874 }, { "epoch": 0.36, "learning_rate": 3.7305462300710943e-06, "loss": 0.9364, "step": 18875 }, { "epoch": 0.36, "learning_rate": 3.730413249701825e-06, "loss": 0.9278, "step": 18876 }, { "epoch": 0.36, "learning_rate": 3.7302802647382304e-06, "loss": 0.9012, "step": 18877 }, { "epoch": 0.36, "learning_rate": 3.730147275180807e-06, "loss": 1.0584, "step": 18878 }, { "epoch": 0.36, "learning_rate": 3.730014281030051e-06, "loss": 0.8517, "step": 18879 }, { "epoch": 0.36, "learning_rate": 3.72988128228646e-06, "loss": 1.0112, "step": 18880 }, { "epoch": 0.36, "learning_rate": 3.7297482789505294e-06, "loss": 1.3484, "step": 18881 }, { "epoch": 0.36, "learning_rate": 3.7296152710227567e-06, "loss": 0.8456, "step": 18882 }, { "epoch": 0.36, "learning_rate": 3.7294822585036384e-06, "loss": 0.8639, "step": 18883 }, { "epoch": 0.36, "learning_rate": 3.729349241393671e-06, "loss": 1.0211, "step": 18884 }, { "epoch": 0.36, "learning_rate": 3.7292162196933514e-06, "loss": 0.8339, "step": 18885 }, { "epoch": 0.36, "learning_rate": 3.7290831934031757e-06, "loss": 0.9973, "step": 18886 }, { "epoch": 0.36, "learning_rate": 3.7289501625236413e-06, "loss": 1.214, "step": 18887 }, { "epoch": 0.36, "learning_rate": 3.728817127055244e-06, "loss": 1.0516, "step": 18888 }, { "epoch": 0.36, "learning_rate": 3.728684086998482e-06, "loss": 0.8436, "step": 18889 }, { "epoch": 0.36, "learning_rate": 3.7285510423538517e-06, "loss": 0.9441, "step": 18890 }, { "epoch": 0.36, "learning_rate": 3.7284179931218488e-06, "loss": 0.8615, "step": 18891 }, { "epoch": 0.36, "learning_rate": 3.7282849393029706e-06, "loss": 0.799, "step": 18892 }, { "epoch": 0.36, "learning_rate": 3.7281518808977152e-06, "loss": 0.9435, "step": 18893 }, { "epoch": 0.36, "learning_rate": 3.7280188179065773e-06, "loss": 1.0128, "step": 18894 }, { "epoch": 0.36, "learning_rate": 3.7278857503300545e-06, "loss": 0.9032, "step": 18895 }, { "epoch": 0.36, "learning_rate": 3.7277526781686445e-06, "loss": 1.071, "step": 18896 }, { "epoch": 0.36, "learning_rate": 3.727619601422844e-06, "loss": 0.832, "step": 18897 }, { "epoch": 0.36, "learning_rate": 3.7274865200931488e-06, "loss": 0.7988, "step": 18898 }, { "epoch": 0.36, "learning_rate": 3.7273534341800575e-06, "loss": 1.0287, "step": 18899 }, { "epoch": 0.36, "learning_rate": 3.7272203436840654e-06, "loss": 1.0385, "step": 18900 }, { "epoch": 0.36, "learning_rate": 3.7270872486056702e-06, "loss": 0.9851, "step": 18901 }, { "epoch": 0.36, "learning_rate": 3.7269541489453686e-06, "loss": 0.8249, "step": 18902 }, { "epoch": 0.36, "learning_rate": 3.7268210447036584e-06, "loss": 0.9299, "step": 18903 }, { "epoch": 0.36, "learning_rate": 3.726687935881036e-06, "loss": 0.8813, "step": 18904 }, { "epoch": 0.36, "learning_rate": 3.7265548224779983e-06, "loss": 0.9158, "step": 18905 }, { "epoch": 0.36, "learning_rate": 3.7264217044950424e-06, "loss": 1.0596, "step": 18906 }, { "epoch": 0.36, "learning_rate": 3.7262885819326656e-06, "loss": 1.0326, "step": 18907 }, { "epoch": 0.36, "learning_rate": 3.7261554547913647e-06, "loss": 0.858, "step": 18908 }, { "epoch": 0.36, "learning_rate": 3.7260223230716367e-06, "loss": 0.8878, "step": 18909 }, { "epoch": 0.36, "learning_rate": 3.7258891867739795e-06, "loss": 0.788, "step": 18910 }, { "epoch": 0.36, "learning_rate": 3.7257560458988897e-06, "loss": 0.796, "step": 18911 }, { "epoch": 0.36, "learning_rate": 3.7256229004468637e-06, "loss": 0.9357, "step": 18912 }, { "epoch": 0.36, "learning_rate": 3.7254897504183996e-06, "loss": 0.9405, "step": 18913 }, { "epoch": 0.36, "learning_rate": 3.7253565958139946e-06, "loss": 0.9944, "step": 18914 }, { "epoch": 0.36, "learning_rate": 3.7252234366341454e-06, "loss": 0.9476, "step": 18915 }, { "epoch": 0.36, "learning_rate": 3.7250902728793494e-06, "loss": 0.8746, "step": 18916 }, { "epoch": 0.36, "learning_rate": 3.7249571045501044e-06, "loss": 0.8939, "step": 18917 }, { "epoch": 0.36, "learning_rate": 3.724823931646907e-06, "loss": 0.89, "step": 18918 }, { "epoch": 0.36, "learning_rate": 3.7246907541702543e-06, "loss": 1.1302, "step": 18919 }, { "epoch": 0.36, "learning_rate": 3.724557572120644e-06, "loss": 1.0876, "step": 18920 }, { "epoch": 0.36, "learning_rate": 3.7244243854985735e-06, "loss": 0.8148, "step": 18921 }, { "epoch": 0.36, "learning_rate": 3.7242911943045394e-06, "loss": 0.9081, "step": 18922 }, { "epoch": 0.36, "learning_rate": 3.7241579985390397e-06, "loss": 0.8073, "step": 18923 }, { "epoch": 0.36, "learning_rate": 3.724024798202571e-06, "loss": 1.0716, "step": 18924 }, { "epoch": 0.36, "learning_rate": 3.7238915932956322e-06, "loss": 0.9981, "step": 18925 }, { "epoch": 0.36, "learning_rate": 3.7237583838187198e-06, "loss": 0.9308, "step": 18926 }, { "epoch": 0.36, "learning_rate": 3.723625169772331e-06, "loss": 0.8114, "step": 18927 }, { "epoch": 0.36, "learning_rate": 3.723491951156963e-06, "loss": 1.0043, "step": 18928 }, { "epoch": 0.36, "learning_rate": 3.723358727973113e-06, "loss": 0.8046, "step": 18929 }, { "epoch": 0.36, "learning_rate": 3.7232255002212797e-06, "loss": 0.9227, "step": 18930 }, { "epoch": 0.36, "learning_rate": 3.72309226790196e-06, "loss": 1.0485, "step": 18931 }, { "epoch": 0.36, "learning_rate": 3.722959031015651e-06, "loss": 0.9681, "step": 18932 }, { "epoch": 0.36, "learning_rate": 3.7228257895628504e-06, "loss": 0.8008, "step": 18933 }, { "epoch": 0.36, "learning_rate": 3.7226925435440557e-06, "loss": 1.0671, "step": 18934 }, { "epoch": 0.36, "learning_rate": 3.7225592929597653e-06, "loss": 0.8774, "step": 18935 }, { "epoch": 0.36, "learning_rate": 3.7224260378104755e-06, "loss": 0.744, "step": 18936 }, { "epoch": 0.36, "learning_rate": 3.722292778096684e-06, "loss": 1.0057, "step": 18937 }, { "epoch": 0.36, "learning_rate": 3.722159513818889e-06, "loss": 1.0038, "step": 18938 }, { "epoch": 0.36, "learning_rate": 3.722026244977588e-06, "loss": 0.873, "step": 18939 }, { "epoch": 0.36, "learning_rate": 3.721892971573278e-06, "loss": 0.8969, "step": 18940 }, { "epoch": 0.36, "learning_rate": 3.721759693606458e-06, "loss": 0.9467, "step": 18941 }, { "epoch": 0.36, "learning_rate": 3.7216264110776245e-06, "loss": 0.9299, "step": 18942 }, { "epoch": 0.36, "learning_rate": 3.721493123987275e-06, "loss": 1.033, "step": 18943 }, { "epoch": 0.36, "learning_rate": 3.7213598323359075e-06, "loss": 1.2024, "step": 18944 }, { "epoch": 0.36, "learning_rate": 3.72122653612402e-06, "loss": 0.785, "step": 18945 }, { "epoch": 0.36, "learning_rate": 3.7210932353521107e-06, "loss": 0.9281, "step": 18946 }, { "epoch": 0.36, "learning_rate": 3.7209599300206762e-06, "loss": 0.7979, "step": 18947 }, { "epoch": 0.36, "learning_rate": 3.7208266201302144e-06, "loss": 0.8654, "step": 18948 }, { "epoch": 0.36, "learning_rate": 3.7206933056812245e-06, "loss": 0.9843, "step": 18949 }, { "epoch": 0.36, "learning_rate": 3.7205599866742013e-06, "loss": 0.95, "step": 18950 }, { "epoch": 0.36, "learning_rate": 3.7204266631096466e-06, "loss": 0.998, "step": 18951 }, { "epoch": 0.36, "learning_rate": 3.7202933349880554e-06, "loss": 0.9823, "step": 18952 }, { "epoch": 0.36, "learning_rate": 3.720160002309926e-06, "loss": 0.824, "step": 18953 }, { "epoch": 0.36, "learning_rate": 3.7200266650757565e-06, "loss": 0.9438, "step": 18954 }, { "epoch": 0.36, "learning_rate": 3.7198933232860458e-06, "loss": 0.992, "step": 18955 }, { "epoch": 0.36, "learning_rate": 3.7197599769412895e-06, "loss": 1.1061, "step": 18956 }, { "epoch": 0.36, "learning_rate": 3.7196266260419876e-06, "loss": 0.7031, "step": 18957 }, { "epoch": 0.36, "learning_rate": 3.719493270588637e-06, "loss": 0.7221, "step": 18958 }, { "epoch": 0.36, "learning_rate": 3.7193599105817363e-06, "loss": 1.0565, "step": 18959 }, { "epoch": 0.36, "learning_rate": 3.7192265460217826e-06, "loss": 1.0272, "step": 18960 }, { "epoch": 0.36, "learning_rate": 3.7190931769092754e-06, "loss": 0.7317, "step": 18961 }, { "epoch": 0.36, "learning_rate": 3.7189598032447106e-06, "loss": 1.0122, "step": 18962 }, { "epoch": 0.36, "learning_rate": 3.7188264250285873e-06, "loss": 1.132, "step": 18963 }, { "epoch": 0.36, "learning_rate": 3.7186930422614037e-06, "loss": 0.7465, "step": 18964 }, { "epoch": 0.36, "learning_rate": 3.7185596549436576e-06, "loss": 0.8502, "step": 18965 }, { "epoch": 0.36, "learning_rate": 3.718426263075847e-06, "loss": 0.9036, "step": 18966 }, { "epoch": 0.36, "learning_rate": 3.7182928666584705e-06, "loss": 0.8988, "step": 18967 }, { "epoch": 0.36, "learning_rate": 3.7181594656920256e-06, "loss": 1.039, "step": 18968 }, { "epoch": 0.36, "learning_rate": 3.7180260601770103e-06, "loss": 1.0297, "step": 18969 }, { "epoch": 0.36, "learning_rate": 3.717892650113924e-06, "loss": 0.9962, "step": 18970 }, { "epoch": 0.36, "learning_rate": 3.717759235503262e-06, "loss": 1.1023, "step": 18971 }, { "epoch": 0.36, "learning_rate": 3.7176258163455257e-06, "loss": 1.1667, "step": 18972 }, { "epoch": 0.36, "learning_rate": 3.717492392641212e-06, "loss": 0.8713, "step": 18973 }, { "epoch": 0.36, "learning_rate": 3.7173589643908193e-06, "loss": 0.9855, "step": 18974 }, { "epoch": 0.36, "learning_rate": 3.7172255315948447e-06, "loss": 1.1105, "step": 18975 }, { "epoch": 0.36, "learning_rate": 3.717092094253788e-06, "loss": 1.1398, "step": 18976 }, { "epoch": 0.36, "learning_rate": 3.716958652368147e-06, "loss": 0.7838, "step": 18977 }, { "epoch": 0.36, "learning_rate": 3.7168252059384185e-06, "loss": 1.0067, "step": 18978 }, { "epoch": 0.36, "learning_rate": 3.716691754965103e-06, "loss": 0.8183, "step": 18979 }, { "epoch": 0.36, "learning_rate": 3.7165582994486972e-06, "loss": 0.7557, "step": 18980 }, { "epoch": 0.36, "learning_rate": 3.7164248393896996e-06, "loss": 0.8807, "step": 18981 }, { "epoch": 0.36, "learning_rate": 3.71629137478861e-06, "loss": 1.0416, "step": 18982 }, { "epoch": 0.36, "learning_rate": 3.716157905645925e-06, "loss": 0.9459, "step": 18983 }, { "epoch": 0.36, "learning_rate": 3.716024431962144e-06, "loss": 0.9875, "step": 18984 }, { "epoch": 0.36, "learning_rate": 3.715890953737765e-06, "loss": 0.8233, "step": 18985 }, { "epoch": 0.36, "learning_rate": 3.7157574709732863e-06, "loss": 0.8829, "step": 18986 }, { "epoch": 0.36, "learning_rate": 3.7156239836692063e-06, "loss": 1.0666, "step": 18987 }, { "epoch": 0.36, "learning_rate": 3.715490491826024e-06, "loss": 1.054, "step": 18988 }, { "epoch": 0.36, "learning_rate": 3.7153569954442374e-06, "loss": 0.9698, "step": 18989 }, { "epoch": 0.36, "learning_rate": 3.7152234945243446e-06, "loss": 1.0673, "step": 18990 }, { "epoch": 0.36, "learning_rate": 3.7150899890668455e-06, "loss": 1.0043, "step": 18991 }, { "epoch": 0.36, "learning_rate": 3.714956479072237e-06, "loss": 0.7839, "step": 18992 }, { "epoch": 0.36, "learning_rate": 3.7148229645410184e-06, "loss": 1.3225, "step": 18993 }, { "epoch": 0.36, "learning_rate": 3.7146894454736883e-06, "loss": 1.1277, "step": 18994 }, { "epoch": 0.36, "learning_rate": 3.714555921870745e-06, "loss": 0.817, "step": 18995 }, { "epoch": 0.36, "learning_rate": 3.7144223937326862e-06, "loss": 0.9636, "step": 18996 }, { "epoch": 0.36, "learning_rate": 3.7142888610600126e-06, "loss": 1.034, "step": 18997 }, { "epoch": 0.36, "learning_rate": 3.714155323853221e-06, "loss": 0.9219, "step": 18998 }, { "epoch": 0.36, "learning_rate": 3.714021782112811e-06, "loss": 1.174, "step": 18999 }, { "epoch": 0.36, "learning_rate": 3.713888235839281e-06, "loss": 1.1899, "step": 19000 }, { "epoch": 0.36, "learning_rate": 3.7137546850331285e-06, "loss": 0.9758, "step": 19001 }, { "epoch": 0.36, "learning_rate": 3.7136211296948544e-06, "loss": 0.8071, "step": 19002 }, { "epoch": 0.36, "learning_rate": 3.713487569824956e-06, "loss": 0.9697, "step": 19003 }, { "epoch": 0.36, "learning_rate": 3.713354005423932e-06, "loss": 1.0405, "step": 19004 }, { "epoch": 0.36, "learning_rate": 3.7132204364922815e-06, "loss": 0.8376, "step": 19005 }, { "epoch": 0.36, "learning_rate": 3.713086863030503e-06, "loss": 1.1259, "step": 19006 }, { "epoch": 0.36, "learning_rate": 3.712953285039095e-06, "loss": 0.9636, "step": 19007 }, { "epoch": 0.36, "learning_rate": 3.7128197025185565e-06, "loss": 0.9219, "step": 19008 }, { "epoch": 0.36, "learning_rate": 3.7126861154693873e-06, "loss": 0.669, "step": 19009 }, { "epoch": 0.36, "learning_rate": 3.7125525238920846e-06, "loss": 0.9555, "step": 19010 }, { "epoch": 0.36, "learning_rate": 3.712418927787148e-06, "loss": 0.7602, "step": 19011 }, { "epoch": 0.36, "learning_rate": 3.7122853271550776e-06, "loss": 0.9929, "step": 19012 }, { "epoch": 0.36, "learning_rate": 3.7121517219963686e-06, "loss": 1.1334, "step": 19013 }, { "epoch": 0.36, "learning_rate": 3.712018112311524e-06, "loss": 1.074, "step": 19014 }, { "epoch": 0.36, "learning_rate": 3.7118844981010403e-06, "loss": 0.907, "step": 19015 }, { "epoch": 0.36, "learning_rate": 3.711750879365417e-06, "loss": 0.9545, "step": 19016 }, { "epoch": 0.36, "learning_rate": 3.7116172561051533e-06, "loss": 0.8972, "step": 19017 }, { "epoch": 0.36, "learning_rate": 3.7114836283207484e-06, "loss": 0.9452, "step": 19018 }, { "epoch": 0.36, "learning_rate": 3.7113499960127004e-06, "loss": 1.2409, "step": 19019 }, { "epoch": 0.36, "learning_rate": 3.711216359181508e-06, "loss": 0.9153, "step": 19020 }, { "epoch": 0.36, "learning_rate": 3.7110827178276717e-06, "loss": 1.0142, "step": 19021 }, { "epoch": 0.36, "learning_rate": 3.7109490719516887e-06, "loss": 0.9471, "step": 19022 }, { "epoch": 0.36, "learning_rate": 3.71081542155406e-06, "loss": 1.0739, "step": 19023 }, { "epoch": 0.36, "learning_rate": 3.7106817666352836e-06, "loss": 1.0995, "step": 19024 }, { "epoch": 0.36, "learning_rate": 3.7105481071958577e-06, "loss": 1.1207, "step": 19025 }, { "epoch": 0.36, "learning_rate": 3.7104144432362833e-06, "loss": 1.0934, "step": 19026 }, { "epoch": 0.36, "learning_rate": 3.7102807747570575e-06, "loss": 0.9768, "step": 19027 }, { "epoch": 0.36, "learning_rate": 3.710147101758681e-06, "loss": 0.9267, "step": 19028 }, { "epoch": 0.36, "learning_rate": 3.7100134242416518e-06, "loss": 0.8954, "step": 19029 }, { "epoch": 0.36, "learning_rate": 3.7098797422064705e-06, "loss": 0.9414, "step": 19030 }, { "epoch": 0.36, "learning_rate": 3.7097460556536347e-06, "loss": 0.957, "step": 19031 }, { "epoch": 0.36, "learning_rate": 3.7096123645836446e-06, "loss": 0.8169, "step": 19032 }, { "epoch": 0.36, "learning_rate": 3.7094786689969988e-06, "loss": 0.8696, "step": 19033 }, { "epoch": 0.36, "learning_rate": 3.7093449688941964e-06, "loss": 1.0472, "step": 19034 }, { "epoch": 0.36, "learning_rate": 3.7092112642757374e-06, "loss": 0.6652, "step": 19035 }, { "epoch": 0.36, "learning_rate": 3.7090775551421205e-06, "loss": 0.8941, "step": 19036 }, { "epoch": 0.36, "learning_rate": 3.708943841493845e-06, "loss": 1.2748, "step": 19037 }, { "epoch": 0.36, "learning_rate": 3.70881012333141e-06, "loss": 1.137, "step": 19038 }, { "epoch": 0.36, "learning_rate": 3.708676400655316e-06, "loss": 0.9286, "step": 19039 }, { "epoch": 0.36, "learning_rate": 3.7085426734660607e-06, "loss": 0.8453, "step": 19040 }, { "epoch": 0.36, "learning_rate": 3.7084089417641432e-06, "loss": 0.7029, "step": 19041 }, { "epoch": 0.36, "learning_rate": 3.708275205550065e-06, "loss": 0.7769, "step": 19042 }, { "epoch": 0.36, "learning_rate": 3.708141464824324e-06, "loss": 0.8151, "step": 19043 }, { "epoch": 0.36, "learning_rate": 3.7080077195874204e-06, "loss": 1.0801, "step": 19044 }, { "epoch": 0.36, "learning_rate": 3.7078739698398527e-06, "loss": 0.8767, "step": 19045 }, { "epoch": 0.36, "learning_rate": 3.70774021558212e-06, "loss": 0.7532, "step": 19046 }, { "epoch": 0.36, "learning_rate": 3.707606456814723e-06, "loss": 1.0151, "step": 19047 }, { "epoch": 0.36, "learning_rate": 3.70747269353816e-06, "loss": 0.6654, "step": 19048 }, { "epoch": 0.36, "learning_rate": 3.7073389257529307e-06, "loss": 0.9575, "step": 19049 }, { "epoch": 0.36, "learning_rate": 3.7072051534595355e-06, "loss": 1.1104, "step": 19050 }, { "epoch": 0.36, "learning_rate": 3.7070713766584736e-06, "loss": 0.9471, "step": 19051 }, { "epoch": 0.36, "learning_rate": 3.7069375953502436e-06, "loss": 1.0345, "step": 19052 }, { "epoch": 0.36, "learning_rate": 3.7068038095353455e-06, "loss": 0.8456, "step": 19053 }, { "epoch": 0.36, "learning_rate": 3.7066700192142792e-06, "loss": 0.8483, "step": 19054 }, { "epoch": 0.36, "learning_rate": 3.706536224387544e-06, "loss": 0.9112, "step": 19055 }, { "epoch": 0.36, "learning_rate": 3.7064024250556395e-06, "loss": 1.0635, "step": 19056 }, { "epoch": 0.36, "learning_rate": 3.7062686212190656e-06, "loss": 0.9838, "step": 19057 }, { "epoch": 0.36, "learning_rate": 3.7061348128783215e-06, "loss": 0.8391, "step": 19058 }, { "epoch": 0.36, "learning_rate": 3.706001000033907e-06, "loss": 1.0256, "step": 19059 }, { "epoch": 0.36, "learning_rate": 3.7058671826863226e-06, "loss": 0.9437, "step": 19060 }, { "epoch": 0.36, "learning_rate": 3.705733360836066e-06, "loss": 1.0028, "step": 19061 }, { "epoch": 0.36, "learning_rate": 3.7055995344836384e-06, "loss": 1.1528, "step": 19062 }, { "epoch": 0.36, "learning_rate": 3.7054657036295383e-06, "loss": 0.8924, "step": 19063 }, { "epoch": 0.36, "learning_rate": 3.7053318682742666e-06, "loss": 1.0443, "step": 19064 }, { "epoch": 0.36, "learning_rate": 3.7051980284183235e-06, "loss": 1.0676, "step": 19065 }, { "epoch": 0.36, "learning_rate": 3.705064184062207e-06, "loss": 0.991, "step": 19066 }, { "epoch": 0.36, "learning_rate": 3.704930335206418e-06, "loss": 0.7605, "step": 19067 }, { "epoch": 0.36, "learning_rate": 3.7047964818514565e-06, "loss": 0.9047, "step": 19068 }, { "epoch": 0.36, "learning_rate": 3.7046626239978212e-06, "loss": 0.9298, "step": 19069 }, { "epoch": 0.36, "learning_rate": 3.704528761646013e-06, "loss": 1.0755, "step": 19070 }, { "epoch": 0.36, "learning_rate": 3.704394894796532e-06, "loss": 0.9346, "step": 19071 }, { "epoch": 0.36, "learning_rate": 3.7042610234498766e-06, "loss": 0.7427, "step": 19072 }, { "epoch": 0.36, "learning_rate": 3.7041271476065473e-06, "loss": 0.8138, "step": 19073 }, { "epoch": 0.36, "learning_rate": 3.7039932672670448e-06, "loss": 0.9946, "step": 19074 }, { "epoch": 0.36, "learning_rate": 3.7038593824318674e-06, "loss": 1.1849, "step": 19075 }, { "epoch": 0.36, "learning_rate": 3.7037254931015163e-06, "loss": 0.9293, "step": 19076 }, { "epoch": 0.36, "learning_rate": 3.703591599276492e-06, "loss": 1.1238, "step": 19077 }, { "epoch": 0.36, "learning_rate": 3.7034577009572926e-06, "loss": 0.7999, "step": 19078 }, { "epoch": 0.36, "learning_rate": 3.703323798144419e-06, "loss": 1.1308, "step": 19079 }, { "epoch": 0.36, "learning_rate": 3.7031898908383724e-06, "loss": 0.9429, "step": 19080 }, { "epoch": 0.36, "learning_rate": 3.7030559790396507e-06, "loss": 1.0266, "step": 19081 }, { "epoch": 0.36, "learning_rate": 3.702922062748755e-06, "loss": 0.7728, "step": 19082 }, { "epoch": 0.36, "learning_rate": 3.7027881419661847e-06, "loss": 0.9687, "step": 19083 }, { "epoch": 0.36, "learning_rate": 3.702654216692441e-06, "loss": 0.8515, "step": 19084 }, { "epoch": 0.36, "learning_rate": 3.702520286928023e-06, "loss": 0.7009, "step": 19085 }, { "epoch": 0.36, "learning_rate": 3.702386352673432e-06, "loss": 0.8309, "step": 19086 }, { "epoch": 0.36, "learning_rate": 3.7022524139291665e-06, "loss": 1.0811, "step": 19087 }, { "epoch": 0.36, "learning_rate": 3.702118470695727e-06, "loss": 0.8877, "step": 19088 }, { "epoch": 0.36, "learning_rate": 3.7019845229736147e-06, "loss": 0.7401, "step": 19089 }, { "epoch": 0.36, "learning_rate": 3.7018505707633284e-06, "loss": 0.8977, "step": 19090 }, { "epoch": 0.36, "learning_rate": 3.7017166140653693e-06, "loss": 0.8978, "step": 19091 }, { "epoch": 0.36, "learning_rate": 3.7015826528802375e-06, "loss": 0.9294, "step": 19092 }, { "epoch": 0.36, "learning_rate": 3.701448687208432e-06, "loss": 1.0991, "step": 19093 }, { "epoch": 0.36, "learning_rate": 3.7013147170504547e-06, "loss": 0.8344, "step": 19094 }, { "epoch": 0.36, "learning_rate": 3.7011807424068054e-06, "loss": 0.9777, "step": 19095 }, { "epoch": 0.36, "learning_rate": 3.701046763277983e-06, "loss": 0.9538, "step": 19096 }, { "epoch": 0.36, "learning_rate": 3.7009127796644888e-06, "loss": 0.8518, "step": 19097 }, { "epoch": 0.36, "learning_rate": 3.7007787915668243e-06, "loss": 1.0522, "step": 19098 }, { "epoch": 0.36, "learning_rate": 3.7006447989854875e-06, "loss": 1.1512, "step": 19099 }, { "epoch": 0.36, "learning_rate": 3.7005108019209807e-06, "loss": 0.9167, "step": 19100 }, { "epoch": 0.36, "learning_rate": 3.7003768003738027e-06, "loss": 0.9224, "step": 19101 }, { "epoch": 0.36, "learning_rate": 3.700242794344455e-06, "loss": 0.8751, "step": 19102 }, { "epoch": 0.36, "learning_rate": 3.700108783833437e-06, "loss": 0.7506, "step": 19103 }, { "epoch": 0.36, "learning_rate": 3.6999747688412504e-06, "loss": 0.8544, "step": 19104 }, { "epoch": 0.36, "learning_rate": 3.699840749368394e-06, "loss": 1.0072, "step": 19105 }, { "epoch": 0.36, "learning_rate": 3.699706725415369e-06, "loss": 1.3072, "step": 19106 }, { "epoch": 0.36, "learning_rate": 3.6995726969826766e-06, "loss": 1.0523, "step": 19107 }, { "epoch": 0.36, "learning_rate": 3.699438664070816e-06, "loss": 0.9513, "step": 19108 }, { "epoch": 0.36, "learning_rate": 3.6993046266802885e-06, "loss": 1.0245, "step": 19109 }, { "epoch": 0.36, "learning_rate": 3.699170584811594e-06, "loss": 0.7985, "step": 19110 }, { "epoch": 0.36, "learning_rate": 3.699036538465233e-06, "loss": 1.0786, "step": 19111 }, { "epoch": 0.36, "learning_rate": 3.6989024876417067e-06, "loss": 1.1657, "step": 19112 }, { "epoch": 0.36, "learning_rate": 3.6987684323415155e-06, "loss": 0.9177, "step": 19113 }, { "epoch": 0.36, "learning_rate": 3.6986343725651597e-06, "loss": 1.0187, "step": 19114 }, { "epoch": 0.36, "learning_rate": 3.6985003083131397e-06, "loss": 1.1092, "step": 19115 }, { "epoch": 0.36, "learning_rate": 3.6983662395859567e-06, "loss": 1.1064, "step": 19116 }, { "epoch": 0.36, "learning_rate": 3.6982321663841104e-06, "loss": 0.8237, "step": 19117 }, { "epoch": 0.36, "learning_rate": 3.6980980887081014e-06, "loss": 1.0689, "step": 19118 }, { "epoch": 0.36, "learning_rate": 3.697964006558432e-06, "loss": 0.8944, "step": 19119 }, { "epoch": 0.36, "learning_rate": 3.6978299199356015e-06, "loss": 0.8723, "step": 19120 }, { "epoch": 0.36, "learning_rate": 3.6976958288401104e-06, "loss": 0.8331, "step": 19121 }, { "epoch": 0.36, "learning_rate": 3.69756173327246e-06, "loss": 0.9026, "step": 19122 }, { "epoch": 0.36, "learning_rate": 3.697427633233151e-06, "loss": 1.1743, "step": 19123 }, { "epoch": 0.36, "learning_rate": 3.6972935287226834e-06, "loss": 0.8146, "step": 19124 }, { "epoch": 0.36, "learning_rate": 3.697159419741559e-06, "loss": 1.2034, "step": 19125 }, { "epoch": 0.36, "learning_rate": 3.6970253062902774e-06, "loss": 0.9063, "step": 19126 }, { "epoch": 0.36, "learning_rate": 3.69689118836934e-06, "loss": 0.8658, "step": 19127 }, { "epoch": 0.36, "learning_rate": 3.696757065979249e-06, "loss": 0.9542, "step": 19128 }, { "epoch": 0.36, "learning_rate": 3.696622939120503e-06, "loss": 1.0493, "step": 19129 }, { "epoch": 0.36, "learning_rate": 3.696488807793603e-06, "loss": 1.155, "step": 19130 }, { "epoch": 0.36, "learning_rate": 3.6963546719990507e-06, "loss": 0.847, "step": 19131 }, { "epoch": 0.36, "learning_rate": 3.696220531737347e-06, "loss": 1.0891, "step": 19132 }, { "epoch": 0.36, "learning_rate": 3.6960863870089924e-06, "loss": 0.8784, "step": 19133 }, { "epoch": 0.36, "learning_rate": 3.6959522378144884e-06, "loss": 1.0827, "step": 19134 }, { "epoch": 0.36, "learning_rate": 3.695818084154335e-06, "loss": 0.8597, "step": 19135 }, { "epoch": 0.36, "learning_rate": 3.6956839260290333e-06, "loss": 0.8728, "step": 19136 }, { "epoch": 0.36, "learning_rate": 3.695549763439085e-06, "loss": 1.1981, "step": 19137 }, { "epoch": 0.36, "learning_rate": 3.69541559638499e-06, "loss": 1.1453, "step": 19138 }, { "epoch": 0.36, "learning_rate": 3.69528142486725e-06, "loss": 1.1219, "step": 19139 }, { "epoch": 0.36, "learning_rate": 3.695147248886366e-06, "loss": 0.9098, "step": 19140 }, { "epoch": 0.36, "learning_rate": 3.6950130684428387e-06, "loss": 0.7794, "step": 19141 }, { "epoch": 0.36, "learning_rate": 3.69487888353717e-06, "loss": 0.8548, "step": 19142 }, { "epoch": 0.36, "learning_rate": 3.6947446941698594e-06, "loss": 0.9037, "step": 19143 }, { "epoch": 0.36, "learning_rate": 3.6946105003414086e-06, "loss": 0.835, "step": 19144 }, { "epoch": 0.36, "learning_rate": 3.694476302052319e-06, "loss": 1.0462, "step": 19145 }, { "epoch": 0.36, "learning_rate": 3.694342099303091e-06, "loss": 1.0253, "step": 19146 }, { "epoch": 0.36, "learning_rate": 3.694207892094227e-06, "loss": 0.864, "step": 19147 }, { "epoch": 0.36, "learning_rate": 3.6940736804262267e-06, "loss": 0.9919, "step": 19148 }, { "epoch": 0.36, "learning_rate": 3.693939464299593e-06, "loss": 0.892, "step": 19149 }, { "epoch": 0.36, "learning_rate": 3.693805243714825e-06, "loss": 1.2741, "step": 19150 }, { "epoch": 0.36, "learning_rate": 3.693671018672425e-06, "loss": 0.8688, "step": 19151 }, { "epoch": 0.36, "learning_rate": 3.693536789172894e-06, "loss": 0.6475, "step": 19152 }, { "epoch": 0.36, "learning_rate": 3.693402555216733e-06, "loss": 1.0143, "step": 19153 }, { "epoch": 0.36, "learning_rate": 3.693268316804444e-06, "loss": 0.6802, "step": 19154 }, { "epoch": 0.36, "learning_rate": 3.693134073936527e-06, "loss": 1.0084, "step": 19155 }, { "epoch": 0.36, "learning_rate": 3.692999826613485e-06, "loss": 1.0924, "step": 19156 }, { "epoch": 0.36, "learning_rate": 3.692865574835817e-06, "loss": 1.1343, "step": 19157 }, { "epoch": 0.36, "learning_rate": 3.692731318604027e-06, "loss": 0.957, "step": 19158 }, { "epoch": 0.36, "learning_rate": 3.6925970579186134e-06, "loss": 0.7552, "step": 19159 }, { "epoch": 0.36, "learning_rate": 3.692462792780079e-06, "loss": 0.8024, "step": 19160 }, { "epoch": 0.36, "learning_rate": 3.692328523188926e-06, "loss": 0.8333, "step": 19161 }, { "epoch": 0.36, "learning_rate": 3.6921942491456543e-06, "loss": 1.1105, "step": 19162 }, { "epoch": 0.36, "learning_rate": 3.692059970650766e-06, "loss": 1.0344, "step": 19163 }, { "epoch": 0.36, "learning_rate": 3.6919256877047626e-06, "loss": 1.0197, "step": 19164 }, { "epoch": 0.36, "learning_rate": 3.691791400308145e-06, "loss": 0.7836, "step": 19165 }, { "epoch": 0.36, "learning_rate": 3.6916571084614144e-06, "loss": 1.012, "step": 19166 }, { "epoch": 0.36, "learning_rate": 3.691522812165073e-06, "loss": 1.0374, "step": 19167 }, { "epoch": 0.36, "learning_rate": 3.6913885114196217e-06, "loss": 1.1567, "step": 19168 }, { "epoch": 0.36, "learning_rate": 3.691254206225563e-06, "loss": 1.0678, "step": 19169 }, { "epoch": 0.36, "learning_rate": 3.691119896583397e-06, "loss": 0.9517, "step": 19170 }, { "epoch": 0.36, "learning_rate": 3.6909855824936266e-06, "loss": 0.9639, "step": 19171 }, { "epoch": 0.36, "learning_rate": 3.6908512639567517e-06, "loss": 0.9479, "step": 19172 }, { "epoch": 0.36, "learning_rate": 3.6907169409732744e-06, "loss": 0.846, "step": 19173 }, { "epoch": 0.36, "learning_rate": 3.690582613543697e-06, "loss": 1.221, "step": 19174 }, { "epoch": 0.36, "learning_rate": 3.6904482816685207e-06, "loss": 1.1024, "step": 19175 }, { "epoch": 0.36, "learning_rate": 3.690313945348247e-06, "loss": 1.0839, "step": 19176 }, { "epoch": 0.36, "learning_rate": 3.6901796045833782e-06, "loss": 0.9587, "step": 19177 }, { "epoch": 0.36, "learning_rate": 3.6900452593744146e-06, "loss": 0.9712, "step": 19178 }, { "epoch": 0.36, "learning_rate": 3.689910909721858e-06, "loss": 0.8505, "step": 19179 }, { "epoch": 0.36, "learning_rate": 3.689776555626211e-06, "loss": 0.8679, "step": 19180 }, { "epoch": 0.36, "learning_rate": 3.6896421970879752e-06, "loss": 1.0863, "step": 19181 }, { "epoch": 0.36, "learning_rate": 3.6895078341076514e-06, "loss": 0.9395, "step": 19182 }, { "epoch": 0.36, "learning_rate": 3.6893734666857417e-06, "loss": 0.8938, "step": 19183 }, { "epoch": 0.36, "learning_rate": 3.6892390948227484e-06, "loss": 1.0806, "step": 19184 }, { "epoch": 0.36, "learning_rate": 3.689104718519173e-06, "loss": 0.8723, "step": 19185 }, { "epoch": 0.36, "learning_rate": 3.6889703377755163e-06, "loss": 0.881, "step": 19186 }, { "epoch": 0.36, "learning_rate": 3.688835952592281e-06, "loss": 0.9517, "step": 19187 }, { "epoch": 0.36, "learning_rate": 3.688701562969969e-06, "loss": 0.9256, "step": 19188 }, { "epoch": 0.36, "learning_rate": 3.688567168909082e-06, "loss": 0.9871, "step": 19189 }, { "epoch": 0.36, "learning_rate": 3.6884327704101213e-06, "loss": 0.8716, "step": 19190 }, { "epoch": 0.36, "learning_rate": 3.688298367473589e-06, "loss": 0.9701, "step": 19191 }, { "epoch": 0.36, "learning_rate": 3.688163960099987e-06, "loss": 0.8668, "step": 19192 }, { "epoch": 0.36, "learning_rate": 3.688029548289817e-06, "loss": 1.3322, "step": 19193 }, { "epoch": 0.36, "learning_rate": 3.687895132043581e-06, "loss": 1.1183, "step": 19194 }, { "epoch": 0.36, "learning_rate": 3.687760711361782e-06, "loss": 0.9326, "step": 19195 }, { "epoch": 0.36, "learning_rate": 3.6876262862449208e-06, "loss": 0.9488, "step": 19196 }, { "epoch": 0.36, "learning_rate": 3.6874918566934984e-06, "loss": 1.0922, "step": 19197 }, { "epoch": 0.36, "learning_rate": 3.6873574227080183e-06, "loss": 0.9598, "step": 19198 }, { "epoch": 0.36, "learning_rate": 3.6872229842889826e-06, "loss": 0.9786, "step": 19199 }, { "epoch": 0.36, "learning_rate": 3.6870885414368916e-06, "loss": 0.8572, "step": 19200 }, { "epoch": 0.36, "learning_rate": 3.6869540941522484e-06, "loss": 0.8725, "step": 19201 }, { "epoch": 0.36, "learning_rate": 3.686819642435556e-06, "loss": 0.8927, "step": 19202 }, { "epoch": 0.36, "learning_rate": 3.6866851862873153e-06, "loss": 0.9365, "step": 19203 }, { "epoch": 0.36, "learning_rate": 3.686550725708028e-06, "loss": 0.7263, "step": 19204 }, { "epoch": 0.36, "learning_rate": 3.6864162606981975e-06, "loss": 0.9683, "step": 19205 }, { "epoch": 0.36, "learning_rate": 3.686281791258324e-06, "loss": 1.0998, "step": 19206 }, { "epoch": 0.36, "learning_rate": 3.686147317388911e-06, "loss": 1.0315, "step": 19207 }, { "epoch": 0.36, "learning_rate": 3.68601283909046e-06, "loss": 0.966, "step": 19208 }, { "epoch": 0.36, "learning_rate": 3.685878356363474e-06, "loss": 0.9948, "step": 19209 }, { "epoch": 0.36, "learning_rate": 3.6857438692084547e-06, "loss": 0.9282, "step": 19210 }, { "epoch": 0.36, "learning_rate": 3.685609377625904e-06, "loss": 1.0241, "step": 19211 }, { "epoch": 0.36, "learning_rate": 3.685474881616324e-06, "loss": 1.246, "step": 19212 }, { "epoch": 0.36, "learning_rate": 3.685340381180217e-06, "loss": 1.0315, "step": 19213 }, { "epoch": 0.36, "learning_rate": 3.6852058763180855e-06, "loss": 0.8872, "step": 19214 }, { "epoch": 0.36, "learning_rate": 3.685071367030432e-06, "loss": 0.9774, "step": 19215 }, { "epoch": 0.36, "learning_rate": 3.6849368533177575e-06, "loss": 0.8667, "step": 19216 }, { "epoch": 0.36, "learning_rate": 3.684802335180566e-06, "loss": 0.9919, "step": 19217 }, { "epoch": 0.36, "learning_rate": 3.6846678126193587e-06, "loss": 0.9247, "step": 19218 }, { "epoch": 0.36, "learning_rate": 3.6845332856346377e-06, "loss": 0.964, "step": 19219 }, { "epoch": 0.36, "learning_rate": 3.684398754226906e-06, "loss": 0.953, "step": 19220 }, { "epoch": 0.36, "learning_rate": 3.684264218396666e-06, "loss": 0.9695, "step": 19221 }, { "epoch": 0.36, "learning_rate": 3.6841296781444186e-06, "loss": 0.7358, "step": 19222 }, { "epoch": 0.36, "learning_rate": 3.683995133470668e-06, "loss": 0.8057, "step": 19223 }, { "epoch": 0.36, "learning_rate": 3.6838605843759164e-06, "loss": 1.1306, "step": 19224 }, { "epoch": 0.36, "learning_rate": 3.683726030860665e-06, "loss": 1.0155, "step": 19225 }, { "epoch": 0.36, "learning_rate": 3.6835914729254175e-06, "loss": 1.0256, "step": 19226 }, { "epoch": 0.36, "learning_rate": 3.683456910570675e-06, "loss": 0.9669, "step": 19227 }, { "epoch": 0.36, "learning_rate": 3.6833223437969413e-06, "loss": 1.0455, "step": 19228 }, { "epoch": 0.36, "learning_rate": 3.683187772604718e-06, "loss": 0.9172, "step": 19229 }, { "epoch": 0.36, "learning_rate": 3.6830531969945073e-06, "loss": 0.998, "step": 19230 }, { "epoch": 0.36, "learning_rate": 3.6829186169668124e-06, "loss": 1.087, "step": 19231 }, { "epoch": 0.36, "learning_rate": 3.6827840325221363e-06, "loss": 0.9231, "step": 19232 }, { "epoch": 0.36, "learning_rate": 3.6826494436609805e-06, "loss": 0.8155, "step": 19233 }, { "epoch": 0.36, "learning_rate": 3.682514850383848e-06, "loss": 0.9751, "step": 19234 }, { "epoch": 0.36, "learning_rate": 3.682380252691241e-06, "loss": 0.8451, "step": 19235 }, { "epoch": 0.36, "learning_rate": 3.6822456505836627e-06, "loss": 0.9619, "step": 19236 }, { "epoch": 0.36, "learning_rate": 3.6821110440616154e-06, "loss": 1.0626, "step": 19237 }, { "epoch": 0.36, "learning_rate": 3.6819764331256023e-06, "loss": 0.9178, "step": 19238 }, { "epoch": 0.36, "learning_rate": 3.6818418177761245e-06, "loss": 1.0127, "step": 19239 }, { "epoch": 0.36, "learning_rate": 3.681707198013686e-06, "loss": 0.8591, "step": 19240 }, { "epoch": 0.36, "learning_rate": 3.681572573838789e-06, "loss": 0.7545, "step": 19241 }, { "epoch": 0.36, "learning_rate": 3.6814379452519367e-06, "loss": 0.8571, "step": 19242 }, { "epoch": 0.36, "learning_rate": 3.68130331225363e-06, "loss": 0.8316, "step": 19243 }, { "epoch": 0.36, "learning_rate": 3.681168674844374e-06, "loss": 0.7984, "step": 19244 }, { "epoch": 0.36, "learning_rate": 3.6810340330246704e-06, "loss": 1.0379, "step": 19245 }, { "epoch": 0.36, "learning_rate": 3.6808993867950216e-06, "loss": 0.8285, "step": 19246 }, { "epoch": 0.36, "learning_rate": 3.680764736155931e-06, "loss": 0.9014, "step": 19247 }, { "epoch": 0.36, "learning_rate": 3.680630081107901e-06, "loss": 0.9199, "step": 19248 }, { "epoch": 0.36, "learning_rate": 3.6804954216514344e-06, "loss": 0.9963, "step": 19249 }, { "epoch": 0.36, "learning_rate": 3.6803607577870336e-06, "loss": 1.0087, "step": 19250 }, { "epoch": 0.36, "learning_rate": 3.680226089515202e-06, "loss": 0.8908, "step": 19251 }, { "epoch": 0.36, "learning_rate": 3.6800914168364433e-06, "loss": 0.7367, "step": 19252 }, { "epoch": 0.36, "learning_rate": 3.679956739751259e-06, "loss": 0.8864, "step": 19253 }, { "epoch": 0.36, "learning_rate": 3.679822058260152e-06, "loss": 0.655, "step": 19254 }, { "epoch": 0.36, "learning_rate": 3.679687372363626e-06, "loss": 0.9114, "step": 19255 }, { "epoch": 0.36, "learning_rate": 3.6795526820621828e-06, "loss": 1.1688, "step": 19256 }, { "epoch": 0.36, "learning_rate": 3.679417987356327e-06, "loss": 0.8872, "step": 19257 }, { "epoch": 0.36, "learning_rate": 3.6792832882465603e-06, "loss": 0.8177, "step": 19258 }, { "epoch": 0.36, "learning_rate": 3.6791485847333862e-06, "loss": 0.7519, "step": 19259 }, { "epoch": 0.36, "learning_rate": 3.6790138768173074e-06, "loss": 0.7958, "step": 19260 }, { "epoch": 0.36, "learning_rate": 3.6788791644988264e-06, "loss": 0.7158, "step": 19261 }, { "epoch": 0.36, "learning_rate": 3.6787444477784474e-06, "loss": 1.0723, "step": 19262 }, { "epoch": 0.36, "learning_rate": 3.678609726656672e-06, "loss": 0.9931, "step": 19263 }, { "epoch": 0.36, "learning_rate": 3.6784750011340043e-06, "loss": 1.1168, "step": 19264 }, { "epoch": 0.36, "learning_rate": 3.6783402712109473e-06, "loss": 1.104, "step": 19265 }, { "epoch": 0.36, "learning_rate": 3.678205536888004e-06, "loss": 1.0495, "step": 19266 }, { "epoch": 0.36, "learning_rate": 3.6780707981656764e-06, "loss": 0.7033, "step": 19267 }, { "epoch": 0.36, "learning_rate": 3.6779360550444697e-06, "loss": 1.2352, "step": 19268 }, { "epoch": 0.36, "learning_rate": 3.677801307524886e-06, "loss": 1.0887, "step": 19269 }, { "epoch": 0.36, "learning_rate": 3.6776665556074275e-06, "loss": 0.8585, "step": 19270 }, { "epoch": 0.36, "learning_rate": 3.6775317992925984e-06, "loss": 0.8869, "step": 19271 }, { "epoch": 0.36, "learning_rate": 3.6773970385809017e-06, "loss": 1.0854, "step": 19272 }, { "epoch": 0.36, "learning_rate": 3.6772622734728402e-06, "loss": 0.7651, "step": 19273 }, { "epoch": 0.36, "learning_rate": 3.6771275039689187e-06, "loss": 0.9092, "step": 19274 }, { "epoch": 0.36, "learning_rate": 3.6769927300696378e-06, "loss": 1.2125, "step": 19275 }, { "epoch": 0.36, "learning_rate": 3.6768579517755026e-06, "loss": 0.8948, "step": 19276 }, { "epoch": 0.36, "learning_rate": 3.676723169087016e-06, "loss": 0.8852, "step": 19277 }, { "epoch": 0.36, "learning_rate": 3.676588382004681e-06, "loss": 0.979, "step": 19278 }, { "epoch": 0.36, "learning_rate": 3.676453590529001e-06, "loss": 0.7417, "step": 19279 }, { "epoch": 0.36, "learning_rate": 3.67631879466048e-06, "loss": 0.8378, "step": 19280 }, { "epoch": 0.36, "learning_rate": 3.67618399439962e-06, "loss": 1.2972, "step": 19281 }, { "epoch": 0.36, "learning_rate": 3.676049189746925e-06, "loss": 0.9951, "step": 19282 }, { "epoch": 0.36, "learning_rate": 3.6759143807028996e-06, "loss": 1.0262, "step": 19283 }, { "epoch": 0.36, "learning_rate": 3.6757795672680454e-06, "loss": 1.0172, "step": 19284 }, { "epoch": 0.36, "learning_rate": 3.675644749442865e-06, "loss": 0.9523, "step": 19285 }, { "epoch": 0.36, "learning_rate": 3.6755099272278645e-06, "loss": 0.7423, "step": 19286 }, { "epoch": 0.36, "learning_rate": 3.6753751006235457e-06, "loss": 1.0574, "step": 19287 }, { "epoch": 0.36, "learning_rate": 3.6752402696304117e-06, "loss": 1.0609, "step": 19288 }, { "epoch": 0.36, "learning_rate": 3.6751054342489678e-06, "loss": 0.929, "step": 19289 }, { "epoch": 0.36, "learning_rate": 3.6749705944797152e-06, "loss": 0.7653, "step": 19290 }, { "epoch": 0.36, "learning_rate": 3.6748357503231586e-06, "loss": 0.9161, "step": 19291 }, { "epoch": 0.36, "learning_rate": 3.6747009017798013e-06, "loss": 0.6933, "step": 19292 }, { "epoch": 0.36, "learning_rate": 3.674566048850147e-06, "loss": 1.0162, "step": 19293 }, { "epoch": 0.36, "learning_rate": 3.6744311915347e-06, "loss": 1.0207, "step": 19294 }, { "epoch": 0.36, "learning_rate": 3.674296329833962e-06, "loss": 1.0515, "step": 19295 }, { "epoch": 0.36, "learning_rate": 3.674161463748437e-06, "loss": 0.9149, "step": 19296 }, { "epoch": 0.36, "learning_rate": 3.67402659327863e-06, "loss": 0.9959, "step": 19297 }, { "epoch": 0.36, "learning_rate": 3.6738917184250427e-06, "loss": 0.9029, "step": 19298 }, { "epoch": 0.36, "learning_rate": 3.6737568391881808e-06, "loss": 1.0024, "step": 19299 }, { "epoch": 0.36, "learning_rate": 3.6736219555685467e-06, "loss": 1.1362, "step": 19300 }, { "epoch": 0.36, "learning_rate": 3.6734870675666433e-06, "loss": 0.9805, "step": 19301 }, { "epoch": 0.36, "learning_rate": 3.6733521751829757e-06, "loss": 0.9736, "step": 19302 }, { "epoch": 0.36, "learning_rate": 3.6732172784180476e-06, "loss": 1.1381, "step": 19303 }, { "epoch": 0.36, "learning_rate": 3.6730823772723617e-06, "loss": 0.8722, "step": 19304 }, { "epoch": 0.36, "learning_rate": 3.672947471746422e-06, "loss": 1.0234, "step": 19305 }, { "epoch": 0.36, "learning_rate": 3.6728125618407327e-06, "loss": 1.1452, "step": 19306 }, { "epoch": 0.36, "learning_rate": 3.6726776475557967e-06, "loss": 0.9217, "step": 19307 }, { "epoch": 0.36, "learning_rate": 3.672542728892119e-06, "loss": 1.0388, "step": 19308 }, { "epoch": 0.36, "learning_rate": 3.6724078058502026e-06, "loss": 0.7988, "step": 19309 }, { "epoch": 0.36, "learning_rate": 3.672272878430551e-06, "loss": 0.8441, "step": 19310 }, { "epoch": 0.36, "learning_rate": 3.672137946633669e-06, "loss": 1.0876, "step": 19311 }, { "epoch": 0.36, "learning_rate": 3.672003010460059e-06, "loss": 0.9471, "step": 19312 }, { "epoch": 0.36, "learning_rate": 3.671868069910226e-06, "loss": 1.1049, "step": 19313 }, { "epoch": 0.36, "learning_rate": 3.671733124984674e-06, "loss": 0.7459, "step": 19314 }, { "epoch": 0.36, "learning_rate": 3.6715981756839062e-06, "loss": 1.0975, "step": 19315 }, { "epoch": 0.36, "learning_rate": 3.671463222008427e-06, "loss": 0.7931, "step": 19316 }, { "epoch": 0.36, "learning_rate": 3.67132826395874e-06, "loss": 0.8222, "step": 19317 }, { "epoch": 0.36, "learning_rate": 3.6711933015353492e-06, "loss": 1.0152, "step": 19318 }, { "epoch": 0.36, "learning_rate": 3.6710583347387573e-06, "loss": 1.0274, "step": 19319 }, { "epoch": 0.36, "learning_rate": 3.670923363569471e-06, "loss": 1.0194, "step": 19320 }, { "epoch": 0.36, "learning_rate": 3.670788388027992e-06, "loss": 0.9705, "step": 19321 }, { "epoch": 0.36, "learning_rate": 3.6706534081148253e-06, "loss": 0.916, "step": 19322 }, { "epoch": 0.36, "learning_rate": 3.6705184238304746e-06, "loss": 0.7851, "step": 19323 }, { "epoch": 0.36, "learning_rate": 3.670383435175444e-06, "loss": 1.094, "step": 19324 }, { "epoch": 0.36, "learning_rate": 3.6702484421502376e-06, "loss": 0.9542, "step": 19325 }, { "epoch": 0.36, "learning_rate": 3.6701134447553593e-06, "loss": 1.0318, "step": 19326 }, { "epoch": 0.36, "learning_rate": 3.669978442991313e-06, "loss": 0.9988, "step": 19327 }, { "epoch": 0.36, "learning_rate": 3.669843436858604e-06, "loss": 0.9733, "step": 19328 }, { "epoch": 0.36, "learning_rate": 3.6697084263577343e-06, "loss": 0.817, "step": 19329 }, { "epoch": 0.36, "learning_rate": 3.669573411489211e-06, "loss": 0.8612, "step": 19330 }, { "epoch": 0.36, "learning_rate": 3.6694383922535346e-06, "loss": 1.043, "step": 19331 }, { "epoch": 0.36, "learning_rate": 3.6693033686512113e-06, "loss": 0.9327, "step": 19332 }, { "epoch": 0.36, "learning_rate": 3.6691683406827457e-06, "loss": 1.0334, "step": 19333 }, { "epoch": 0.36, "learning_rate": 3.6690333083486414e-06, "loss": 0.899, "step": 19334 }, { "epoch": 0.36, "learning_rate": 3.668898271649402e-06, "loss": 0.8546, "step": 19335 }, { "epoch": 0.36, "learning_rate": 3.6687632305855333e-06, "loss": 0.9252, "step": 19336 }, { "epoch": 0.36, "learning_rate": 3.668628185157537e-06, "loss": 0.9834, "step": 19337 }, { "epoch": 0.36, "learning_rate": 3.6684931353659202e-06, "loss": 0.993, "step": 19338 }, { "epoch": 0.36, "learning_rate": 3.668358081211186e-06, "loss": 0.9591, "step": 19339 }, { "epoch": 0.36, "learning_rate": 3.668223022693837e-06, "loss": 0.8217, "step": 19340 }, { "epoch": 0.36, "learning_rate": 3.66808795981438e-06, "loss": 0.8924, "step": 19341 }, { "epoch": 0.36, "learning_rate": 3.6679528925733186e-06, "loss": 0.6881, "step": 19342 }, { "epoch": 0.36, "learning_rate": 3.667817820971157e-06, "loss": 1.0354, "step": 19343 }, { "epoch": 0.36, "learning_rate": 3.6676827450083984e-06, "loss": 1.028, "step": 19344 }, { "epoch": 0.36, "learning_rate": 3.6675476646855496e-06, "loss": 0.8824, "step": 19345 }, { "epoch": 0.36, "learning_rate": 3.667412580003113e-06, "loss": 0.8501, "step": 19346 }, { "epoch": 0.37, "learning_rate": 3.6672774909615928e-06, "loss": 0.9827, "step": 19347 }, { "epoch": 0.37, "learning_rate": 3.6671423975614956e-06, "loss": 0.8854, "step": 19348 }, { "epoch": 0.37, "learning_rate": 3.667007299803324e-06, "loss": 1.0261, "step": 19349 }, { "epoch": 0.37, "learning_rate": 3.6668721976875826e-06, "loss": 1.0975, "step": 19350 }, { "epoch": 0.37, "learning_rate": 3.666737091214777e-06, "loss": 0.8221, "step": 19351 }, { "epoch": 0.37, "learning_rate": 3.6666019803854103e-06, "loss": 0.9299, "step": 19352 }, { "epoch": 0.37, "learning_rate": 3.6664668651999874e-06, "loss": 1.0434, "step": 19353 }, { "epoch": 0.37, "learning_rate": 3.666331745659013e-06, "loss": 0.7409, "step": 19354 }, { "epoch": 0.37, "learning_rate": 3.6661966217629917e-06, "loss": 0.8514, "step": 19355 }, { "epoch": 0.37, "learning_rate": 3.6660614935124277e-06, "loss": 1.0359, "step": 19356 }, { "epoch": 0.37, "learning_rate": 3.6659263609078264e-06, "loss": 1.0016, "step": 19357 }, { "epoch": 0.37, "learning_rate": 3.665791223949692e-06, "loss": 1.0031, "step": 19358 }, { "epoch": 0.37, "learning_rate": 3.6656560826385286e-06, "loss": 0.9214, "step": 19359 }, { "epoch": 0.37, "learning_rate": 3.6655209369748405e-06, "loss": 0.969, "step": 19360 }, { "epoch": 0.37, "learning_rate": 3.6653857869591335e-06, "loss": 0.8312, "step": 19361 }, { "epoch": 0.37, "learning_rate": 3.6652506325919116e-06, "loss": 0.9573, "step": 19362 }, { "epoch": 0.37, "learning_rate": 3.6651154738736806e-06, "loss": 0.9295, "step": 19363 }, { "epoch": 0.37, "learning_rate": 3.664980310804943e-06, "loss": 0.8795, "step": 19364 }, { "epoch": 0.37, "learning_rate": 3.6648451433862047e-06, "loss": 0.8648, "step": 19365 }, { "epoch": 0.37, "learning_rate": 3.6647099716179708e-06, "loss": 0.8797, "step": 19366 }, { "epoch": 0.37, "learning_rate": 3.664574795500745e-06, "loss": 0.9248, "step": 19367 }, { "epoch": 0.37, "learning_rate": 3.6644396150350327e-06, "loss": 1.0397, "step": 19368 }, { "epoch": 0.37, "learning_rate": 3.6643044302213394e-06, "loss": 1.0801, "step": 19369 }, { "epoch": 0.37, "learning_rate": 3.6641692410601683e-06, "loss": 0.9395, "step": 19370 }, { "epoch": 0.37, "learning_rate": 3.664034047552025e-06, "loss": 0.8176, "step": 19371 }, { "epoch": 0.37, "learning_rate": 3.6638988496974145e-06, "loss": 0.8685, "step": 19372 }, { "epoch": 0.37, "learning_rate": 3.6637636474968415e-06, "loss": 0.8631, "step": 19373 }, { "epoch": 0.37, "learning_rate": 3.66362844095081e-06, "loss": 0.9056, "step": 19374 }, { "epoch": 0.37, "learning_rate": 3.663493230059826e-06, "loss": 0.9146, "step": 19375 }, { "epoch": 0.37, "learning_rate": 3.663358014824394e-06, "loss": 1.0718, "step": 19376 }, { "epoch": 0.37, "learning_rate": 3.6632227952450184e-06, "loss": 0.9023, "step": 19377 }, { "epoch": 0.37, "learning_rate": 3.663087571322206e-06, "loss": 0.8075, "step": 19378 }, { "epoch": 0.37, "learning_rate": 3.6629523430564585e-06, "loss": 0.9583, "step": 19379 }, { "epoch": 0.37, "learning_rate": 3.6628171104482836e-06, "loss": 0.8649, "step": 19380 }, { "epoch": 0.37, "learning_rate": 3.662681873498185e-06, "loss": 1.1217, "step": 19381 }, { "epoch": 0.37, "learning_rate": 3.662546632206668e-06, "loss": 0.999, "step": 19382 }, { "epoch": 0.37, "learning_rate": 3.6624113865742374e-06, "loss": 1.016, "step": 19383 }, { "epoch": 0.37, "learning_rate": 3.662276136601398e-06, "loss": 0.8891, "step": 19384 }, { "epoch": 0.37, "learning_rate": 3.662140882288656e-06, "loss": 0.8434, "step": 19385 }, { "epoch": 0.37, "learning_rate": 3.6620056236365148e-06, "loss": 0.889, "step": 19386 }, { "epoch": 0.37, "learning_rate": 3.6618703606454807e-06, "loss": 0.9455, "step": 19387 }, { "epoch": 0.37, "learning_rate": 3.6617350933160582e-06, "loss": 0.8788, "step": 19388 }, { "epoch": 0.37, "learning_rate": 3.6615998216487517e-06, "loss": 0.8098, "step": 19389 }, { "epoch": 0.37, "learning_rate": 3.6614645456440682e-06, "loss": 0.9175, "step": 19390 }, { "epoch": 0.37, "learning_rate": 3.661329265302511e-06, "loss": 0.8266, "step": 19391 }, { "epoch": 0.37, "learning_rate": 3.661193980624587e-06, "loss": 0.8187, "step": 19392 }, { "epoch": 0.37, "learning_rate": 3.6610586916107994e-06, "loss": 1.0065, "step": 19393 }, { "epoch": 0.37, "learning_rate": 3.6609233982616543e-06, "loss": 1.027, "step": 19394 }, { "epoch": 0.37, "learning_rate": 3.6607881005776568e-06, "loss": 0.9653, "step": 19395 }, { "epoch": 0.37, "learning_rate": 3.660652798559312e-06, "loss": 0.8554, "step": 19396 }, { "epoch": 0.37, "learning_rate": 3.6605174922071257e-06, "loss": 0.9589, "step": 19397 }, { "epoch": 0.37, "learning_rate": 3.6603821815216022e-06, "loss": 0.8766, "step": 19398 }, { "epoch": 0.37, "learning_rate": 3.6602468665032478e-06, "loss": 1.1227, "step": 19399 }, { "epoch": 0.37, "learning_rate": 3.6601115471525667e-06, "loss": 1.0953, "step": 19400 }, { "epoch": 0.37, "learning_rate": 3.6599762234700647e-06, "loss": 0.7883, "step": 19401 }, { "epoch": 0.37, "learning_rate": 3.659840895456247e-06, "loss": 0.9154, "step": 19402 }, { "epoch": 0.37, "learning_rate": 3.659705563111619e-06, "loss": 0.9445, "step": 19403 }, { "epoch": 0.37, "learning_rate": 3.659570226436686e-06, "loss": 0.8627, "step": 19404 }, { "epoch": 0.37, "learning_rate": 3.659434885431954e-06, "loss": 1.1335, "step": 19405 }, { "epoch": 0.37, "learning_rate": 3.6592995400979266e-06, "loss": 1.0114, "step": 19406 }, { "epoch": 0.37, "learning_rate": 3.6591641904351106e-06, "loss": 1.0174, "step": 19407 }, { "epoch": 0.37, "learning_rate": 3.6590288364440117e-06, "loss": 0.879, "step": 19408 }, { "epoch": 0.37, "learning_rate": 3.658893478125134e-06, "loss": 0.9109, "step": 19409 }, { "epoch": 0.37, "learning_rate": 3.658758115478984e-06, "loss": 0.8284, "step": 19410 }, { "epoch": 0.37, "learning_rate": 3.658622748506066e-06, "loss": 0.9261, "step": 19411 }, { "epoch": 0.37, "learning_rate": 3.658487377206886e-06, "loss": 1.0853, "step": 19412 }, { "epoch": 0.37, "learning_rate": 3.6583520015819513e-06, "loss": 0.9805, "step": 19413 }, { "epoch": 0.37, "learning_rate": 3.658216621631764e-06, "loss": 0.9081, "step": 19414 }, { "epoch": 0.37, "learning_rate": 3.6580812373568323e-06, "loss": 1.0547, "step": 19415 }, { "epoch": 0.37, "learning_rate": 3.6579458487576604e-06, "loss": 0.8705, "step": 19416 }, { "epoch": 0.37, "learning_rate": 3.6578104558347542e-06, "loss": 0.8593, "step": 19417 }, { "epoch": 0.37, "learning_rate": 3.6576750585886194e-06, "loss": 1.0399, "step": 19418 }, { "epoch": 0.37, "learning_rate": 3.657539657019762e-06, "loss": 1.059, "step": 19419 }, { "epoch": 0.37, "learning_rate": 3.657404251128686e-06, "loss": 0.9, "step": 19420 }, { "epoch": 0.37, "learning_rate": 3.6572688409158986e-06, "loss": 0.7737, "step": 19421 }, { "epoch": 0.37, "learning_rate": 3.6571334263819047e-06, "loss": 1.0306, "step": 19422 }, { "epoch": 0.37, "learning_rate": 3.6569980075272098e-06, "loss": 1.0429, "step": 19423 }, { "epoch": 0.37, "learning_rate": 3.65686258435232e-06, "loss": 1.0096, "step": 19424 }, { "epoch": 0.37, "learning_rate": 3.656727156857741e-06, "loss": 0.914, "step": 19425 }, { "epoch": 0.37, "learning_rate": 3.656591725043978e-06, "loss": 0.8888, "step": 19426 }, { "epoch": 0.37, "learning_rate": 3.6564562889115374e-06, "loss": 0.9514, "step": 19427 }, { "epoch": 0.37, "learning_rate": 3.6563208484609243e-06, "loss": 0.9708, "step": 19428 }, { "epoch": 0.37, "learning_rate": 3.656185403692644e-06, "loss": 0.9174, "step": 19429 }, { "epoch": 0.37, "learning_rate": 3.6560499546072036e-06, "loss": 0.7973, "step": 19430 }, { "epoch": 0.37, "learning_rate": 3.6559145012051078e-06, "loss": 0.9803, "step": 19431 }, { "epoch": 0.37, "learning_rate": 3.6557790434868624e-06, "loss": 0.9707, "step": 19432 }, { "epoch": 0.37, "learning_rate": 3.6556435814529735e-06, "loss": 1.0425, "step": 19433 }, { "epoch": 0.37, "learning_rate": 3.6555081151039478e-06, "loss": 1.0579, "step": 19434 }, { "epoch": 0.37, "learning_rate": 3.6553726444402895e-06, "loss": 0.933, "step": 19435 }, { "epoch": 0.37, "learning_rate": 3.6552371694625056e-06, "loss": 1.0537, "step": 19436 }, { "epoch": 0.37, "learning_rate": 3.6551016901711006e-06, "loss": 1.0051, "step": 19437 }, { "epoch": 0.37, "learning_rate": 3.6549662065665818e-06, "loss": 0.8272, "step": 19438 }, { "epoch": 0.37, "learning_rate": 3.654830718649455e-06, "loss": 1.075, "step": 19439 }, { "epoch": 0.37, "learning_rate": 3.6546952264202255e-06, "loss": 0.9052, "step": 19440 }, { "epoch": 0.37, "learning_rate": 3.6545597298793994e-06, "loss": 0.9604, "step": 19441 }, { "epoch": 0.37, "learning_rate": 3.6544242290274822e-06, "loss": 0.8542, "step": 19442 }, { "epoch": 0.37, "learning_rate": 3.6542887238649817e-06, "loss": 1.2052, "step": 19443 }, { "epoch": 0.37, "learning_rate": 3.6541532143924007e-06, "loss": 1.0911, "step": 19444 }, { "epoch": 0.37, "learning_rate": 3.6540177006102473e-06, "loss": 0.8625, "step": 19445 }, { "epoch": 0.37, "learning_rate": 3.6538821825190286e-06, "loss": 0.9744, "step": 19446 }, { "epoch": 0.37, "learning_rate": 3.653746660119248e-06, "loss": 0.7886, "step": 19447 }, { "epoch": 0.37, "learning_rate": 3.6536111334114133e-06, "loss": 0.8648, "step": 19448 }, { "epoch": 0.37, "learning_rate": 3.65347560239603e-06, "loss": 0.9883, "step": 19449 }, { "epoch": 0.37, "learning_rate": 3.6533400670736034e-06, "loss": 1.1343, "step": 19450 }, { "epoch": 0.37, "learning_rate": 3.653204527444641e-06, "loss": 1.0603, "step": 19451 }, { "epoch": 0.37, "learning_rate": 3.653068983509648e-06, "loss": 0.8464, "step": 19452 }, { "epoch": 0.37, "learning_rate": 3.652933435269131e-06, "loss": 1.0068, "step": 19453 }, { "epoch": 0.37, "learning_rate": 3.6527978827235954e-06, "loss": 0.858, "step": 19454 }, { "epoch": 0.37, "learning_rate": 3.6526623258735487e-06, "loss": 0.7495, "step": 19455 }, { "epoch": 0.37, "learning_rate": 3.6525267647194963e-06, "loss": 0.9343, "step": 19456 }, { "epoch": 0.37, "learning_rate": 3.652391199261943e-06, "loss": 0.9241, "step": 19457 }, { "epoch": 0.37, "learning_rate": 3.6522556295013974e-06, "loss": 0.8522, "step": 19458 }, { "epoch": 0.37, "learning_rate": 3.652120055438364e-06, "loss": 0.8087, "step": 19459 }, { "epoch": 0.37, "learning_rate": 3.65198447707335e-06, "loss": 1.0094, "step": 19460 }, { "epoch": 0.37, "learning_rate": 3.6518488944068613e-06, "loss": 0.9962, "step": 19461 }, { "epoch": 0.37, "learning_rate": 3.651713307439404e-06, "loss": 0.9879, "step": 19462 }, { "epoch": 0.37, "learning_rate": 3.6515777161714843e-06, "loss": 0.9133, "step": 19463 }, { "epoch": 0.37, "learning_rate": 3.65144212060361e-06, "loss": 1.0074, "step": 19464 }, { "epoch": 0.37, "learning_rate": 3.6513065207362843e-06, "loss": 0.8446, "step": 19465 }, { "epoch": 0.37, "learning_rate": 3.651170916570016e-06, "loss": 0.7747, "step": 19466 }, { "epoch": 0.37, "learning_rate": 3.6510353081053112e-06, "loss": 1.0103, "step": 19467 }, { "epoch": 0.37, "learning_rate": 3.6508996953426756e-06, "loss": 0.8692, "step": 19468 }, { "epoch": 0.37, "learning_rate": 3.650764078282616e-06, "loss": 1.0266, "step": 19469 }, { "epoch": 0.37, "learning_rate": 3.6506284569256386e-06, "loss": 0.7898, "step": 19470 }, { "epoch": 0.37, "learning_rate": 3.6504928312722495e-06, "loss": 1.0403, "step": 19471 }, { "epoch": 0.37, "learning_rate": 3.6503572013229553e-06, "loss": 0.6864, "step": 19472 }, { "epoch": 0.37, "learning_rate": 3.6502215670782627e-06, "loss": 0.7714, "step": 19473 }, { "epoch": 0.37, "learning_rate": 3.650085928538678e-06, "loss": 1.1006, "step": 19474 }, { "epoch": 0.37, "learning_rate": 3.6499502857047083e-06, "loss": 1.1268, "step": 19475 }, { "epoch": 0.37, "learning_rate": 3.6498146385768596e-06, "loss": 0.8962, "step": 19476 }, { "epoch": 0.37, "learning_rate": 3.6496789871556377e-06, "loss": 0.942, "step": 19477 }, { "epoch": 0.37, "learning_rate": 3.6495433314415495e-06, "loss": 0.8292, "step": 19478 }, { "epoch": 0.37, "learning_rate": 3.6494076714351023e-06, "loss": 0.9898, "step": 19479 }, { "epoch": 0.37, "learning_rate": 3.6492720071368015e-06, "loss": 1.0101, "step": 19480 }, { "epoch": 0.37, "learning_rate": 3.6491363385471547e-06, "loss": 1.2605, "step": 19481 }, { "epoch": 0.37, "learning_rate": 3.649000665666668e-06, "loss": 0.9501, "step": 19482 }, { "epoch": 0.37, "learning_rate": 3.6488649884958484e-06, "loss": 0.9723, "step": 19483 }, { "epoch": 0.37, "learning_rate": 3.6487293070352014e-06, "loss": 0.7623, "step": 19484 }, { "epoch": 0.37, "learning_rate": 3.648593621285235e-06, "loss": 0.8807, "step": 19485 }, { "epoch": 0.37, "learning_rate": 3.6484579312464547e-06, "loss": 0.7913, "step": 19486 }, { "epoch": 0.37, "learning_rate": 3.6483222369193675e-06, "loss": 0.956, "step": 19487 }, { "epoch": 0.37, "learning_rate": 3.6481865383044814e-06, "loss": 1.1238, "step": 19488 }, { "epoch": 0.37, "learning_rate": 3.6480508354023016e-06, "loss": 0.9147, "step": 19489 }, { "epoch": 0.37, "learning_rate": 3.6479151282133346e-06, "loss": 0.9911, "step": 19490 }, { "epoch": 0.37, "learning_rate": 3.647779416738088e-06, "loss": 1.0243, "step": 19491 }, { "epoch": 0.37, "learning_rate": 3.6476437009770683e-06, "loss": 0.8407, "step": 19492 }, { "epoch": 0.37, "learning_rate": 3.6475079809307824e-06, "loss": 1.2961, "step": 19493 }, { "epoch": 0.37, "learning_rate": 3.6473722565997368e-06, "loss": 1.1925, "step": 19494 }, { "epoch": 0.37, "learning_rate": 3.647236527984438e-06, "loss": 1.0303, "step": 19495 }, { "epoch": 0.37, "learning_rate": 3.647100795085393e-06, "loss": 0.8798, "step": 19496 }, { "epoch": 0.37, "learning_rate": 3.6469650579031097e-06, "loss": 0.8943, "step": 19497 }, { "epoch": 0.37, "learning_rate": 3.6468293164380935e-06, "loss": 0.7941, "step": 19498 }, { "epoch": 0.37, "learning_rate": 3.646693570690852e-06, "loss": 0.8703, "step": 19499 }, { "epoch": 0.37, "learning_rate": 3.6465578206618913e-06, "loss": 1.182, "step": 19500 }, { "epoch": 0.37, "learning_rate": 3.646422066351719e-06, "loss": 1.1049, "step": 19501 }, { "epoch": 0.37, "learning_rate": 3.6462863077608424e-06, "loss": 1.0035, "step": 19502 }, { "epoch": 0.37, "learning_rate": 3.6461505448897675e-06, "loss": 1.005, "step": 19503 }, { "epoch": 0.37, "learning_rate": 3.646014777739002e-06, "loss": 0.7722, "step": 19504 }, { "epoch": 0.37, "learning_rate": 3.6458790063090522e-06, "loss": 0.8298, "step": 19505 }, { "epoch": 0.37, "learning_rate": 3.6457432306004252e-06, "loss": 0.9876, "step": 19506 }, { "epoch": 0.37, "learning_rate": 3.645607450613628e-06, "loss": 0.8592, "step": 19507 }, { "epoch": 0.37, "learning_rate": 3.6454716663491677e-06, "loss": 0.8149, "step": 19508 }, { "epoch": 0.37, "learning_rate": 3.645335877807552e-06, "loss": 0.8621, "step": 19509 }, { "epoch": 0.37, "learning_rate": 3.6452000849892868e-06, "loss": 0.8644, "step": 19510 }, { "epoch": 0.37, "learning_rate": 3.6450642878948795e-06, "loss": 1.0785, "step": 19511 }, { "epoch": 0.37, "learning_rate": 3.6449284865248375e-06, "loss": 1.2641, "step": 19512 }, { "epoch": 0.37, "learning_rate": 3.6447926808796674e-06, "loss": 1.0386, "step": 19513 }, { "epoch": 0.37, "learning_rate": 3.644656870959876e-06, "loss": 0.8369, "step": 19514 }, { "epoch": 0.37, "learning_rate": 3.6445210567659716e-06, "loss": 0.9835, "step": 19515 }, { "epoch": 0.37, "learning_rate": 3.6443852382984608e-06, "loss": 0.8552, "step": 19516 }, { "epoch": 0.37, "learning_rate": 3.64424941555785e-06, "loss": 0.6861, "step": 19517 }, { "epoch": 0.37, "learning_rate": 3.6441135885446483e-06, "loss": 1.1456, "step": 19518 }, { "epoch": 0.37, "learning_rate": 3.6439777572593605e-06, "loss": 1.0421, "step": 19519 }, { "epoch": 0.37, "learning_rate": 3.6438419217024945e-06, "loss": 0.6878, "step": 19520 }, { "epoch": 0.37, "learning_rate": 3.6437060818745584e-06, "loss": 0.986, "step": 19521 }, { "epoch": 0.37, "learning_rate": 3.6435702377760584e-06, "loss": 1.0236, "step": 19522 }, { "epoch": 0.37, "learning_rate": 3.6434343894075023e-06, "loss": 0.8004, "step": 19523 }, { "epoch": 0.37, "learning_rate": 3.643298536769398e-06, "loss": 0.9998, "step": 19524 }, { "epoch": 0.37, "learning_rate": 3.6431626798622515e-06, "loss": 1.1837, "step": 19525 }, { "epoch": 0.37, "learning_rate": 3.6430268186865704e-06, "loss": 1.1115, "step": 19526 }, { "epoch": 0.37, "learning_rate": 3.642890953242863e-06, "loss": 1.0427, "step": 19527 }, { "epoch": 0.37, "learning_rate": 3.6427550835316346e-06, "loss": 1.0616, "step": 19528 }, { "epoch": 0.37, "learning_rate": 3.6426192095533948e-06, "loss": 0.7735, "step": 19529 }, { "epoch": 0.37, "learning_rate": 3.6424833313086495e-06, "loss": 0.8715, "step": 19530 }, { "epoch": 0.37, "learning_rate": 3.642347448797906e-06, "loss": 1.0042, "step": 19531 }, { "epoch": 0.37, "learning_rate": 3.642211562021673e-06, "loss": 0.7467, "step": 19532 }, { "epoch": 0.37, "learning_rate": 3.6420756709804566e-06, "loss": 0.8524, "step": 19533 }, { "epoch": 0.37, "learning_rate": 3.641939775674765e-06, "loss": 0.8583, "step": 19534 }, { "epoch": 0.37, "learning_rate": 3.6418038761051046e-06, "loss": 0.8049, "step": 19535 }, { "epoch": 0.37, "learning_rate": 3.641667972271984e-06, "loss": 0.9205, "step": 19536 }, { "epoch": 0.37, "learning_rate": 3.64153206417591e-06, "loss": 0.9171, "step": 19537 }, { "epoch": 0.37, "learning_rate": 3.6413961518173907e-06, "loss": 1.1223, "step": 19538 }, { "epoch": 0.37, "learning_rate": 3.6412602351969327e-06, "loss": 0.8106, "step": 19539 }, { "epoch": 0.37, "learning_rate": 3.6411243143150442e-06, "loss": 1.1131, "step": 19540 }, { "epoch": 0.37, "learning_rate": 3.640988389172232e-06, "loss": 0.8901, "step": 19541 }, { "epoch": 0.37, "learning_rate": 3.640852459769005e-06, "loss": 0.7988, "step": 19542 }, { "epoch": 0.37, "learning_rate": 3.640716526105869e-06, "loss": 1.2012, "step": 19543 }, { "epoch": 0.37, "learning_rate": 3.6405805881833333e-06, "loss": 1.0605, "step": 19544 }, { "epoch": 0.37, "learning_rate": 3.6404446460019044e-06, "loss": 0.8833, "step": 19545 }, { "epoch": 0.37, "learning_rate": 3.6403086995620902e-06, "loss": 0.9607, "step": 19546 }, { "epoch": 0.37, "learning_rate": 3.6401727488643985e-06, "loss": 0.9835, "step": 19547 }, { "epoch": 0.37, "learning_rate": 3.6400367939093363e-06, "loss": 0.7876, "step": 19548 }, { "epoch": 0.37, "learning_rate": 3.639900834697411e-06, "loss": 0.8807, "step": 19549 }, { "epoch": 0.37, "learning_rate": 3.6397648712291317e-06, "loss": 1.17, "step": 19550 }, { "epoch": 0.37, "learning_rate": 3.6396289035050055e-06, "loss": 1.0658, "step": 19551 }, { "epoch": 0.37, "learning_rate": 3.6394929315255394e-06, "loss": 1.0832, "step": 19552 }, { "epoch": 0.37, "learning_rate": 3.639356955291242e-06, "loss": 0.8743, "step": 19553 }, { "epoch": 0.37, "learning_rate": 3.6392209748026208e-06, "loss": 0.9288, "step": 19554 }, { "epoch": 0.37, "learning_rate": 3.6390849900601834e-06, "loss": 0.8265, "step": 19555 }, { "epoch": 0.37, "learning_rate": 3.638949001064437e-06, "loss": 1.0011, "step": 19556 }, { "epoch": 0.37, "learning_rate": 3.63881300781589e-06, "loss": 1.147, "step": 19557 }, { "epoch": 0.37, "learning_rate": 3.6386770103150503e-06, "loss": 0.7889, "step": 19558 }, { "epoch": 0.37, "learning_rate": 3.638541008562426e-06, "loss": 0.9684, "step": 19559 }, { "epoch": 0.37, "learning_rate": 3.6384050025585245e-06, "loss": 0.9986, "step": 19560 }, { "epoch": 0.37, "learning_rate": 3.6382689923038533e-06, "loss": 0.9818, "step": 19561 }, { "epoch": 0.37, "learning_rate": 3.6381329777989207e-06, "loss": 0.862, "step": 19562 }, { "epoch": 0.37, "learning_rate": 3.6379969590442336e-06, "loss": 1.1281, "step": 19563 }, { "epoch": 0.37, "learning_rate": 3.6378609360403015e-06, "loss": 0.858, "step": 19564 }, { "epoch": 0.37, "learning_rate": 3.637724908787632e-06, "loss": 1.0144, "step": 19565 }, { "epoch": 0.37, "learning_rate": 3.6375888772867324e-06, "loss": 0.8799, "step": 19566 }, { "epoch": 0.37, "learning_rate": 3.6374528415381105e-06, "loss": 0.7744, "step": 19567 }, { "epoch": 0.37, "learning_rate": 3.6373168015422745e-06, "loss": 1.1044, "step": 19568 }, { "epoch": 0.37, "learning_rate": 3.6371807572997324e-06, "loss": 1.0472, "step": 19569 }, { "epoch": 0.37, "learning_rate": 3.6370447088109917e-06, "loss": 1.0536, "step": 19570 }, { "epoch": 0.37, "learning_rate": 3.636908656076562e-06, "loss": 0.9977, "step": 19571 }, { "epoch": 0.37, "learning_rate": 3.63677259909695e-06, "loss": 0.9391, "step": 19572 }, { "epoch": 0.37, "learning_rate": 3.6366365378726637e-06, "loss": 0.8702, "step": 19573 }, { "epoch": 0.37, "learning_rate": 3.636500472404212e-06, "loss": 1.1508, "step": 19574 }, { "epoch": 0.37, "learning_rate": 3.636364402692102e-06, "loss": 1.0123, "step": 19575 }, { "epoch": 0.37, "learning_rate": 3.6362283287368414e-06, "loss": 1.034, "step": 19576 }, { "epoch": 0.37, "learning_rate": 3.6360922505389394e-06, "loss": 0.9738, "step": 19577 }, { "epoch": 0.37, "learning_rate": 3.635956168098904e-06, "loss": 0.9935, "step": 19578 }, { "epoch": 0.37, "learning_rate": 3.6358200814172432e-06, "loss": 0.9509, "step": 19579 }, { "epoch": 0.37, "learning_rate": 3.6356839904944656e-06, "loss": 1.0283, "step": 19580 }, { "epoch": 0.37, "learning_rate": 3.635547895331078e-06, "loss": 1.028, "step": 19581 }, { "epoch": 0.37, "learning_rate": 3.6354117959275897e-06, "loss": 0.9758, "step": 19582 }, { "epoch": 0.37, "learning_rate": 3.6352756922845083e-06, "loss": 0.9158, "step": 19583 }, { "epoch": 0.37, "learning_rate": 3.6351395844023425e-06, "loss": 0.7733, "step": 19584 }, { "epoch": 0.37, "learning_rate": 3.6350034722815997e-06, "loss": 1.1018, "step": 19585 }, { "epoch": 0.37, "learning_rate": 3.63486735592279e-06, "loss": 0.8355, "step": 19586 }, { "epoch": 0.37, "learning_rate": 3.63473123532642e-06, "loss": 1.094, "step": 19587 }, { "epoch": 0.37, "learning_rate": 3.634595110492998e-06, "loss": 0.8136, "step": 19588 }, { "epoch": 0.37, "learning_rate": 3.6344589814230322e-06, "loss": 0.9236, "step": 19589 }, { "epoch": 0.37, "learning_rate": 3.6343228481170324e-06, "loss": 1.053, "step": 19590 }, { "epoch": 0.37, "learning_rate": 3.634186710575504e-06, "loss": 0.9865, "step": 19591 }, { "epoch": 0.37, "learning_rate": 3.634050568798959e-06, "loss": 0.8241, "step": 19592 }, { "epoch": 0.37, "learning_rate": 3.633914422787903e-06, "loss": 1.0809, "step": 19593 }, { "epoch": 0.37, "learning_rate": 3.6337782725428463e-06, "loss": 0.9166, "step": 19594 }, { "epoch": 0.37, "learning_rate": 3.6336421180642957e-06, "loss": 0.9118, "step": 19595 }, { "epoch": 0.37, "learning_rate": 3.63350595935276e-06, "loss": 0.7304, "step": 19596 }, { "epoch": 0.37, "learning_rate": 3.633369796408748e-06, "loss": 0.9807, "step": 19597 }, { "epoch": 0.37, "learning_rate": 3.633233629232768e-06, "loss": 0.8636, "step": 19598 }, { "epoch": 0.37, "learning_rate": 3.633097457825328e-06, "loss": 1.1559, "step": 19599 }, { "epoch": 0.37, "learning_rate": 3.632961282186937e-06, "loss": 1.1666, "step": 19600 }, { "epoch": 0.37, "learning_rate": 3.6328251023181036e-06, "loss": 1.0137, "step": 19601 }, { "epoch": 0.37, "learning_rate": 3.632688918219336e-06, "loss": 1.0377, "step": 19602 }, { "epoch": 0.37, "learning_rate": 3.6325527298911427e-06, "loss": 0.987, "step": 19603 }, { "epoch": 0.37, "learning_rate": 3.632416537334032e-06, "loss": 0.8398, "step": 19604 }, { "epoch": 0.37, "learning_rate": 3.6322803405485125e-06, "loss": 0.841, "step": 19605 }, { "epoch": 0.37, "learning_rate": 3.632144139535093e-06, "loss": 1.0214, "step": 19606 }, { "epoch": 0.37, "learning_rate": 3.632007934294283e-06, "loss": 0.8677, "step": 19607 }, { "epoch": 0.37, "learning_rate": 3.6318717248265888e-06, "loss": 1.0107, "step": 19608 }, { "epoch": 0.37, "learning_rate": 3.631735511132521e-06, "loss": 0.9551, "step": 19609 }, { "epoch": 0.37, "learning_rate": 3.6315992932125874e-06, "loss": 0.8277, "step": 19610 }, { "epoch": 0.37, "learning_rate": 3.6314630710672966e-06, "loss": 1.0428, "step": 19611 }, { "epoch": 0.37, "learning_rate": 3.6313268446971566e-06, "loss": 1.1152, "step": 19612 }, { "epoch": 0.37, "learning_rate": 3.6311906141026783e-06, "loss": 1.0243, "step": 19613 }, { "epoch": 0.37, "learning_rate": 3.6310543792843677e-06, "loss": 0.9268, "step": 19614 }, { "epoch": 0.37, "learning_rate": 3.630918140242735e-06, "loss": 0.9694, "step": 19615 }, { "epoch": 0.37, "learning_rate": 3.63078189697829e-06, "loss": 0.9115, "step": 19616 }, { "epoch": 0.37, "learning_rate": 3.6306456494915386e-06, "loss": 0.9784, "step": 19617 }, { "epoch": 0.37, "learning_rate": 3.6305093977829912e-06, "loss": 1.1559, "step": 19618 }, { "epoch": 0.37, "learning_rate": 3.6303731418531564e-06, "loss": 1.0158, "step": 19619 }, { "epoch": 0.37, "learning_rate": 3.630236881702543e-06, "loss": 0.9028, "step": 19620 }, { "epoch": 0.37, "learning_rate": 3.6301006173316598e-06, "loss": 0.8446, "step": 19621 }, { "epoch": 0.37, "learning_rate": 3.6299643487410164e-06, "loss": 0.8775, "step": 19622 }, { "epoch": 0.37, "learning_rate": 3.6298280759311194e-06, "loss": 0.9328, "step": 19623 }, { "epoch": 0.37, "learning_rate": 3.6296917989024796e-06, "loss": 0.8714, "step": 19624 }, { "epoch": 0.37, "learning_rate": 3.629555517655605e-06, "loss": 1.0074, "step": 19625 }, { "epoch": 0.37, "learning_rate": 3.629419232191005e-06, "loss": 0.894, "step": 19626 }, { "epoch": 0.37, "learning_rate": 3.629282942509188e-06, "loss": 0.8886, "step": 19627 }, { "epoch": 0.37, "learning_rate": 3.6291466486106637e-06, "loss": 0.8647, "step": 19628 }, { "epoch": 0.37, "learning_rate": 3.6290103504959403e-06, "loss": 0.8704, "step": 19629 }, { "epoch": 0.37, "learning_rate": 3.628874048165526e-06, "loss": 0.8399, "step": 19630 }, { "epoch": 0.37, "learning_rate": 3.6287377416199316e-06, "loss": 0.8874, "step": 19631 }, { "epoch": 0.37, "learning_rate": 3.6286014308596645e-06, "loss": 1.1753, "step": 19632 }, { "epoch": 0.37, "learning_rate": 3.628465115885234e-06, "loss": 0.804, "step": 19633 }, { "epoch": 0.37, "learning_rate": 3.6283287966971504e-06, "loss": 0.6961, "step": 19634 }, { "epoch": 0.37, "learning_rate": 3.6281924732959207e-06, "loss": 0.8715, "step": 19635 }, { "epoch": 0.37, "learning_rate": 3.628056145682055e-06, "loss": 0.89, "step": 19636 }, { "epoch": 0.37, "learning_rate": 3.6279198138560634e-06, "loss": 1.0101, "step": 19637 }, { "epoch": 0.37, "learning_rate": 3.6277834778184527e-06, "loss": 0.9709, "step": 19638 }, { "epoch": 0.37, "learning_rate": 3.627647137569733e-06, "loss": 0.9849, "step": 19639 }, { "epoch": 0.37, "learning_rate": 3.627510793110414e-06, "loss": 1.0047, "step": 19640 }, { "epoch": 0.37, "learning_rate": 3.6273744444410037e-06, "loss": 0.784, "step": 19641 }, { "epoch": 0.37, "learning_rate": 3.627238091562012e-06, "loss": 0.9611, "step": 19642 }, { "epoch": 0.37, "learning_rate": 3.6271017344739485e-06, "loss": 0.9676, "step": 19643 }, { "epoch": 0.37, "learning_rate": 3.6269653731773207e-06, "loss": 1.0873, "step": 19644 }, { "epoch": 0.37, "learning_rate": 3.62682900767264e-06, "loss": 0.9462, "step": 19645 }, { "epoch": 0.37, "learning_rate": 3.6266926379604123e-06, "loss": 0.787, "step": 19646 }, { "epoch": 0.37, "learning_rate": 3.62655626404115e-06, "loss": 0.9034, "step": 19647 }, { "epoch": 0.37, "learning_rate": 3.6264198859153616e-06, "loss": 0.9449, "step": 19648 }, { "epoch": 0.37, "learning_rate": 3.626283503583555e-06, "loss": 1.0328, "step": 19649 }, { "epoch": 0.37, "learning_rate": 3.6261471170462412e-06, "loss": 0.8197, "step": 19650 }, { "epoch": 0.37, "learning_rate": 3.6260107263039284e-06, "loss": 0.992, "step": 19651 }, { "epoch": 0.37, "learning_rate": 3.625874331357126e-06, "loss": 0.925, "step": 19652 }, { "epoch": 0.37, "learning_rate": 3.6257379322063425e-06, "loss": 1.0944, "step": 19653 }, { "epoch": 0.37, "learning_rate": 3.625601528852089e-06, "loss": 0.8705, "step": 19654 }, { "epoch": 0.37, "learning_rate": 3.6254651212948736e-06, "loss": 0.7181, "step": 19655 }, { "epoch": 0.37, "learning_rate": 3.6253287095352063e-06, "loss": 1.1811, "step": 19656 }, { "epoch": 0.37, "learning_rate": 3.6251922935735962e-06, "loss": 1.0191, "step": 19657 }, { "epoch": 0.37, "learning_rate": 3.6250558734105524e-06, "loss": 0.8202, "step": 19658 }, { "epoch": 0.37, "learning_rate": 3.624919449046584e-06, "loss": 0.9982, "step": 19659 }, { "epoch": 0.37, "learning_rate": 3.624783020482201e-06, "loss": 0.8795, "step": 19660 }, { "epoch": 0.37, "learning_rate": 3.6246465877179126e-06, "loss": 0.8376, "step": 19661 }, { "epoch": 0.37, "learning_rate": 3.6245101507542286e-06, "loss": 1.0012, "step": 19662 }, { "epoch": 0.37, "learning_rate": 3.6243737095916587e-06, "loss": 1.2303, "step": 19663 }, { "epoch": 0.37, "learning_rate": 3.624237264230711e-06, "loss": 0.8768, "step": 19664 }, { "epoch": 0.37, "learning_rate": 3.6241008146718957e-06, "loss": 0.6962, "step": 19665 }, { "epoch": 0.37, "learning_rate": 3.6239643609157225e-06, "loss": 1.0389, "step": 19666 }, { "epoch": 0.37, "learning_rate": 3.6238279029627018e-06, "loss": 0.777, "step": 19667 }, { "epoch": 0.37, "learning_rate": 3.623691440813341e-06, "loss": 1.0767, "step": 19668 }, { "epoch": 0.37, "learning_rate": 3.623554974468152e-06, "loss": 1.0353, "step": 19669 }, { "epoch": 0.37, "learning_rate": 3.6234185039276427e-06, "loss": 0.8353, "step": 19670 }, { "epoch": 0.37, "learning_rate": 3.6232820291923227e-06, "loss": 1.0514, "step": 19671 }, { "epoch": 0.37, "learning_rate": 3.623145550262702e-06, "loss": 0.9, "step": 19672 }, { "epoch": 0.37, "learning_rate": 3.623009067139291e-06, "loss": 0.9739, "step": 19673 }, { "epoch": 0.37, "learning_rate": 3.622872579822597e-06, "loss": 1.0067, "step": 19674 }, { "epoch": 0.37, "learning_rate": 3.6227360883131334e-06, "loss": 1.075, "step": 19675 }, { "epoch": 0.37, "learning_rate": 3.6225995926114066e-06, "loss": 0.964, "step": 19676 }, { "epoch": 0.37, "learning_rate": 3.6224630927179273e-06, "loss": 0.9155, "step": 19677 }, { "epoch": 0.37, "learning_rate": 3.6223265886332053e-06, "loss": 0.8589, "step": 19678 }, { "epoch": 0.37, "learning_rate": 3.62219008035775e-06, "loss": 0.9005, "step": 19679 }, { "epoch": 0.37, "learning_rate": 3.622053567892072e-06, "loss": 1.0198, "step": 19680 }, { "epoch": 0.37, "learning_rate": 3.6219170512366798e-06, "loss": 1.1017, "step": 19681 }, { "epoch": 0.37, "learning_rate": 3.621780530392084e-06, "loss": 0.8404, "step": 19682 }, { "epoch": 0.37, "learning_rate": 3.621644005358794e-06, "loss": 0.8144, "step": 19683 }, { "epoch": 0.37, "learning_rate": 3.6215074761373193e-06, "loss": 1.0479, "step": 19684 }, { "epoch": 0.37, "learning_rate": 3.6213709427281705e-06, "loss": 0.8287, "step": 19685 }, { "epoch": 0.37, "learning_rate": 3.621234405131857e-06, "loss": 0.866, "step": 19686 }, { "epoch": 0.37, "learning_rate": 3.621097863348888e-06, "loss": 1.0527, "step": 19687 }, { "epoch": 0.37, "learning_rate": 3.6209613173797747e-06, "loss": 0.8534, "step": 19688 }, { "epoch": 0.37, "learning_rate": 3.6208247672250256e-06, "loss": 1.0828, "step": 19689 }, { "epoch": 0.37, "learning_rate": 3.6206882128851523e-06, "loss": 0.8293, "step": 19690 }, { "epoch": 0.37, "learning_rate": 3.6205516543606627e-06, "loss": 0.9203, "step": 19691 }, { "epoch": 0.37, "learning_rate": 3.6204150916520675e-06, "loss": 0.8558, "step": 19692 }, { "epoch": 0.37, "learning_rate": 3.620278524759877e-06, "loss": 1.1036, "step": 19693 }, { "epoch": 0.37, "learning_rate": 3.620141953684601e-06, "loss": 1.1083, "step": 19694 }, { "epoch": 0.37, "learning_rate": 3.6200053784267486e-06, "loss": 0.9991, "step": 19695 }, { "epoch": 0.37, "learning_rate": 3.619868798986831e-06, "loss": 0.9844, "step": 19696 }, { "epoch": 0.37, "learning_rate": 3.6197322153653574e-06, "loss": 0.9802, "step": 19697 }, { "epoch": 0.37, "learning_rate": 3.6195956275628385e-06, "loss": 0.9227, "step": 19698 }, { "epoch": 0.37, "learning_rate": 3.619459035579784e-06, "loss": 0.9743, "step": 19699 }, { "epoch": 0.37, "learning_rate": 3.619322439416703e-06, "loss": 0.8671, "step": 19700 }, { "epoch": 0.37, "learning_rate": 3.6191858390741065e-06, "loss": 0.9302, "step": 19701 }, { "epoch": 0.37, "learning_rate": 3.619049234552505e-06, "loss": 0.9055, "step": 19702 }, { "epoch": 0.37, "learning_rate": 3.6189126258524067e-06, "loss": 1.0914, "step": 19703 }, { "epoch": 0.37, "learning_rate": 3.618776012974324e-06, "loss": 0.8884, "step": 19704 }, { "epoch": 0.37, "learning_rate": 3.618639395918766e-06, "loss": 0.9157, "step": 19705 }, { "epoch": 0.37, "learning_rate": 3.6185027746862422e-06, "loss": 0.9536, "step": 19706 }, { "epoch": 0.37, "learning_rate": 3.618366149277264e-06, "loss": 0.8333, "step": 19707 }, { "epoch": 0.37, "learning_rate": 3.61822951969234e-06, "loss": 0.8604, "step": 19708 }, { "epoch": 0.37, "learning_rate": 3.618092885931982e-06, "loss": 1.1395, "step": 19709 }, { "epoch": 0.37, "learning_rate": 3.617956247996699e-06, "loss": 0.7015, "step": 19710 }, { "epoch": 0.37, "learning_rate": 3.6178196058870025e-06, "loss": 1.0139, "step": 19711 }, { "epoch": 0.37, "learning_rate": 3.6176829596034015e-06, "loss": 1.2452, "step": 19712 }, { "epoch": 0.37, "learning_rate": 3.6175463091464057e-06, "loss": 0.9835, "step": 19713 }, { "epoch": 0.37, "learning_rate": 3.617409654516528e-06, "loss": 1.0175, "step": 19714 }, { "epoch": 0.37, "learning_rate": 3.617272995714275e-06, "loss": 1.0337, "step": 19715 }, { "epoch": 0.37, "learning_rate": 3.617136332740159e-06, "loss": 1.0787, "step": 19716 }, { "epoch": 0.37, "learning_rate": 3.6169996655946915e-06, "loss": 1.0707, "step": 19717 }, { "epoch": 0.37, "learning_rate": 3.616862994278381e-06, "loss": 0.7902, "step": 19718 }, { "epoch": 0.37, "learning_rate": 3.6167263187917378e-06, "loss": 1.076, "step": 19719 }, { "epoch": 0.37, "learning_rate": 3.616589639135274e-06, "loss": 1.0502, "step": 19720 }, { "epoch": 0.37, "learning_rate": 3.6164529553094975e-06, "loss": 0.8286, "step": 19721 }, { "epoch": 0.37, "learning_rate": 3.6163162673149203e-06, "loss": 0.9167, "step": 19722 }, { "epoch": 0.37, "learning_rate": 3.6161795751520525e-06, "loss": 0.7699, "step": 19723 }, { "epoch": 0.37, "learning_rate": 3.616042878821404e-06, "loss": 1.0828, "step": 19724 }, { "epoch": 0.37, "learning_rate": 3.6159061783234863e-06, "loss": 1.1804, "step": 19725 }, { "epoch": 0.37, "learning_rate": 3.615769473658809e-06, "loss": 1.1896, "step": 19726 }, { "epoch": 0.37, "learning_rate": 3.615632764827882e-06, "loss": 0.8777, "step": 19727 }, { "epoch": 0.37, "learning_rate": 3.6154960518312164e-06, "loss": 1.0038, "step": 19728 }, { "epoch": 0.37, "learning_rate": 3.615359334669324e-06, "loss": 0.9551, "step": 19729 }, { "epoch": 0.37, "learning_rate": 3.615222613342713e-06, "loss": 0.9183, "step": 19730 }, { "epoch": 0.37, "learning_rate": 3.6150858878518946e-06, "loss": 1.1856, "step": 19731 }, { "epoch": 0.37, "learning_rate": 3.6149491581973813e-06, "loss": 0.925, "step": 19732 }, { "epoch": 0.37, "learning_rate": 3.6148124243796807e-06, "loss": 0.7808, "step": 19733 }, { "epoch": 0.37, "learning_rate": 3.614675686399305e-06, "loss": 0.7852, "step": 19734 }, { "epoch": 0.37, "learning_rate": 3.6145389442567646e-06, "loss": 0.9432, "step": 19735 }, { "epoch": 0.37, "learning_rate": 3.61440219795257e-06, "loss": 0.9764, "step": 19736 }, { "epoch": 0.37, "learning_rate": 3.6142654474872307e-06, "loss": 1.058, "step": 19737 }, { "epoch": 0.37, "learning_rate": 3.6141286928612603e-06, "loss": 1.1743, "step": 19738 }, { "epoch": 0.37, "learning_rate": 3.613991934075166e-06, "loss": 0.9829, "step": 19739 }, { "epoch": 0.37, "learning_rate": 3.6138551711294605e-06, "loss": 0.8583, "step": 19740 }, { "epoch": 0.37, "learning_rate": 3.6137184040246542e-06, "loss": 1.0079, "step": 19741 }, { "epoch": 0.37, "learning_rate": 3.613581632761257e-06, "loss": 0.6618, "step": 19742 }, { "epoch": 0.37, "learning_rate": 3.6134448573397805e-06, "loss": 0.8448, "step": 19743 }, { "epoch": 0.37, "learning_rate": 3.613308077760735e-06, "loss": 1.2804, "step": 19744 }, { "epoch": 0.37, "learning_rate": 3.613171294024631e-06, "loss": 0.987, "step": 19745 }, { "epoch": 0.37, "learning_rate": 3.6130345061319796e-06, "loss": 1.028, "step": 19746 }, { "epoch": 0.37, "learning_rate": 3.6128977140832923e-06, "loss": 0.7603, "step": 19747 }, { "epoch": 0.37, "learning_rate": 3.612760917879078e-06, "loss": 0.9635, "step": 19748 }, { "epoch": 0.37, "learning_rate": 3.612624117519849e-06, "loss": 1.1752, "step": 19749 }, { "epoch": 0.37, "learning_rate": 3.6124873130061158e-06, "loss": 1.1878, "step": 19750 }, { "epoch": 0.37, "learning_rate": 3.6123505043383883e-06, "loss": 1.0416, "step": 19751 }, { "epoch": 0.37, "learning_rate": 3.6122136915171785e-06, "loss": 0.8223, "step": 19752 }, { "epoch": 0.37, "learning_rate": 3.6120768745429975e-06, "loss": 1.0117, "step": 19753 }, { "epoch": 0.37, "learning_rate": 3.6119400534163552e-06, "loss": 0.8872, "step": 19754 }, { "epoch": 0.37, "learning_rate": 3.6118032281377624e-06, "loss": 1.1127, "step": 19755 }, { "epoch": 0.37, "learning_rate": 3.611666398707731e-06, "loss": 0.9866, "step": 19756 }, { "epoch": 0.37, "learning_rate": 3.6115295651267712e-06, "loss": 0.9215, "step": 19757 }, { "epoch": 0.37, "learning_rate": 3.611392727395393e-06, "loss": 0.9315, "step": 19758 }, { "epoch": 0.37, "learning_rate": 3.61125588551411e-06, "loss": 1.0176, "step": 19759 }, { "epoch": 0.37, "learning_rate": 3.611119039483431e-06, "loss": 0.8405, "step": 19760 }, { "epoch": 0.37, "learning_rate": 3.6109821893038683e-06, "loss": 1.0037, "step": 19761 }, { "epoch": 0.37, "learning_rate": 3.6108453349759307e-06, "loss": 1.0144, "step": 19762 }, { "epoch": 0.37, "learning_rate": 3.610708476500132e-06, "loss": 1.1717, "step": 19763 }, { "epoch": 0.37, "learning_rate": 3.6105716138769807e-06, "loss": 1.0115, "step": 19764 }, { "epoch": 0.37, "learning_rate": 3.61043474710699e-06, "loss": 0.9883, "step": 19765 }, { "epoch": 0.37, "learning_rate": 3.61029787619067e-06, "loss": 0.9556, "step": 19766 }, { "epoch": 0.37, "learning_rate": 3.6101610011285314e-06, "loss": 0.757, "step": 19767 }, { "epoch": 0.37, "learning_rate": 3.610024121921086e-06, "loss": 0.9611, "step": 19768 }, { "epoch": 0.37, "learning_rate": 3.6098872385688436e-06, "loss": 0.8939, "step": 19769 }, { "epoch": 0.37, "learning_rate": 3.6097503510723177e-06, "loss": 1.0522, "step": 19770 }, { "epoch": 0.37, "learning_rate": 3.6096134594320164e-06, "loss": 0.8231, "step": 19771 }, { "epoch": 0.37, "learning_rate": 3.6094765636484534e-06, "loss": 0.8979, "step": 19772 }, { "epoch": 0.37, "learning_rate": 3.6093396637221395e-06, "loss": 1.1054, "step": 19773 }, { "epoch": 0.37, "learning_rate": 3.6092027596535847e-06, "loss": 1.1503, "step": 19774 }, { "epoch": 0.37, "learning_rate": 3.609065851443301e-06, "loss": 0.8647, "step": 19775 }, { "epoch": 0.37, "learning_rate": 3.6089289390917992e-06, "loss": 1.0685, "step": 19776 }, { "epoch": 0.37, "learning_rate": 3.608792022599591e-06, "loss": 0.7494, "step": 19777 }, { "epoch": 0.37, "learning_rate": 3.6086551019671866e-06, "loss": 1.075, "step": 19778 }, { "epoch": 0.37, "learning_rate": 3.6085181771950984e-06, "loss": 0.8097, "step": 19779 }, { "epoch": 0.37, "learning_rate": 3.6083812482838376e-06, "loss": 0.9696, "step": 19780 }, { "epoch": 0.37, "learning_rate": 3.6082443152339153e-06, "loss": 0.971, "step": 19781 }, { "epoch": 0.37, "learning_rate": 3.6081073780458424e-06, "loss": 0.9109, "step": 19782 }, { "epoch": 0.37, "learning_rate": 3.607970436720131e-06, "loss": 0.8472, "step": 19783 }, { "epoch": 0.37, "learning_rate": 3.607833491257291e-06, "loss": 0.8058, "step": 19784 }, { "epoch": 0.37, "learning_rate": 3.6076965416578353e-06, "loss": 0.8964, "step": 19785 }, { "epoch": 0.37, "learning_rate": 3.6075595879222745e-06, "loss": 0.8814, "step": 19786 }, { "epoch": 0.37, "learning_rate": 3.6074226300511207e-06, "loss": 1.3643, "step": 19787 }, { "epoch": 0.37, "learning_rate": 3.607285668044884e-06, "loss": 1.0323, "step": 19788 }, { "epoch": 0.37, "learning_rate": 3.6071487019040773e-06, "loss": 0.9719, "step": 19789 }, { "epoch": 0.37, "learning_rate": 3.6070117316292106e-06, "loss": 0.8884, "step": 19790 }, { "epoch": 0.37, "learning_rate": 3.6068747572207973e-06, "loss": 0.6694, "step": 19791 }, { "epoch": 0.37, "learning_rate": 3.6067377786793456e-06, "loss": 0.9954, "step": 19792 }, { "epoch": 0.37, "learning_rate": 3.60660079600537e-06, "loss": 0.9538, "step": 19793 }, { "epoch": 0.37, "learning_rate": 3.6064638091993814e-06, "loss": 0.9849, "step": 19794 }, { "epoch": 0.37, "learning_rate": 3.6063268182618905e-06, "loss": 0.8822, "step": 19795 }, { "epoch": 0.37, "learning_rate": 3.606189823193409e-06, "loss": 0.7811, "step": 19796 }, { "epoch": 0.37, "learning_rate": 3.606052823994449e-06, "loss": 0.9678, "step": 19797 }, { "epoch": 0.37, "learning_rate": 3.6059158206655217e-06, "loss": 0.9695, "step": 19798 }, { "epoch": 0.37, "learning_rate": 3.605778813207138e-06, "loss": 1.1183, "step": 19799 }, { "epoch": 0.37, "learning_rate": 3.60564180161981e-06, "loss": 1.0782, "step": 19800 }, { "epoch": 0.37, "learning_rate": 3.6055047859040505e-06, "loss": 1.104, "step": 19801 }, { "epoch": 0.37, "learning_rate": 3.6053677660603693e-06, "loss": 0.8215, "step": 19802 }, { "epoch": 0.37, "learning_rate": 3.605230742089279e-06, "loss": 1.0608, "step": 19803 }, { "epoch": 0.37, "learning_rate": 3.605093713991291e-06, "loss": 0.971, "step": 19804 }, { "epoch": 0.37, "learning_rate": 3.604956681766917e-06, "loss": 0.9411, "step": 19805 }, { "epoch": 0.37, "learning_rate": 3.604819645416668e-06, "loss": 1.1854, "step": 19806 }, { "epoch": 0.37, "learning_rate": 3.6046826049410565e-06, "loss": 1.147, "step": 19807 }, { "epoch": 0.37, "learning_rate": 3.604545560340594e-06, "loss": 1.0214, "step": 19808 }, { "epoch": 0.37, "learning_rate": 3.6044085116157936e-06, "loss": 0.9193, "step": 19809 }, { "epoch": 0.37, "learning_rate": 3.604271458767164e-06, "loss": 0.8562, "step": 19810 }, { "epoch": 0.37, "learning_rate": 3.6041344017952196e-06, "loss": 0.9967, "step": 19811 }, { "epoch": 0.37, "learning_rate": 3.6039973407004706e-06, "loss": 1.2073, "step": 19812 }, { "epoch": 0.37, "learning_rate": 3.6038602754834296e-06, "loss": 1.2246, "step": 19813 }, { "epoch": 0.37, "learning_rate": 3.603723206144608e-06, "loss": 0.9329, "step": 19814 }, { "epoch": 0.37, "learning_rate": 3.6035861326845184e-06, "loss": 0.8453, "step": 19815 }, { "epoch": 0.37, "learning_rate": 3.6034490551036716e-06, "loss": 0.9925, "step": 19816 }, { "epoch": 0.37, "learning_rate": 3.6033119734025795e-06, "loss": 1.0268, "step": 19817 }, { "epoch": 0.37, "learning_rate": 3.603174887581755e-06, "loss": 1.0201, "step": 19818 }, { "epoch": 0.37, "learning_rate": 3.603037797641709e-06, "loss": 0.8805, "step": 19819 }, { "epoch": 0.37, "learning_rate": 3.6029007035829534e-06, "loss": 0.9521, "step": 19820 }, { "epoch": 0.37, "learning_rate": 3.6027636054060007e-06, "loss": 0.8676, "step": 19821 }, { "epoch": 0.37, "learning_rate": 3.602626503111362e-06, "loss": 0.955, "step": 19822 }, { "epoch": 0.37, "learning_rate": 3.6024893966995504e-06, "loss": 0.8973, "step": 19823 }, { "epoch": 0.37, "learning_rate": 3.6023522861710773e-06, "loss": 1.0098, "step": 19824 }, { "epoch": 0.37, "learning_rate": 3.6022151715264544e-06, "loss": 1.0457, "step": 19825 }, { "epoch": 0.37, "learning_rate": 3.6020780527661936e-06, "loss": 0.9125, "step": 19826 }, { "epoch": 0.37, "learning_rate": 3.601940929890807e-06, "loss": 0.826, "step": 19827 }, { "epoch": 0.37, "learning_rate": 3.601803802900807e-06, "loss": 0.992, "step": 19828 }, { "epoch": 0.37, "learning_rate": 3.6016666717967053e-06, "loss": 0.9059, "step": 19829 }, { "epoch": 0.37, "learning_rate": 3.601529536579014e-06, "loss": 0.9797, "step": 19830 }, { "epoch": 0.37, "learning_rate": 3.6013923972482457e-06, "loss": 1.2185, "step": 19831 }, { "epoch": 0.37, "learning_rate": 3.6012552538049116e-06, "loss": 0.8917, "step": 19832 }, { "epoch": 0.37, "learning_rate": 3.6011181062495244e-06, "loss": 0.8803, "step": 19833 }, { "epoch": 0.37, "learning_rate": 3.600980954582595e-06, "loss": 0.8867, "step": 19834 }, { "epoch": 0.37, "learning_rate": 3.600843798804637e-06, "loss": 0.8494, "step": 19835 }, { "epoch": 0.37, "learning_rate": 3.6007066389161625e-06, "loss": 0.8345, "step": 19836 }, { "epoch": 0.37, "learning_rate": 3.600569474917683e-06, "loss": 1.2388, "step": 19837 }, { "epoch": 0.37, "learning_rate": 3.60043230680971e-06, "loss": 1.2471, "step": 19838 }, { "epoch": 0.37, "learning_rate": 3.600295134592758e-06, "loss": 0.9445, "step": 19839 }, { "epoch": 0.37, "learning_rate": 3.6001579582673363e-06, "loss": 0.9725, "step": 19840 }, { "epoch": 0.37, "learning_rate": 3.600020777833959e-06, "loss": 0.9269, "step": 19841 }, { "epoch": 0.37, "learning_rate": 3.5998835932931375e-06, "loss": 1.0099, "step": 19842 }, { "epoch": 0.37, "learning_rate": 3.599746404645385e-06, "loss": 1.1593, "step": 19843 }, { "epoch": 0.37, "learning_rate": 3.5996092118912128e-06, "loss": 1.0551, "step": 19844 }, { "epoch": 0.37, "learning_rate": 3.5994720150311342e-06, "loss": 0.9391, "step": 19845 }, { "epoch": 0.37, "learning_rate": 3.5993348140656597e-06, "loss": 0.8732, "step": 19846 }, { "epoch": 0.37, "learning_rate": 3.5991976089953035e-06, "loss": 0.8257, "step": 19847 }, { "epoch": 0.37, "learning_rate": 3.5990603998205763e-06, "loss": 0.9571, "step": 19848 }, { "epoch": 0.37, "learning_rate": 3.5989231865419922e-06, "loss": 0.8922, "step": 19849 }, { "epoch": 0.37, "learning_rate": 3.5987859691600625e-06, "loss": 1.2422, "step": 19850 }, { "epoch": 0.37, "learning_rate": 3.5986487476752996e-06, "loss": 0.8801, "step": 19851 }, { "epoch": 0.37, "learning_rate": 3.5985115220882155e-06, "loss": 1.0016, "step": 19852 }, { "epoch": 0.37, "learning_rate": 3.598374292399323e-06, "loss": 0.7196, "step": 19853 }, { "epoch": 0.37, "learning_rate": 3.5982370586091354e-06, "loss": 0.9883, "step": 19854 }, { "epoch": 0.37, "learning_rate": 3.5980998207181633e-06, "loss": 0.7954, "step": 19855 }, { "epoch": 0.37, "learning_rate": 3.597962578726921e-06, "loss": 1.006, "step": 19856 }, { "epoch": 0.37, "learning_rate": 3.59782533263592e-06, "loss": 0.73, "step": 19857 }, { "epoch": 0.37, "learning_rate": 3.5976880824456724e-06, "loss": 0.8242, "step": 19858 }, { "epoch": 0.37, "learning_rate": 3.5975508281566914e-06, "loss": 0.9107, "step": 19859 }, { "epoch": 0.37, "learning_rate": 3.5974135697694897e-06, "loss": 1.0134, "step": 19860 }, { "epoch": 0.37, "learning_rate": 3.5972763072845785e-06, "loss": 0.945, "step": 19861 }, { "epoch": 0.37, "learning_rate": 3.5971390407024715e-06, "loss": 1.0135, "step": 19862 }, { "epoch": 0.37, "learning_rate": 3.597001770023681e-06, "loss": 0.9298, "step": 19863 }, { "epoch": 0.37, "learning_rate": 3.5968644952487197e-06, "loss": 0.7736, "step": 19864 }, { "epoch": 0.37, "learning_rate": 3.5967272163780997e-06, "loss": 0.8878, "step": 19865 }, { "epoch": 0.37, "learning_rate": 3.5965899334123346e-06, "loss": 0.9131, "step": 19866 }, { "epoch": 0.37, "learning_rate": 3.5964526463519356e-06, "loss": 0.7586, "step": 19867 }, { "epoch": 0.37, "learning_rate": 3.596315355197416e-06, "loss": 0.9091, "step": 19868 }, { "epoch": 0.37, "learning_rate": 3.596178059949289e-06, "loss": 1.1324, "step": 19869 }, { "epoch": 0.37, "learning_rate": 3.596040760608066e-06, "loss": 1.1063, "step": 19870 }, { "epoch": 0.37, "learning_rate": 3.5959034571742613e-06, "loss": 0.8946, "step": 19871 }, { "epoch": 0.37, "learning_rate": 3.5957661496483866e-06, "loss": 0.9835, "step": 19872 }, { "epoch": 0.37, "learning_rate": 3.595628838030954e-06, "loss": 0.9915, "step": 19873 }, { "epoch": 0.37, "learning_rate": 3.5954915223224774e-06, "loss": 0.972, "step": 19874 }, { "epoch": 0.37, "learning_rate": 3.595354202523469e-06, "loss": 1.0159, "step": 19875 }, { "epoch": 0.37, "learning_rate": 3.595216878634441e-06, "loss": 1.1363, "step": 19876 }, { "epoch": 0.38, "learning_rate": 3.595079550655907e-06, "loss": 0.8091, "step": 19877 }, { "epoch": 0.38, "learning_rate": 3.59494221858838e-06, "loss": 0.7784, "step": 19878 }, { "epoch": 0.38, "learning_rate": 3.594804882432372e-06, "loss": 0.6746, "step": 19879 }, { "epoch": 0.38, "learning_rate": 3.594667542188397e-06, "loss": 1.0728, "step": 19880 }, { "epoch": 0.38, "learning_rate": 3.5945301978569663e-06, "loss": 0.9577, "step": 19881 }, { "epoch": 0.38, "learning_rate": 3.5943928494385933e-06, "loss": 0.9938, "step": 19882 }, { "epoch": 0.38, "learning_rate": 3.5942554969337907e-06, "loss": 0.8087, "step": 19883 }, { "epoch": 0.38, "learning_rate": 3.594118140343072e-06, "loss": 1.0347, "step": 19884 }, { "epoch": 0.38, "learning_rate": 3.5939807796669496e-06, "loss": 0.9808, "step": 19885 }, { "epoch": 0.38, "learning_rate": 3.5938434149059364e-06, "loss": 1.0825, "step": 19886 }, { "epoch": 0.38, "learning_rate": 3.593706046060546e-06, "loss": 1.166, "step": 19887 }, { "epoch": 0.38, "learning_rate": 3.59356867313129e-06, "loss": 1.0989, "step": 19888 }, { "epoch": 0.38, "learning_rate": 3.5934312961186822e-06, "loss": 1.0314, "step": 19889 }, { "epoch": 0.38, "learning_rate": 3.593293915023236e-06, "loss": 0.859, "step": 19890 }, { "epoch": 0.38, "learning_rate": 3.593156529845463e-06, "loss": 0.7622, "step": 19891 }, { "epoch": 0.38, "learning_rate": 3.5930191405858784e-06, "loss": 1.0085, "step": 19892 }, { "epoch": 0.38, "learning_rate": 3.5928817472449927e-06, "loss": 0.8852, "step": 19893 }, { "epoch": 0.38, "learning_rate": 3.5927443498233204e-06, "loss": 0.9944, "step": 19894 }, { "epoch": 0.38, "learning_rate": 3.5926069483213744e-06, "loss": 1.0891, "step": 19895 }, { "epoch": 0.38, "learning_rate": 3.592469542739667e-06, "loss": 0.9775, "step": 19896 }, { "epoch": 0.38, "learning_rate": 3.592332133078712e-06, "loss": 1.0004, "step": 19897 }, { "epoch": 0.38, "learning_rate": 3.592194719339023e-06, "loss": 0.847, "step": 19898 }, { "epoch": 0.38, "learning_rate": 3.5920573015211115e-06, "loss": 0.7605, "step": 19899 }, { "epoch": 0.38, "learning_rate": 3.5919198796254916e-06, "loss": 1.1509, "step": 19900 }, { "epoch": 0.38, "learning_rate": 3.591782453652677e-06, "loss": 0.9448, "step": 19901 }, { "epoch": 0.38, "learning_rate": 3.5916450236031798e-06, "loss": 0.8968, "step": 19902 }, { "epoch": 0.38, "learning_rate": 3.5915075894775137e-06, "loss": 0.6889, "step": 19903 }, { "epoch": 0.38, "learning_rate": 3.591370151276191e-06, "loss": 0.9516, "step": 19904 }, { "epoch": 0.38, "learning_rate": 3.591232708999727e-06, "loss": 0.9615, "step": 19905 }, { "epoch": 0.38, "learning_rate": 3.591095262648632e-06, "loss": 1.1029, "step": 19906 }, { "epoch": 0.38, "learning_rate": 3.5909578122234217e-06, "loss": 1.1311, "step": 19907 }, { "epoch": 0.38, "learning_rate": 3.590820357724608e-06, "loss": 0.8453, "step": 19908 }, { "epoch": 0.38, "learning_rate": 3.590682899152705e-06, "loss": 0.8962, "step": 19909 }, { "epoch": 0.38, "learning_rate": 3.5905454365082247e-06, "loss": 0.7463, "step": 19910 }, { "epoch": 0.38, "learning_rate": 3.5904079697916814e-06, "loss": 1.0034, "step": 19911 }, { "epoch": 0.38, "learning_rate": 3.5902704990035884e-06, "loss": 0.9771, "step": 19912 }, { "epoch": 0.38, "learning_rate": 3.59013302414446e-06, "loss": 1.1322, "step": 19913 }, { "epoch": 0.38, "learning_rate": 3.5899955452148065e-06, "loss": 0.8677, "step": 19914 }, { "epoch": 0.38, "learning_rate": 3.5898580622151437e-06, "loss": 1.1344, "step": 19915 }, { "epoch": 0.38, "learning_rate": 3.5897205751459848e-06, "loss": 1.0847, "step": 19916 }, { "epoch": 0.38, "learning_rate": 3.589583084007842e-06, "loss": 0.8508, "step": 19917 }, { "epoch": 0.38, "learning_rate": 3.5894455888012293e-06, "loss": 0.923, "step": 19918 }, { "epoch": 0.38, "learning_rate": 3.5893080895266606e-06, "loss": 0.9948, "step": 19919 }, { "epoch": 0.38, "learning_rate": 3.5891705861846486e-06, "loss": 0.8782, "step": 19920 }, { "epoch": 0.38, "learning_rate": 3.589033078775707e-06, "loss": 0.7913, "step": 19921 }, { "epoch": 0.38, "learning_rate": 3.58889556730035e-06, "loss": 0.8194, "step": 19922 }, { "epoch": 0.38, "learning_rate": 3.588758051759089e-06, "loss": 0.8389, "step": 19923 }, { "epoch": 0.38, "learning_rate": 3.5886205321524403e-06, "loss": 0.8459, "step": 19924 }, { "epoch": 0.38, "learning_rate": 3.5884830084809146e-06, "loss": 1.0296, "step": 19925 }, { "epoch": 0.38, "learning_rate": 3.5883454807450276e-06, "loss": 1.0248, "step": 19926 }, { "epoch": 0.38, "learning_rate": 3.5882079489452916e-06, "loss": 0.7233, "step": 19927 }, { "epoch": 0.38, "learning_rate": 3.5880704130822208e-06, "loss": 0.9462, "step": 19928 }, { "epoch": 0.38, "learning_rate": 3.5879328731563277e-06, "loss": 0.8903, "step": 19929 }, { "epoch": 0.38, "learning_rate": 3.5877953291681272e-06, "loss": 0.8289, "step": 19930 }, { "epoch": 0.38, "learning_rate": 3.5876577811181323e-06, "loss": 0.9291, "step": 19931 }, { "epoch": 0.38, "learning_rate": 3.5875202290068563e-06, "loss": 0.9205, "step": 19932 }, { "epoch": 0.38, "learning_rate": 3.587382672834813e-06, "loss": 0.9581, "step": 19933 }, { "epoch": 0.38, "learning_rate": 3.587245112602517e-06, "loss": 1.1133, "step": 19934 }, { "epoch": 0.38, "learning_rate": 3.58710754831048e-06, "loss": 0.7822, "step": 19935 }, { "epoch": 0.38, "learning_rate": 3.586969979959217e-06, "loss": 0.8182, "step": 19936 }, { "epoch": 0.38, "learning_rate": 3.586832407549242e-06, "loss": 1.0603, "step": 19937 }, { "epoch": 0.38, "learning_rate": 3.5866948310810677e-06, "loss": 1.0275, "step": 19938 }, { "epoch": 0.38, "learning_rate": 3.5865572505552083e-06, "loss": 0.8931, "step": 19939 }, { "epoch": 0.38, "learning_rate": 3.586419665972178e-06, "loss": 0.7757, "step": 19940 }, { "epoch": 0.38, "learning_rate": 3.586282077332489e-06, "loss": 0.9576, "step": 19941 }, { "epoch": 0.38, "learning_rate": 3.5861444846366565e-06, "loss": 1.0124, "step": 19942 }, { "epoch": 0.38, "learning_rate": 3.586006887885194e-06, "loss": 0.838, "step": 19943 }, { "epoch": 0.38, "learning_rate": 3.5858692870786147e-06, "loss": 0.954, "step": 19944 }, { "epoch": 0.38, "learning_rate": 3.5857316822174327e-06, "loss": 1.0169, "step": 19945 }, { "epoch": 0.38, "learning_rate": 3.585594073302162e-06, "loss": 1.0535, "step": 19946 }, { "epoch": 0.38, "learning_rate": 3.585456460333316e-06, "loss": 0.9215, "step": 19947 }, { "epoch": 0.38, "learning_rate": 3.5853188433114096e-06, "loss": 0.9876, "step": 19948 }, { "epoch": 0.38, "learning_rate": 3.5851812222369565e-06, "loss": 1.1034, "step": 19949 }, { "epoch": 0.38, "learning_rate": 3.5850435971104684e-06, "loss": 1.168, "step": 19950 }, { "epoch": 0.38, "learning_rate": 3.5849059679324616e-06, "loss": 0.9427, "step": 19951 }, { "epoch": 0.38, "learning_rate": 3.584768334703449e-06, "loss": 1.0013, "step": 19952 }, { "epoch": 0.38, "learning_rate": 3.584630697423944e-06, "loss": 0.8849, "step": 19953 }, { "epoch": 0.38, "learning_rate": 3.5844930560944623e-06, "loss": 0.7543, "step": 19954 }, { "epoch": 0.38, "learning_rate": 3.5843554107155164e-06, "loss": 0.7214, "step": 19955 }, { "epoch": 0.38, "learning_rate": 3.584217761287621e-06, "loss": 1.0424, "step": 19956 }, { "epoch": 0.38, "learning_rate": 3.584080107811289e-06, "loss": 1.0363, "step": 19957 }, { "epoch": 0.38, "learning_rate": 3.5839424502870363e-06, "loss": 0.9165, "step": 19958 }, { "epoch": 0.38, "learning_rate": 3.5838047887153743e-06, "loss": 0.8525, "step": 19959 }, { "epoch": 0.38, "learning_rate": 3.5836671230968188e-06, "loss": 0.8249, "step": 19960 }, { "epoch": 0.38, "learning_rate": 3.5835294534318844e-06, "loss": 0.9529, "step": 19961 }, { "epoch": 0.38, "learning_rate": 3.5833917797210836e-06, "loss": 1.0605, "step": 19962 }, { "epoch": 0.38, "learning_rate": 3.583254101964931e-06, "loss": 1.0792, "step": 19963 }, { "epoch": 0.38, "learning_rate": 3.5831164201639414e-06, "loss": 0.932, "step": 19964 }, { "epoch": 0.38, "learning_rate": 3.5829787343186275e-06, "loss": 1.1097, "step": 19965 }, { "epoch": 0.38, "learning_rate": 3.5828410444295046e-06, "loss": 0.9027, "step": 19966 }, { "epoch": 0.38, "learning_rate": 3.5827033504970865e-06, "loss": 1.0487, "step": 19967 }, { "epoch": 0.38, "learning_rate": 3.5825656525218868e-06, "loss": 1.1834, "step": 19968 }, { "epoch": 0.38, "learning_rate": 3.58242795050442e-06, "loss": 1.1102, "step": 19969 }, { "epoch": 0.38, "learning_rate": 3.582290244445202e-06, "loss": 0.8468, "step": 19970 }, { "epoch": 0.38, "learning_rate": 3.582152534344744e-06, "loss": 0.9094, "step": 19971 }, { "epoch": 0.38, "learning_rate": 3.582014820203562e-06, "loss": 1.0976, "step": 19972 }, { "epoch": 0.38, "learning_rate": 3.5818771020221695e-06, "loss": 0.8801, "step": 19973 }, { "epoch": 0.38, "learning_rate": 3.581739379801081e-06, "loss": 0.9879, "step": 19974 }, { "epoch": 0.38, "learning_rate": 3.5816016535408116e-06, "loss": 1.1668, "step": 19975 }, { "epoch": 0.38, "learning_rate": 3.5814639232418745e-06, "loss": 0.9023, "step": 19976 }, { "epoch": 0.38, "learning_rate": 3.581326188904784e-06, "loss": 0.9256, "step": 19977 }, { "epoch": 0.38, "learning_rate": 3.581188450530055e-06, "loss": 0.7813, "step": 19978 }, { "epoch": 0.38, "learning_rate": 3.581050708118201e-06, "loss": 0.8827, "step": 19979 }, { "epoch": 0.38, "learning_rate": 3.580912961669737e-06, "loss": 0.9968, "step": 19980 }, { "epoch": 0.38, "learning_rate": 3.5807752111851767e-06, "loss": 0.85, "step": 19981 }, { "epoch": 0.38, "learning_rate": 3.580637456665036e-06, "loss": 0.8902, "step": 19982 }, { "epoch": 0.38, "learning_rate": 3.580499698109828e-06, "loss": 0.7838, "step": 19983 }, { "epoch": 0.38, "learning_rate": 3.5803619355200665e-06, "loss": 1.0446, "step": 19984 }, { "epoch": 0.38, "learning_rate": 3.5802241688962676e-06, "loss": 0.8785, "step": 19985 }, { "epoch": 0.38, "learning_rate": 3.580086398238944e-06, "loss": 1.0991, "step": 19986 }, { "epoch": 0.38, "learning_rate": 3.5799486235486106e-06, "loss": 0.9514, "step": 19987 }, { "epoch": 0.38, "learning_rate": 3.579810844825783e-06, "loss": 0.999, "step": 19988 }, { "epoch": 0.38, "learning_rate": 3.5796730620709743e-06, "loss": 0.9232, "step": 19989 }, { "epoch": 0.38, "learning_rate": 3.5795352752846996e-06, "loss": 1.0, "step": 19990 }, { "epoch": 0.38, "learning_rate": 3.5793974844674734e-06, "loss": 0.9248, "step": 19991 }, { "epoch": 0.38, "learning_rate": 3.57925968961981e-06, "loss": 1.1116, "step": 19992 }, { "epoch": 0.38, "learning_rate": 3.5791218907422242e-06, "loss": 1.0922, "step": 19993 }, { "epoch": 0.38, "learning_rate": 3.57898408783523e-06, "loss": 0.9766, "step": 19994 }, { "epoch": 0.38, "learning_rate": 3.5788462808993424e-06, "loss": 0.8864, "step": 19995 }, { "epoch": 0.38, "learning_rate": 3.578708469935076e-06, "loss": 0.9137, "step": 19996 }, { "epoch": 0.38, "learning_rate": 3.5785706549429454e-06, "loss": 0.9642, "step": 19997 }, { "epoch": 0.38, "learning_rate": 3.5784328359234642e-06, "loss": 0.9529, "step": 19998 }, { "epoch": 0.38, "learning_rate": 3.5782950128771494e-06, "loss": 1.1546, "step": 19999 }, { "epoch": 0.38, "learning_rate": 3.5781571858045126e-06, "loss": 1.0597, "step": 20000 }, { "epoch": 0.38, "learning_rate": 3.5780193547060706e-06, "loss": 1.0016, "step": 20001 }, { "epoch": 0.38, "learning_rate": 3.5778815195823373e-06, "loss": 0.8975, "step": 20002 }, { "epoch": 0.38, "learning_rate": 3.577743680433827e-06, "loss": 0.7775, "step": 20003 }, { "epoch": 0.38, "learning_rate": 3.5776058372610557e-06, "loss": 0.7849, "step": 20004 }, { "epoch": 0.38, "learning_rate": 3.577467990064537e-06, "loss": 1.116, "step": 20005 }, { "epoch": 0.38, "learning_rate": 3.5773301388447857e-06, "loss": 0.9507, "step": 20006 }, { "epoch": 0.38, "learning_rate": 3.5771922836023165e-06, "loss": 0.7708, "step": 20007 }, { "epoch": 0.38, "learning_rate": 3.577054424337644e-06, "loss": 0.752, "step": 20008 }, { "epoch": 0.38, "learning_rate": 3.576916561051284e-06, "loss": 0.9372, "step": 20009 }, { "epoch": 0.38, "learning_rate": 3.5767786937437503e-06, "loss": 0.8817, "step": 20010 }, { "epoch": 0.38, "learning_rate": 3.5766408224155584e-06, "loss": 0.9943, "step": 20011 }, { "epoch": 0.38, "learning_rate": 3.5765029470672224e-06, "loss": 1.2623, "step": 20012 }, { "epoch": 0.38, "learning_rate": 3.5763650676992572e-06, "loss": 0.8101, "step": 20013 }, { "epoch": 0.38, "learning_rate": 3.5762271843121775e-06, "loss": 0.8092, "step": 20014 }, { "epoch": 0.38, "learning_rate": 3.5760892969064994e-06, "loss": 0.5845, "step": 20015 }, { "epoch": 0.38, "learning_rate": 3.575951405482736e-06, "loss": 1.0914, "step": 20016 }, { "epoch": 0.38, "learning_rate": 3.5758135100414036e-06, "loss": 0.924, "step": 20017 }, { "epoch": 0.38, "learning_rate": 3.575675610583017e-06, "loss": 1.077, "step": 20018 }, { "epoch": 0.38, "learning_rate": 3.57553770710809e-06, "loss": 1.1213, "step": 20019 }, { "epoch": 0.38, "learning_rate": 3.5753997996171384e-06, "loss": 0.8901, "step": 20020 }, { "epoch": 0.38, "learning_rate": 3.5752618881106764e-06, "loss": 0.9102, "step": 20021 }, { "epoch": 0.38, "learning_rate": 3.5751239725892194e-06, "loss": 0.8781, "step": 20022 }, { "epoch": 0.38, "learning_rate": 3.5749860530532832e-06, "loss": 0.7993, "step": 20023 }, { "epoch": 0.38, "learning_rate": 3.574848129503382e-06, "loss": 0.9274, "step": 20024 }, { "epoch": 0.38, "learning_rate": 3.5747102019400303e-06, "loss": 1.0252, "step": 20025 }, { "epoch": 0.38, "learning_rate": 3.5745722703637444e-06, "loss": 0.9588, "step": 20026 }, { "epoch": 0.38, "learning_rate": 3.5744343347750375e-06, "loss": 0.9557, "step": 20027 }, { "epoch": 0.38, "learning_rate": 3.574296395174427e-06, "loss": 0.9462, "step": 20028 }, { "epoch": 0.38, "learning_rate": 3.5741584515624254e-06, "loss": 0.8514, "step": 20029 }, { "epoch": 0.38, "learning_rate": 3.5740205039395496e-06, "loss": 0.8826, "step": 20030 }, { "epoch": 0.38, "learning_rate": 3.5738825523063147e-06, "loss": 1.1646, "step": 20031 }, { "epoch": 0.38, "learning_rate": 3.573744596663235e-06, "loss": 0.9911, "step": 20032 }, { "epoch": 0.38, "learning_rate": 3.5736066370108257e-06, "loss": 0.8199, "step": 20033 }, { "epoch": 0.38, "learning_rate": 3.573468673349602e-06, "loss": 1.0089, "step": 20034 }, { "epoch": 0.38, "learning_rate": 3.5733307056800794e-06, "loss": 0.9468, "step": 20035 }, { "epoch": 0.38, "learning_rate": 3.573192734002773e-06, "loss": 0.8854, "step": 20036 }, { "epoch": 0.38, "learning_rate": 3.5730547583181974e-06, "loss": 0.9228, "step": 20037 }, { "epoch": 0.38, "learning_rate": 3.5729167786268685e-06, "loss": 1.1045, "step": 20038 }, { "epoch": 0.38, "learning_rate": 3.5727787949293013e-06, "loss": 0.7866, "step": 20039 }, { "epoch": 0.38, "learning_rate": 3.572640807226011e-06, "loss": 0.9973, "step": 20040 }, { "epoch": 0.38, "learning_rate": 3.5725028155175132e-06, "loss": 1.0167, "step": 20041 }, { "epoch": 0.38, "learning_rate": 3.572364819804322e-06, "loss": 0.8737, "step": 20042 }, { "epoch": 0.38, "learning_rate": 3.5722268200869536e-06, "loss": 1.0413, "step": 20043 }, { "epoch": 0.38, "learning_rate": 3.5720888163659235e-06, "loss": 0.9968, "step": 20044 }, { "epoch": 0.38, "learning_rate": 3.5719508086417466e-06, "loss": 0.7617, "step": 20045 }, { "epoch": 0.38, "learning_rate": 3.5718127969149376e-06, "loss": 1.0767, "step": 20046 }, { "epoch": 0.38, "learning_rate": 3.571674781186013e-06, "loss": 1.0379, "step": 20047 }, { "epoch": 0.38, "learning_rate": 3.571536761455488e-06, "loss": 0.8403, "step": 20048 }, { "epoch": 0.38, "learning_rate": 3.5713987377238767e-06, "loss": 1.0427, "step": 20049 }, { "epoch": 0.38, "learning_rate": 3.571260709991696e-06, "loss": 1.0901, "step": 20050 }, { "epoch": 0.38, "learning_rate": 3.5711226782594605e-06, "loss": 0.9702, "step": 20051 }, { "epoch": 0.38, "learning_rate": 3.5709846425276856e-06, "loss": 1.0209, "step": 20052 }, { "epoch": 0.38, "learning_rate": 3.5708466027968874e-06, "loss": 0.9427, "step": 20053 }, { "epoch": 0.38, "learning_rate": 3.5707085590675807e-06, "loss": 0.8063, "step": 20054 }, { "epoch": 0.38, "learning_rate": 3.57057051134028e-06, "loss": 1.0426, "step": 20055 }, { "epoch": 0.38, "learning_rate": 3.5704324596155027e-06, "loss": 0.979, "step": 20056 }, { "epoch": 0.38, "learning_rate": 3.570294403893763e-06, "loss": 1.0933, "step": 20057 }, { "epoch": 0.38, "learning_rate": 3.570156344175577e-06, "loss": 0.858, "step": 20058 }, { "epoch": 0.38, "learning_rate": 3.570018280461461e-06, "loss": 1.1082, "step": 20059 }, { "epoch": 0.38, "learning_rate": 3.569880212751928e-06, "loss": 0.7528, "step": 20060 }, { "epoch": 0.38, "learning_rate": 3.5697421410474963e-06, "loss": 0.9171, "step": 20061 }, { "epoch": 0.38, "learning_rate": 3.56960406534868e-06, "loss": 1.2222, "step": 20062 }, { "epoch": 0.38, "learning_rate": 3.569465985655995e-06, "loss": 0.989, "step": 20063 }, { "epoch": 0.38, "learning_rate": 3.569327901969956e-06, "loss": 1.045, "step": 20064 }, { "epoch": 0.38, "learning_rate": 3.5691898142910797e-06, "loss": 0.9384, "step": 20065 }, { "epoch": 0.38, "learning_rate": 3.569051722619882e-06, "loss": 0.9569, "step": 20066 }, { "epoch": 0.38, "learning_rate": 3.568913626956877e-06, "loss": 0.8799, "step": 20067 }, { "epoch": 0.38, "learning_rate": 3.5687755273025825e-06, "loss": 1.1624, "step": 20068 }, { "epoch": 0.38, "learning_rate": 3.5686374236575122e-06, "loss": 1.0083, "step": 20069 }, { "epoch": 0.38, "learning_rate": 3.5684993160221824e-06, "loss": 0.9377, "step": 20070 }, { "epoch": 0.38, "learning_rate": 3.5683612043971093e-06, "loss": 0.986, "step": 20071 }, { "epoch": 0.38, "learning_rate": 3.568223088782808e-06, "loss": 0.7974, "step": 20072 }, { "epoch": 0.38, "learning_rate": 3.5680849691797944e-06, "loss": 0.9613, "step": 20073 }, { "epoch": 0.38, "learning_rate": 3.5679468455885847e-06, "loss": 0.8615, "step": 20074 }, { "epoch": 0.38, "learning_rate": 3.567808718009694e-06, "loss": 1.1147, "step": 20075 }, { "epoch": 0.38, "learning_rate": 3.5676705864436377e-06, "loss": 1.0249, "step": 20076 }, { "epoch": 0.38, "learning_rate": 3.5675324508909325e-06, "loss": 0.7271, "step": 20077 }, { "epoch": 0.38, "learning_rate": 3.5673943113520935e-06, "loss": 0.8911, "step": 20078 }, { "epoch": 0.38, "learning_rate": 3.5672561678276372e-06, "loss": 0.9049, "step": 20079 }, { "epoch": 0.38, "learning_rate": 3.5671180203180798e-06, "loss": 0.9028, "step": 20080 }, { "epoch": 0.38, "learning_rate": 3.566979868823936e-06, "loss": 1.0936, "step": 20081 }, { "epoch": 0.38, "learning_rate": 3.5668417133457223e-06, "loss": 1.0185, "step": 20082 }, { "epoch": 0.38, "learning_rate": 3.566703553883954e-06, "loss": 0.8154, "step": 20083 }, { "epoch": 0.38, "learning_rate": 3.566565390439147e-06, "loss": 0.8086, "step": 20084 }, { "epoch": 0.38, "learning_rate": 3.566427223011818e-06, "loss": 0.8293, "step": 20085 }, { "epoch": 0.38, "learning_rate": 3.566289051602482e-06, "loss": 0.8814, "step": 20086 }, { "epoch": 0.38, "learning_rate": 3.5661508762116557e-06, "loss": 1.1129, "step": 20087 }, { "epoch": 0.38, "learning_rate": 3.566012696839855e-06, "loss": 0.7945, "step": 20088 }, { "epoch": 0.38, "learning_rate": 3.5658745134875956e-06, "loss": 0.8447, "step": 20089 }, { "epoch": 0.38, "learning_rate": 3.5657363261553936e-06, "loss": 0.759, "step": 20090 }, { "epoch": 0.38, "learning_rate": 3.565598134843764e-06, "loss": 0.9161, "step": 20091 }, { "epoch": 0.38, "learning_rate": 3.5654599395532235e-06, "loss": 0.9239, "step": 20092 }, { "epoch": 0.38, "learning_rate": 3.565321740284289e-06, "loss": 0.9256, "step": 20093 }, { "epoch": 0.38, "learning_rate": 3.5651835370374754e-06, "loss": 1.118, "step": 20094 }, { "epoch": 0.38, "learning_rate": 3.5650453298132996e-06, "loss": 1.0533, "step": 20095 }, { "epoch": 0.38, "learning_rate": 3.564907118612277e-06, "loss": 0.8682, "step": 20096 }, { "epoch": 0.38, "learning_rate": 3.5647689034349236e-06, "loss": 0.8141, "step": 20097 }, { "epoch": 0.38, "learning_rate": 3.564630684281756e-06, "loss": 0.8283, "step": 20098 }, { "epoch": 0.38, "learning_rate": 3.5644924611532892e-06, "loss": 1.0175, "step": 20099 }, { "epoch": 0.38, "learning_rate": 3.5643542340500414e-06, "loss": 1.1208, "step": 20100 }, { "epoch": 0.38, "learning_rate": 3.5642160029725276e-06, "loss": 0.8764, "step": 20101 }, { "epoch": 0.38, "learning_rate": 3.564077767921263e-06, "loss": 0.8208, "step": 20102 }, { "epoch": 0.38, "learning_rate": 3.563939528896765e-06, "loss": 1.0232, "step": 20103 }, { "epoch": 0.38, "learning_rate": 3.56380128589955e-06, "loss": 0.9725, "step": 20104 }, { "epoch": 0.38, "learning_rate": 3.563663038930133e-06, "loss": 1.0593, "step": 20105 }, { "epoch": 0.38, "learning_rate": 3.56352478798903e-06, "loss": 1.0928, "step": 20106 }, { "epoch": 0.38, "learning_rate": 3.563386533076759e-06, "loss": 0.8964, "step": 20107 }, { "epoch": 0.38, "learning_rate": 3.5632482741938355e-06, "loss": 0.7873, "step": 20108 }, { "epoch": 0.38, "learning_rate": 3.563110011340775e-06, "loss": 0.9888, "step": 20109 }, { "epoch": 0.38, "learning_rate": 3.562971744518095e-06, "loss": 0.8411, "step": 20110 }, { "epoch": 0.38, "learning_rate": 3.56283347372631e-06, "loss": 0.9406, "step": 20111 }, { "epoch": 0.38, "learning_rate": 3.5626951989659385e-06, "loss": 1.121, "step": 20112 }, { "epoch": 0.38, "learning_rate": 3.5625569202374953e-06, "loss": 1.0716, "step": 20113 }, { "epoch": 0.38, "learning_rate": 3.5624186375414973e-06, "loss": 0.9119, "step": 20114 }, { "epoch": 0.38, "learning_rate": 3.562280350878461e-06, "loss": 1.0192, "step": 20115 }, { "epoch": 0.38, "learning_rate": 3.5621420602489013e-06, "loss": 0.9141, "step": 20116 }, { "epoch": 0.38, "learning_rate": 3.5620037656533364e-06, "loss": 1.0228, "step": 20117 }, { "epoch": 0.38, "learning_rate": 3.5618654670922825e-06, "loss": 1.0875, "step": 20118 }, { "epoch": 0.38, "learning_rate": 3.5617271645662542e-06, "loss": 1.1169, "step": 20119 }, { "epoch": 0.38, "learning_rate": 3.5615888580757696e-06, "loss": 0.8352, "step": 20120 }, { "epoch": 0.38, "learning_rate": 3.5614505476213457e-06, "loss": 1.0163, "step": 20121 }, { "epoch": 0.38, "learning_rate": 3.561312233203498e-06, "loss": 0.9633, "step": 20122 }, { "epoch": 0.38, "learning_rate": 3.561173914822742e-06, "loss": 0.9802, "step": 20123 }, { "epoch": 0.38, "learning_rate": 3.561035592479596e-06, "loss": 1.065, "step": 20124 }, { "epoch": 0.38, "learning_rate": 3.5608972661745744e-06, "loss": 1.3812, "step": 20125 }, { "epoch": 0.38, "learning_rate": 3.5607589359081956e-06, "loss": 0.7717, "step": 20126 }, { "epoch": 0.38, "learning_rate": 3.560620601680976e-06, "loss": 0.8923, "step": 20127 }, { "epoch": 0.38, "learning_rate": 3.560482263493431e-06, "loss": 1.0358, "step": 20128 }, { "epoch": 0.38, "learning_rate": 3.5603439213460778e-06, "loss": 0.6152, "step": 20129 }, { "epoch": 0.38, "learning_rate": 3.560205575239433e-06, "loss": 1.0562, "step": 20130 }, { "epoch": 0.38, "learning_rate": 3.560067225174013e-06, "loss": 1.1079, "step": 20131 }, { "epoch": 0.38, "learning_rate": 3.559928871150334e-06, "loss": 1.1028, "step": 20132 }, { "epoch": 0.38, "learning_rate": 3.559790513168914e-06, "loss": 0.8974, "step": 20133 }, { "epoch": 0.38, "learning_rate": 3.5596521512302686e-06, "loss": 1.0448, "step": 20134 }, { "epoch": 0.38, "learning_rate": 3.5595137853349138e-06, "loss": 0.8895, "step": 20135 }, { "epoch": 0.38, "learning_rate": 3.5593754154833683e-06, "loss": 0.8978, "step": 20136 }, { "epoch": 0.38, "learning_rate": 3.5592370416761468e-06, "loss": 1.1511, "step": 20137 }, { "epoch": 0.38, "learning_rate": 3.559098663913766e-06, "loss": 1.0076, "step": 20138 }, { "epoch": 0.38, "learning_rate": 3.5589602821967444e-06, "loss": 0.8296, "step": 20139 }, { "epoch": 0.38, "learning_rate": 3.5588218965255966e-06, "loss": 0.7405, "step": 20140 }, { "epoch": 0.38, "learning_rate": 3.5586835069008407e-06, "loss": 0.8868, "step": 20141 }, { "epoch": 0.38, "learning_rate": 3.558545113322993e-06, "loss": 0.8065, "step": 20142 }, { "epoch": 0.38, "learning_rate": 3.5584067157925704e-06, "loss": 0.9451, "step": 20143 }, { "epoch": 0.38, "learning_rate": 3.5582683143100894e-06, "loss": 1.1059, "step": 20144 }, { "epoch": 0.38, "learning_rate": 3.558129908876068e-06, "loss": 0.7613, "step": 20145 }, { "epoch": 0.38, "learning_rate": 3.55799149949102e-06, "loss": 0.7893, "step": 20146 }, { "epoch": 0.38, "learning_rate": 3.5578530861554663e-06, "loss": 0.9963, "step": 20147 }, { "epoch": 0.38, "learning_rate": 3.55771466886992e-06, "loss": 0.7394, "step": 20148 }, { "epoch": 0.38, "learning_rate": 3.5575762476349003e-06, "loss": 0.9081, "step": 20149 }, { "epoch": 0.38, "learning_rate": 3.5574378224509224e-06, "loss": 1.1965, "step": 20150 }, { "epoch": 0.38, "learning_rate": 3.5572993933185056e-06, "loss": 0.9687, "step": 20151 }, { "epoch": 0.38, "learning_rate": 3.557160960238164e-06, "loss": 0.8831, "step": 20152 }, { "epoch": 0.38, "learning_rate": 3.5570225232104166e-06, "loss": 0.9662, "step": 20153 }, { "epoch": 0.38, "learning_rate": 3.556884082235779e-06, "loss": 0.8903, "step": 20154 }, { "epoch": 0.38, "learning_rate": 3.556745637314769e-06, "loss": 1.0153, "step": 20155 }, { "epoch": 0.38, "learning_rate": 3.5566071884479023e-06, "loss": 1.1572, "step": 20156 }, { "epoch": 0.38, "learning_rate": 3.5564687356356986e-06, "loss": 0.9577, "step": 20157 }, { "epoch": 0.38, "learning_rate": 3.5563302788786714e-06, "loss": 1.0807, "step": 20158 }, { "epoch": 0.38, "learning_rate": 3.5561918181773396e-06, "loss": 0.9343, "step": 20159 }, { "epoch": 0.38, "learning_rate": 3.5560533535322207e-06, "loss": 0.8846, "step": 20160 }, { "epoch": 0.38, "learning_rate": 3.55591488494383e-06, "loss": 0.8151, "step": 20161 }, { "epoch": 0.38, "learning_rate": 3.5557764124126858e-06, "loss": 0.8233, "step": 20162 }, { "epoch": 0.38, "learning_rate": 3.5556379359393057e-06, "loss": 1.0756, "step": 20163 }, { "epoch": 0.38, "learning_rate": 3.555499455524205e-06, "loss": 0.8311, "step": 20164 }, { "epoch": 0.38, "learning_rate": 3.5553609711679017e-06, "loss": 0.9961, "step": 20165 }, { "epoch": 0.38, "learning_rate": 3.5552224828709137e-06, "loss": 0.8646, "step": 20166 }, { "epoch": 0.38, "learning_rate": 3.5550839906337566e-06, "loss": 0.9979, "step": 20167 }, { "epoch": 0.38, "learning_rate": 3.5549454944569477e-06, "loss": 1.0997, "step": 20168 }, { "epoch": 0.38, "learning_rate": 3.5548069943410057e-06, "loss": 1.0899, "step": 20169 }, { "epoch": 0.38, "learning_rate": 3.554668490286446e-06, "loss": 0.7414, "step": 20170 }, { "epoch": 0.38, "learning_rate": 3.5545299822937867e-06, "loss": 0.8629, "step": 20171 }, { "epoch": 0.38, "learning_rate": 3.5543914703635453e-06, "loss": 0.9923, "step": 20172 }, { "epoch": 0.38, "learning_rate": 3.554252954496238e-06, "loss": 0.7272, "step": 20173 }, { "epoch": 0.38, "learning_rate": 3.554114434692382e-06, "loss": 1.0214, "step": 20174 }, { "epoch": 0.38, "learning_rate": 3.5539759109524956e-06, "loss": 1.0612, "step": 20175 }, { "epoch": 0.38, "learning_rate": 3.5538373832770958e-06, "loss": 0.8587, "step": 20176 }, { "epoch": 0.38, "learning_rate": 3.5536988516666985e-06, "loss": 0.9937, "step": 20177 }, { "epoch": 0.38, "learning_rate": 3.5535603161218234e-06, "loss": 1.0343, "step": 20178 }, { "epoch": 0.38, "learning_rate": 3.5534217766429856e-06, "loss": 0.7235, "step": 20179 }, { "epoch": 0.38, "learning_rate": 3.5532832332307034e-06, "loss": 0.86, "step": 20180 }, { "epoch": 0.38, "learning_rate": 3.553144685885494e-06, "loss": 1.3473, "step": 20181 }, { "epoch": 0.38, "learning_rate": 3.5530061346078738e-06, "loss": 0.7012, "step": 20182 }, { "epoch": 0.38, "learning_rate": 3.5528675793983614e-06, "loss": 0.7007, "step": 20183 }, { "epoch": 0.38, "learning_rate": 3.552729020257474e-06, "loss": 0.6386, "step": 20184 }, { "epoch": 0.38, "learning_rate": 3.552590457185728e-06, "loss": 1.0133, "step": 20185 }, { "epoch": 0.38, "learning_rate": 3.5524518901836423e-06, "loss": 0.9654, "step": 20186 }, { "epoch": 0.38, "learning_rate": 3.552313319251734e-06, "loss": 1.3125, "step": 20187 }, { "epoch": 0.38, "learning_rate": 3.552174744390519e-06, "loss": 1.1049, "step": 20188 }, { "epoch": 0.38, "learning_rate": 3.5520361656005165e-06, "loss": 0.9294, "step": 20189 }, { "epoch": 0.38, "learning_rate": 3.551897582882242e-06, "loss": 1.0424, "step": 20190 }, { "epoch": 0.38, "learning_rate": 3.5517589962362154e-06, "loss": 0.8247, "step": 20191 }, { "epoch": 0.38, "learning_rate": 3.551620405662952e-06, "loss": 1.0504, "step": 20192 }, { "epoch": 0.38, "learning_rate": 3.5514818111629717e-06, "loss": 0.9178, "step": 20193 }, { "epoch": 0.38, "learning_rate": 3.5513432127367897e-06, "loss": 0.9895, "step": 20194 }, { "epoch": 0.38, "learning_rate": 3.551204610384924e-06, "loss": 0.8038, "step": 20195 }, { "epoch": 0.38, "learning_rate": 3.5510660041078926e-06, "loss": 0.6805, "step": 20196 }, { "epoch": 0.38, "learning_rate": 3.5509273939062134e-06, "loss": 0.8614, "step": 20197 }, { "epoch": 0.38, "learning_rate": 3.5507887797804032e-06, "loss": 0.7881, "step": 20198 }, { "epoch": 0.38, "learning_rate": 3.5506501617309802e-06, "loss": 0.9504, "step": 20199 }, { "epoch": 0.38, "learning_rate": 3.5505115397584614e-06, "loss": 0.9285, "step": 20200 }, { "epoch": 0.38, "learning_rate": 3.5503729138633653e-06, "loss": 0.9409, "step": 20201 }, { "epoch": 0.38, "learning_rate": 3.550234284046209e-06, "loss": 0.8819, "step": 20202 }, { "epoch": 0.38, "learning_rate": 3.550095650307509e-06, "loss": 0.8021, "step": 20203 }, { "epoch": 0.38, "learning_rate": 3.5499570126477843e-06, "loss": 0.9337, "step": 20204 }, { "epoch": 0.38, "learning_rate": 3.549818371067553e-06, "loss": 0.7039, "step": 20205 }, { "epoch": 0.38, "learning_rate": 3.5496797255673314e-06, "loss": 1.2125, "step": 20206 }, { "epoch": 0.38, "learning_rate": 3.5495410761476383e-06, "loss": 1.2038, "step": 20207 }, { "epoch": 0.38, "learning_rate": 3.549402422808992e-06, "loss": 0.8492, "step": 20208 }, { "epoch": 0.38, "learning_rate": 3.5492637655519074e-06, "loss": 0.7433, "step": 20209 }, { "epoch": 0.38, "learning_rate": 3.5491251043769047e-06, "loss": 0.7932, "step": 20210 }, { "epoch": 0.38, "learning_rate": 3.5489864392845013e-06, "loss": 0.8112, "step": 20211 }, { "epoch": 0.38, "learning_rate": 3.5488477702752146e-06, "loss": 1.0824, "step": 20212 }, { "epoch": 0.38, "learning_rate": 3.5487090973495623e-06, "loss": 0.9332, "step": 20213 }, { "epoch": 0.38, "learning_rate": 3.5485704205080627e-06, "loss": 1.0024, "step": 20214 }, { "epoch": 0.38, "learning_rate": 3.5484317397512338e-06, "loss": 0.8634, "step": 20215 }, { "epoch": 0.38, "learning_rate": 3.5482930550795913e-06, "loss": 0.945, "step": 20216 }, { "epoch": 0.38, "learning_rate": 3.548154366493656e-06, "loss": 1.0117, "step": 20217 }, { "epoch": 0.38, "learning_rate": 3.548015673993944e-06, "loss": 0.9182, "step": 20218 }, { "epoch": 0.38, "learning_rate": 3.5478769775809733e-06, "loss": 1.0579, "step": 20219 }, { "epoch": 0.38, "learning_rate": 3.5477382772552633e-06, "loss": 1.1166, "step": 20220 }, { "epoch": 0.38, "learning_rate": 3.5475995730173296e-06, "loss": 0.8722, "step": 20221 }, { "epoch": 0.38, "learning_rate": 3.547460864867691e-06, "loss": 1.0273, "step": 20222 }, { "epoch": 0.38, "learning_rate": 3.547322152806867e-06, "loss": 0.8912, "step": 20223 }, { "epoch": 0.38, "learning_rate": 3.5471834368353724e-06, "loss": 1.1933, "step": 20224 }, { "epoch": 0.38, "learning_rate": 3.5470447169537283e-06, "loss": 1.0421, "step": 20225 }, { "epoch": 0.38, "learning_rate": 3.546905993162451e-06, "loss": 1.0452, "step": 20226 }, { "epoch": 0.38, "learning_rate": 3.546767265462059e-06, "loss": 0.7975, "step": 20227 }, { "epoch": 0.38, "learning_rate": 3.54662853385307e-06, "loss": 0.8937, "step": 20228 }, { "epoch": 0.38, "learning_rate": 3.5464897983360018e-06, "loss": 0.9917, "step": 20229 }, { "epoch": 0.38, "learning_rate": 3.5463510589113725e-06, "loss": 0.772, "step": 20230 }, { "epoch": 0.38, "learning_rate": 3.5462123155797012e-06, "loss": 1.1992, "step": 20231 }, { "epoch": 0.38, "learning_rate": 3.5460735683415047e-06, "loss": 0.8818, "step": 20232 }, { "epoch": 0.38, "learning_rate": 3.5459348171973017e-06, "loss": 0.8881, "step": 20233 }, { "epoch": 0.38, "learning_rate": 3.5457960621476106e-06, "loss": 0.9693, "step": 20234 }, { "epoch": 0.38, "learning_rate": 3.5456573031929486e-06, "loss": 0.7274, "step": 20235 }, { "epoch": 0.38, "learning_rate": 3.5455185403338344e-06, "loss": 0.9811, "step": 20236 }, { "epoch": 0.38, "learning_rate": 3.545379773570786e-06, "loss": 1.1867, "step": 20237 }, { "epoch": 0.38, "learning_rate": 3.5452410029043214e-06, "loss": 1.1128, "step": 20238 }, { "epoch": 0.38, "learning_rate": 3.545102228334959e-06, "loss": 0.8027, "step": 20239 }, { "epoch": 0.38, "learning_rate": 3.5449634498632174e-06, "loss": 1.0579, "step": 20240 }, { "epoch": 0.38, "learning_rate": 3.544824667489614e-06, "loss": 0.8598, "step": 20241 }, { "epoch": 0.38, "learning_rate": 3.5446858812146674e-06, "loss": 0.7108, "step": 20242 }, { "epoch": 0.38, "learning_rate": 3.5445470910388957e-06, "loss": 1.0849, "step": 20243 }, { "epoch": 0.38, "learning_rate": 3.5444082969628176e-06, "loss": 1.0847, "step": 20244 }, { "epoch": 0.38, "learning_rate": 3.54426949898695e-06, "loss": 0.9118, "step": 20245 }, { "epoch": 0.38, "learning_rate": 3.544130697111813e-06, "loss": 0.8844, "step": 20246 }, { "epoch": 0.38, "learning_rate": 3.5439918913379227e-06, "loss": 0.923, "step": 20247 }, { "epoch": 0.38, "learning_rate": 3.5438530816658e-06, "loss": 0.924, "step": 20248 }, { "epoch": 0.38, "learning_rate": 3.5437142680959618e-06, "loss": 0.9869, "step": 20249 }, { "epoch": 0.38, "learning_rate": 3.543575450628926e-06, "loss": 1.0816, "step": 20250 }, { "epoch": 0.38, "learning_rate": 3.5434366292652115e-06, "loss": 1.0633, "step": 20251 }, { "epoch": 0.38, "learning_rate": 3.543297804005337e-06, "loss": 0.8511, "step": 20252 }, { "epoch": 0.38, "learning_rate": 3.5431589748498195e-06, "loss": 1.1697, "step": 20253 }, { "epoch": 0.38, "learning_rate": 3.5430201417991793e-06, "loss": 1.0015, "step": 20254 }, { "epoch": 0.38, "learning_rate": 3.5428813048539345e-06, "loss": 1.0037, "step": 20255 }, { "epoch": 0.38, "learning_rate": 3.542742464014602e-06, "loss": 1.0513, "step": 20256 }, { "epoch": 0.38, "learning_rate": 3.542603619281701e-06, "loss": 1.0258, "step": 20257 }, { "epoch": 0.38, "learning_rate": 3.5424647706557503e-06, "loss": 0.8909, "step": 20258 }, { "epoch": 0.38, "learning_rate": 3.5423259181372678e-06, "loss": 1.0255, "step": 20259 }, { "epoch": 0.38, "learning_rate": 3.542187061726772e-06, "loss": 0.7477, "step": 20260 }, { "epoch": 0.38, "learning_rate": 3.5420482014247828e-06, "loss": 0.7926, "step": 20261 }, { "epoch": 0.38, "learning_rate": 3.541909337231817e-06, "loss": 1.166, "step": 20262 }, { "epoch": 0.38, "learning_rate": 3.5417704691483934e-06, "loss": 0.9493, "step": 20263 }, { "epoch": 0.38, "learning_rate": 3.5416315971750316e-06, "loss": 0.8033, "step": 20264 }, { "epoch": 0.38, "learning_rate": 3.5414927213122486e-06, "loss": 0.9589, "step": 20265 }, { "epoch": 0.38, "learning_rate": 3.5413538415605637e-06, "loss": 0.9164, "step": 20266 }, { "epoch": 0.38, "learning_rate": 3.5412149579204957e-06, "loss": 0.8624, "step": 20267 }, { "epoch": 0.38, "learning_rate": 3.541076070392563e-06, "loss": 0.9474, "step": 20268 }, { "epoch": 0.38, "learning_rate": 3.540937178977284e-06, "loss": 0.8983, "step": 20269 }, { "epoch": 0.38, "learning_rate": 3.5407982836751783e-06, "loss": 1.0903, "step": 20270 }, { "epoch": 0.38, "learning_rate": 3.540659384486763e-06, "loss": 0.8518, "step": 20271 }, { "epoch": 0.38, "learning_rate": 3.540520481412557e-06, "loss": 1.0127, "step": 20272 }, { "epoch": 0.38, "learning_rate": 3.54038157445308e-06, "loss": 0.8832, "step": 20273 }, { "epoch": 0.38, "learning_rate": 3.54024266360885e-06, "loss": 0.9418, "step": 20274 }, { "epoch": 0.38, "learning_rate": 3.540103748880386e-06, "loss": 1.0653, "step": 20275 }, { "epoch": 0.38, "learning_rate": 3.5399648302682067e-06, "loss": 0.9233, "step": 20276 }, { "epoch": 0.38, "learning_rate": 3.5398259077728304e-06, "loss": 0.922, "step": 20277 }, { "epoch": 0.38, "learning_rate": 3.5396869813947752e-06, "loss": 0.9951, "step": 20278 }, { "epoch": 0.38, "learning_rate": 3.5395480511345614e-06, "loss": 0.862, "step": 20279 }, { "epoch": 0.38, "learning_rate": 3.539409116992707e-06, "loss": 0.7969, "step": 20280 }, { "epoch": 0.38, "learning_rate": 3.539270178969731e-06, "loss": 1.0085, "step": 20281 }, { "epoch": 0.38, "learning_rate": 3.5391312370661523e-06, "loss": 0.8147, "step": 20282 }, { "epoch": 0.38, "learning_rate": 3.5389922912824885e-06, "loss": 0.9098, "step": 20283 }, { "epoch": 0.38, "learning_rate": 3.53885334161926e-06, "loss": 0.988, "step": 20284 }, { "epoch": 0.38, "learning_rate": 3.5387143880769853e-06, "loss": 0.9974, "step": 20285 }, { "epoch": 0.38, "learning_rate": 3.5385754306561815e-06, "loss": 0.8034, "step": 20286 }, { "epoch": 0.38, "learning_rate": 3.53843646935737e-06, "loss": 1.0364, "step": 20287 }, { "epoch": 0.38, "learning_rate": 3.5382975041810685e-06, "loss": 0.8847, "step": 20288 }, { "epoch": 0.38, "learning_rate": 3.538158535127796e-06, "loss": 0.6671, "step": 20289 }, { "epoch": 0.38, "learning_rate": 3.5380195621980713e-06, "loss": 0.9904, "step": 20290 }, { "epoch": 0.38, "learning_rate": 3.5378805853924137e-06, "loss": 0.8361, "step": 20291 }, { "epoch": 0.38, "learning_rate": 3.537741604711341e-06, "loss": 1.0205, "step": 20292 }, { "epoch": 0.38, "learning_rate": 3.537602620155373e-06, "loss": 0.9258, "step": 20293 }, { "epoch": 0.38, "learning_rate": 3.5374636317250288e-06, "loss": 1.0695, "step": 20294 }, { "epoch": 0.38, "learning_rate": 3.5373246394208277e-06, "loss": 1.0151, "step": 20295 }, { "epoch": 0.38, "learning_rate": 3.5371856432432877e-06, "loss": 0.921, "step": 20296 }, { "epoch": 0.38, "learning_rate": 3.537046643192929e-06, "loss": 0.7105, "step": 20297 }, { "epoch": 0.38, "learning_rate": 3.5369076392702694e-06, "loss": 1.0217, "step": 20298 }, { "epoch": 0.38, "learning_rate": 3.5367686314758284e-06, "loss": 1.0717, "step": 20299 }, { "epoch": 0.38, "learning_rate": 3.5366296198101253e-06, "loss": 0.972, "step": 20300 }, { "epoch": 0.38, "learning_rate": 3.5364906042736786e-06, "loss": 0.9774, "step": 20301 }, { "epoch": 0.38, "learning_rate": 3.5363515848670075e-06, "loss": 0.8273, "step": 20302 }, { "epoch": 0.38, "learning_rate": 3.536212561590633e-06, "loss": 0.8608, "step": 20303 }, { "epoch": 0.38, "learning_rate": 3.5360735344450716e-06, "loss": 0.8958, "step": 20304 }, { "epoch": 0.38, "learning_rate": 3.5359345034308427e-06, "loss": 0.9828, "step": 20305 }, { "epoch": 0.38, "learning_rate": 3.5357954685484676e-06, "loss": 0.7837, "step": 20306 }, { "epoch": 0.38, "learning_rate": 3.535656429798462e-06, "loss": 1.0834, "step": 20307 }, { "epoch": 0.38, "learning_rate": 3.535517387181348e-06, "loss": 0.9201, "step": 20308 }, { "epoch": 0.38, "learning_rate": 3.5353783406976446e-06, "loss": 0.8489, "step": 20309 }, { "epoch": 0.38, "learning_rate": 3.5352392903478693e-06, "loss": 0.6841, "step": 20310 }, { "epoch": 0.38, "learning_rate": 3.5351002361325427e-06, "loss": 0.6677, "step": 20311 }, { "epoch": 0.38, "learning_rate": 3.5349611780521836e-06, "loss": 1.0552, "step": 20312 }, { "epoch": 0.38, "learning_rate": 3.5348221161073104e-06, "loss": 0.9492, "step": 20313 }, { "epoch": 0.38, "learning_rate": 3.5346830502984444e-06, "loss": 0.8741, "step": 20314 }, { "epoch": 0.38, "learning_rate": 3.5345439806261023e-06, "loss": 1.0174, "step": 20315 }, { "epoch": 0.38, "learning_rate": 3.5344049070908054e-06, "loss": 0.7144, "step": 20316 }, { "epoch": 0.38, "learning_rate": 3.5342658296930722e-06, "loss": 0.845, "step": 20317 }, { "epoch": 0.38, "learning_rate": 3.5341267484334223e-06, "loss": 1.1649, "step": 20318 }, { "epoch": 0.38, "learning_rate": 3.533987663312375e-06, "loss": 1.0428, "step": 20319 }, { "epoch": 0.38, "learning_rate": 3.5338485743304485e-06, "loss": 0.9468, "step": 20320 }, { "epoch": 0.38, "learning_rate": 3.5337094814881634e-06, "loss": 0.7019, "step": 20321 }, { "epoch": 0.38, "learning_rate": 3.533570384786039e-06, "loss": 0.8798, "step": 20322 }, { "epoch": 0.38, "learning_rate": 3.533431284224595e-06, "loss": 0.6727, "step": 20323 }, { "epoch": 0.38, "learning_rate": 3.5332921798043503e-06, "loss": 0.9753, "step": 20324 }, { "epoch": 0.38, "learning_rate": 3.5331530715258233e-06, "loss": 0.914, "step": 20325 }, { "epoch": 0.38, "learning_rate": 3.533013959389535e-06, "loss": 0.7235, "step": 20326 }, { "epoch": 0.38, "learning_rate": 3.532874843396005e-06, "loss": 0.8355, "step": 20327 }, { "epoch": 0.38, "learning_rate": 3.5327357235457503e-06, "loss": 0.8184, "step": 20328 }, { "epoch": 0.38, "learning_rate": 3.532596599839293e-06, "loss": 0.8043, "step": 20329 }, { "epoch": 0.38, "learning_rate": 3.532457472277152e-06, "loss": 1.0322, "step": 20330 }, { "epoch": 0.38, "learning_rate": 3.532318340859846e-06, "loss": 0.9092, "step": 20331 }, { "epoch": 0.38, "learning_rate": 3.532179205587895e-06, "loss": 0.9091, "step": 20332 }, { "epoch": 0.38, "learning_rate": 3.5320400664618186e-06, "loss": 1.0906, "step": 20333 }, { "epoch": 0.38, "learning_rate": 3.5319009234821367e-06, "loss": 1.0118, "step": 20334 }, { "epoch": 0.38, "learning_rate": 3.5317617766493673e-06, "loss": 0.8089, "step": 20335 }, { "epoch": 0.38, "learning_rate": 3.531622625964032e-06, "loss": 0.9156, "step": 20336 }, { "epoch": 0.38, "learning_rate": 3.5314834714266486e-06, "loss": 1.2394, "step": 20337 }, { "epoch": 0.38, "learning_rate": 3.531344313037738e-06, "loss": 0.8663, "step": 20338 }, { "epoch": 0.38, "learning_rate": 3.5312051507978195e-06, "loss": 1.0712, "step": 20339 }, { "epoch": 0.38, "learning_rate": 3.5310659847074125e-06, "loss": 0.9761, "step": 20340 }, { "epoch": 0.38, "learning_rate": 3.5309268147670366e-06, "loss": 0.8662, "step": 20341 }, { "epoch": 0.38, "learning_rate": 3.530787640977212e-06, "loss": 0.7778, "step": 20342 }, { "epoch": 0.38, "learning_rate": 3.5306484633384573e-06, "loss": 0.8955, "step": 20343 }, { "epoch": 0.38, "learning_rate": 3.530509281851293e-06, "loss": 1.1363, "step": 20344 }, { "epoch": 0.38, "learning_rate": 3.530370096516239e-06, "loss": 1.0569, "step": 20345 }, { "epoch": 0.38, "learning_rate": 3.530230907333815e-06, "loss": 0.8353, "step": 20346 }, { "epoch": 0.38, "learning_rate": 3.53009171430454e-06, "loss": 0.8915, "step": 20347 }, { "epoch": 0.38, "learning_rate": 3.5299525174289338e-06, "loss": 0.8912, "step": 20348 }, { "epoch": 0.38, "learning_rate": 3.529813316707516e-06, "loss": 1.1163, "step": 20349 }, { "epoch": 0.38, "learning_rate": 3.5296741121408078e-06, "loss": 0.952, "step": 20350 }, { "epoch": 0.38, "learning_rate": 3.5295349037293275e-06, "loss": 0.8944, "step": 20351 }, { "epoch": 0.38, "learning_rate": 3.5293956914735954e-06, "loss": 0.8135, "step": 20352 }, { "epoch": 0.38, "learning_rate": 3.529256475374132e-06, "loss": 0.9498, "step": 20353 }, { "epoch": 0.38, "learning_rate": 3.5291172554314564e-06, "loss": 0.8955, "step": 20354 }, { "epoch": 0.38, "learning_rate": 3.528978031646088e-06, "loss": 1.0331, "step": 20355 }, { "epoch": 0.38, "learning_rate": 3.528838804018547e-06, "loss": 1.0997, "step": 20356 }, { "epoch": 0.38, "learning_rate": 3.5286995725493537e-06, "loss": 1.0805, "step": 20357 }, { "epoch": 0.38, "learning_rate": 3.528560337239028e-06, "loss": 0.998, "step": 20358 }, { "epoch": 0.38, "learning_rate": 3.52842109808809e-06, "loss": 0.6547, "step": 20359 }, { "epoch": 0.38, "learning_rate": 3.5282818550970582e-06, "loss": 0.9179, "step": 20360 }, { "epoch": 0.38, "learning_rate": 3.528142608266454e-06, "loss": 0.8663, "step": 20361 }, { "epoch": 0.38, "learning_rate": 3.5280033575967963e-06, "loss": 1.0028, "step": 20362 }, { "epoch": 0.38, "learning_rate": 3.5278641030886065e-06, "loss": 0.842, "step": 20363 }, { "epoch": 0.38, "learning_rate": 3.527724844742403e-06, "loss": 0.8728, "step": 20364 }, { "epoch": 0.38, "learning_rate": 3.5275855825587062e-06, "loss": 0.8943, "step": 20365 }, { "epoch": 0.38, "learning_rate": 3.5274463165380368e-06, "loss": 0.8074, "step": 20366 }, { "epoch": 0.38, "learning_rate": 3.5273070466809146e-06, "loss": 1.0487, "step": 20367 }, { "epoch": 0.38, "learning_rate": 3.527167772987859e-06, "loss": 0.9719, "step": 20368 }, { "epoch": 0.38, "learning_rate": 3.5270284954593904e-06, "loss": 1.0836, "step": 20369 }, { "epoch": 0.38, "learning_rate": 3.5268892140960282e-06, "loss": 0.9849, "step": 20370 }, { "epoch": 0.38, "learning_rate": 3.5267499288982944e-06, "loss": 1.0142, "step": 20371 }, { "epoch": 0.38, "learning_rate": 3.526610639866707e-06, "loss": 0.9018, "step": 20372 }, { "epoch": 0.38, "learning_rate": 3.5264713470017876e-06, "loss": 1.0668, "step": 20373 }, { "epoch": 0.38, "learning_rate": 3.5263320503040556e-06, "loss": 1.1879, "step": 20374 }, { "epoch": 0.38, "learning_rate": 3.526192749774031e-06, "loss": 1.0402, "step": 20375 }, { "epoch": 0.38, "learning_rate": 3.526053445412234e-06, "loss": 1.0389, "step": 20376 }, { "epoch": 0.38, "learning_rate": 3.5259141372191845e-06, "loss": 1.0224, "step": 20377 }, { "epoch": 0.38, "learning_rate": 3.525774825195404e-06, "loss": 1.0159, "step": 20378 }, { "epoch": 0.38, "learning_rate": 3.5256355093414107e-06, "loss": 0.8667, "step": 20379 }, { "epoch": 0.38, "learning_rate": 3.525496189657727e-06, "loss": 0.9153, "step": 20380 }, { "epoch": 0.38, "learning_rate": 3.525356866144871e-06, "loss": 1.3696, "step": 20381 }, { "epoch": 0.38, "learning_rate": 3.525217538803365e-06, "loss": 1.1353, "step": 20382 }, { "epoch": 0.38, "learning_rate": 3.525078207633727e-06, "loss": 0.93, "step": 20383 }, { "epoch": 0.38, "learning_rate": 3.5249388726364787e-06, "loss": 0.8728, "step": 20384 }, { "epoch": 0.38, "learning_rate": 3.5247995338121403e-06, "loss": 0.9384, "step": 20385 }, { "epoch": 0.38, "learning_rate": 3.5246601911612323e-06, "loss": 0.8597, "step": 20386 }, { "epoch": 0.38, "learning_rate": 3.524520844684274e-06, "loss": 1.0066, "step": 20387 }, { "epoch": 0.38, "learning_rate": 3.524381494381786e-06, "loss": 1.0157, "step": 20388 }, { "epoch": 0.38, "learning_rate": 3.52424214025429e-06, "loss": 0.8933, "step": 20389 }, { "epoch": 0.38, "learning_rate": 3.5241027823023044e-06, "loss": 0.889, "step": 20390 }, { "epoch": 0.38, "learning_rate": 3.5239634205263496e-06, "loss": 1.0889, "step": 20391 }, { "epoch": 0.38, "learning_rate": 3.5238240549269482e-06, "loss": 1.1398, "step": 20392 }, { "epoch": 0.38, "learning_rate": 3.5236846855046187e-06, "loss": 0.9842, "step": 20393 }, { "epoch": 0.38, "learning_rate": 3.523545312259882e-06, "loss": 1.1186, "step": 20394 }, { "epoch": 0.38, "learning_rate": 3.5234059351932587e-06, "loss": 1.0485, "step": 20395 }, { "epoch": 0.38, "learning_rate": 3.5232665543052684e-06, "loss": 0.8818, "step": 20396 }, { "epoch": 0.38, "learning_rate": 3.5231271695964327e-06, "loss": 1.0197, "step": 20397 }, { "epoch": 0.38, "learning_rate": 3.522987781067271e-06, "loss": 0.9661, "step": 20398 }, { "epoch": 0.38, "learning_rate": 3.5228483887183044e-06, "loss": 0.8345, "step": 20399 }, { "epoch": 0.38, "learning_rate": 3.5227089925500536e-06, "loss": 1.0179, "step": 20400 }, { "epoch": 0.38, "learning_rate": 3.5225695925630387e-06, "loss": 0.8634, "step": 20401 }, { "epoch": 0.38, "learning_rate": 3.5224301887577804e-06, "loss": 0.7813, "step": 20402 }, { "epoch": 0.38, "learning_rate": 3.522290781134799e-06, "loss": 0.8622, "step": 20403 }, { "epoch": 0.38, "learning_rate": 3.5221513696946153e-06, "loss": 0.8562, "step": 20404 }, { "epoch": 0.38, "learning_rate": 3.5220119544377495e-06, "loss": 0.9698, "step": 20405 }, { "epoch": 0.38, "learning_rate": 3.521872535364722e-06, "loss": 1.05, "step": 20406 }, { "epoch": 0.39, "learning_rate": 3.521733112476055e-06, "loss": 1.1484, "step": 20407 }, { "epoch": 0.39, "learning_rate": 3.521593685772267e-06, "loss": 0.7699, "step": 20408 }, { "epoch": 0.39, "learning_rate": 3.5214542552538793e-06, "loss": 0.9749, "step": 20409 }, { "epoch": 0.39, "learning_rate": 3.521314820921414e-06, "loss": 0.8698, "step": 20410 }, { "epoch": 0.39, "learning_rate": 3.5211753827753893e-06, "loss": 1.0301, "step": 20411 }, { "epoch": 0.39, "learning_rate": 3.5210359408163265e-06, "loss": 1.1732, "step": 20412 }, { "epoch": 0.39, "learning_rate": 3.5208964950447476e-06, "loss": 1.0435, "step": 20413 }, { "epoch": 0.39, "learning_rate": 3.5207570454611728e-06, "loss": 0.9435, "step": 20414 }, { "epoch": 0.39, "learning_rate": 3.5206175920661224e-06, "loss": 1.1119, "step": 20415 }, { "epoch": 0.39, "learning_rate": 3.5204781348601167e-06, "loss": 0.7615, "step": 20416 }, { "epoch": 0.39, "learning_rate": 3.5203386738436774e-06, "loss": 0.6919, "step": 20417 }, { "epoch": 0.39, "learning_rate": 3.520199209017324e-06, "loss": 1.1522, "step": 20418 }, { "epoch": 0.39, "learning_rate": 3.520059740381579e-06, "loss": 1.1863, "step": 20419 }, { "epoch": 0.39, "learning_rate": 3.5199202679369615e-06, "loss": 0.9573, "step": 20420 }, { "epoch": 0.39, "learning_rate": 3.519780791683993e-06, "loss": 0.7728, "step": 20421 }, { "epoch": 0.39, "learning_rate": 3.5196413116231954e-06, "loss": 0.9426, "step": 20422 }, { "epoch": 0.39, "learning_rate": 3.5195018277550874e-06, "loss": 0.9435, "step": 20423 }, { "epoch": 0.39, "learning_rate": 3.5193623400801915e-06, "loss": 1.0345, "step": 20424 }, { "epoch": 0.39, "learning_rate": 3.519222848599027e-06, "loss": 1.0878, "step": 20425 }, { "epoch": 0.39, "learning_rate": 3.519083353312116e-06, "loss": 1.0392, "step": 20426 }, { "epoch": 0.39, "learning_rate": 3.518943854219979e-06, "loss": 0.952, "step": 20427 }, { "epoch": 0.39, "learning_rate": 3.5188043513231374e-06, "loss": 0.8938, "step": 20428 }, { "epoch": 0.39, "learning_rate": 3.5186648446221104e-06, "loss": 0.9496, "step": 20429 }, { "epoch": 0.39, "learning_rate": 3.5185253341174213e-06, "loss": 1.0179, "step": 20430 }, { "epoch": 0.39, "learning_rate": 3.51838581980959e-06, "loss": 0.9707, "step": 20431 }, { "epoch": 0.39, "learning_rate": 3.5182463016991365e-06, "loss": 0.9322, "step": 20432 }, { "epoch": 0.39, "learning_rate": 3.518106779786582e-06, "loss": 0.8666, "step": 20433 }, { "epoch": 0.39, "learning_rate": 3.5179672540724485e-06, "loss": 0.9065, "step": 20434 }, { "epoch": 0.39, "learning_rate": 3.517827724557257e-06, "loss": 0.8558, "step": 20435 }, { "epoch": 0.39, "learning_rate": 3.5176881912415275e-06, "loss": 0.8338, "step": 20436 }, { "epoch": 0.39, "learning_rate": 3.517548654125782e-06, "loss": 1.1397, "step": 20437 }, { "epoch": 0.39, "learning_rate": 3.5174091132105405e-06, "loss": 1.0734, "step": 20438 }, { "epoch": 0.39, "learning_rate": 3.517269568496325e-06, "loss": 0.9272, "step": 20439 }, { "epoch": 0.39, "learning_rate": 3.5171300199836555e-06, "loss": 0.8154, "step": 20440 }, { "epoch": 0.39, "learning_rate": 3.516990467673054e-06, "loss": 0.9137, "step": 20441 }, { "epoch": 0.39, "learning_rate": 3.5168509115650414e-06, "loss": 0.8618, "step": 20442 }, { "epoch": 0.39, "learning_rate": 3.516711351660139e-06, "loss": 0.7378, "step": 20443 }, { "epoch": 0.39, "learning_rate": 3.516571787958867e-06, "loss": 0.9996, "step": 20444 }, { "epoch": 0.39, "learning_rate": 3.5164322204617468e-06, "loss": 0.9602, "step": 20445 }, { "epoch": 0.39, "learning_rate": 3.5162926491693007e-06, "loss": 0.9104, "step": 20446 }, { "epoch": 0.39, "learning_rate": 3.5161530740820484e-06, "loss": 0.8259, "step": 20447 }, { "epoch": 0.39, "learning_rate": 3.516013495200512e-06, "loss": 1.1534, "step": 20448 }, { "epoch": 0.39, "learning_rate": 3.5158739125252124e-06, "loss": 1.1286, "step": 20449 }, { "epoch": 0.39, "learning_rate": 3.5157343260566706e-06, "loss": 0.8314, "step": 20450 }, { "epoch": 0.39, "learning_rate": 3.515594735795408e-06, "loss": 1.2755, "step": 20451 }, { "epoch": 0.39, "learning_rate": 3.5154551417419457e-06, "loss": 0.8066, "step": 20452 }, { "epoch": 0.39, "learning_rate": 3.5153155438968056e-06, "loss": 0.8941, "step": 20453 }, { "epoch": 0.39, "learning_rate": 3.515175942260507e-06, "loss": 0.8503, "step": 20454 }, { "epoch": 0.39, "learning_rate": 3.515036336833574e-06, "loss": 1.164, "step": 20455 }, { "epoch": 0.39, "learning_rate": 3.5148967276165257e-06, "loss": 1.0797, "step": 20456 }, { "epoch": 0.39, "learning_rate": 3.5147571146098848e-06, "loss": 0.9426, "step": 20457 }, { "epoch": 0.39, "learning_rate": 3.514617497814172e-06, "loss": 1.0509, "step": 20458 }, { "epoch": 0.39, "learning_rate": 3.5144778772299077e-06, "loss": 0.9865, "step": 20459 }, { "epoch": 0.39, "learning_rate": 3.5143382528576143e-06, "loss": 0.8744, "step": 20460 }, { "epoch": 0.39, "learning_rate": 3.514198624697813e-06, "loss": 0.8737, "step": 20461 }, { "epoch": 0.39, "learning_rate": 3.514058992751025e-06, "loss": 0.7943, "step": 20462 }, { "epoch": 0.39, "learning_rate": 3.5139193570177726e-06, "loss": 1.0269, "step": 20463 }, { "epoch": 0.39, "learning_rate": 3.513779717498576e-06, "loss": 0.9599, "step": 20464 }, { "epoch": 0.39, "learning_rate": 3.513640074193957e-06, "loss": 1.0612, "step": 20465 }, { "epoch": 0.39, "learning_rate": 3.513500427104437e-06, "loss": 0.8056, "step": 20466 }, { "epoch": 0.39, "learning_rate": 3.513360776230537e-06, "loss": 0.8671, "step": 20467 }, { "epoch": 0.39, "learning_rate": 3.5132211215727797e-06, "loss": 1.1114, "step": 20468 }, { "epoch": 0.39, "learning_rate": 3.5130814631316857e-06, "loss": 1.1323, "step": 20469 }, { "epoch": 0.39, "learning_rate": 3.512941800907776e-06, "loss": 0.9247, "step": 20470 }, { "epoch": 0.39, "learning_rate": 3.512802134901573e-06, "loss": 0.9772, "step": 20471 }, { "epoch": 0.39, "learning_rate": 3.512662465113598e-06, "loss": 0.9968, "step": 20472 }, { "epoch": 0.39, "learning_rate": 3.512522791544373e-06, "loss": 0.7579, "step": 20473 }, { "epoch": 0.39, "learning_rate": 3.5123831141944178e-06, "loss": 0.8903, "step": 20474 }, { "epoch": 0.39, "learning_rate": 3.512243433064255e-06, "loss": 1.1143, "step": 20475 }, { "epoch": 0.39, "learning_rate": 3.512103748154407e-06, "loss": 0.8029, "step": 20476 }, { "epoch": 0.39, "learning_rate": 3.511964059465395e-06, "loss": 0.8957, "step": 20477 }, { "epoch": 0.39, "learning_rate": 3.5118243669977392e-06, "loss": 0.8398, "step": 20478 }, { "epoch": 0.39, "learning_rate": 3.511684670751963e-06, "loss": 0.864, "step": 20479 }, { "epoch": 0.39, "learning_rate": 3.5115449707285864e-06, "loss": 0.9667, "step": 20480 }, { "epoch": 0.39, "learning_rate": 3.5114052669281328e-06, "loss": 1.0453, "step": 20481 }, { "epoch": 0.39, "learning_rate": 3.5112655593511225e-06, "loss": 0.9276, "step": 20482 }, { "epoch": 0.39, "learning_rate": 3.5111258479980775e-06, "loss": 0.9915, "step": 20483 }, { "epoch": 0.39, "learning_rate": 3.5109861328695204e-06, "loss": 1.038, "step": 20484 }, { "epoch": 0.39, "learning_rate": 3.5108464139659717e-06, "loss": 0.9871, "step": 20485 }, { "epoch": 0.39, "learning_rate": 3.510706691287953e-06, "loss": 0.9161, "step": 20486 }, { "epoch": 0.39, "learning_rate": 3.5105669648359867e-06, "loss": 1.2659, "step": 20487 }, { "epoch": 0.39, "learning_rate": 3.510427234610594e-06, "loss": 1.1191, "step": 20488 }, { "epoch": 0.39, "learning_rate": 3.5102875006122973e-06, "loss": 0.99, "step": 20489 }, { "epoch": 0.39, "learning_rate": 3.5101477628416186e-06, "loss": 0.8831, "step": 20490 }, { "epoch": 0.39, "learning_rate": 3.5100080212990785e-06, "loss": 0.864, "step": 20491 }, { "epoch": 0.39, "learning_rate": 3.5098682759852e-06, "loss": 0.9536, "step": 20492 }, { "epoch": 0.39, "learning_rate": 3.509728526900504e-06, "loss": 1.1996, "step": 20493 }, { "epoch": 0.39, "learning_rate": 3.5095887740455127e-06, "loss": 1.108, "step": 20494 }, { "epoch": 0.39, "learning_rate": 3.5094490174207476e-06, "loss": 0.9247, "step": 20495 }, { "epoch": 0.39, "learning_rate": 3.5093092570267307e-06, "loss": 0.9831, "step": 20496 }, { "epoch": 0.39, "learning_rate": 3.5091694928639843e-06, "loss": 0.8906, "step": 20497 }, { "epoch": 0.39, "learning_rate": 3.5090297249330297e-06, "loss": 0.7589, "step": 20498 }, { "epoch": 0.39, "learning_rate": 3.508889953234389e-06, "loss": 0.9624, "step": 20499 }, { "epoch": 0.39, "learning_rate": 3.5087501777685843e-06, "loss": 1.1449, "step": 20500 }, { "epoch": 0.39, "learning_rate": 3.5086103985361375e-06, "loss": 0.9988, "step": 20501 }, { "epoch": 0.39, "learning_rate": 3.5084706155375705e-06, "loss": 0.793, "step": 20502 }, { "epoch": 0.39, "learning_rate": 3.5083308287734046e-06, "loss": 0.965, "step": 20503 }, { "epoch": 0.39, "learning_rate": 3.5081910382441624e-06, "loss": 0.7567, "step": 20504 }, { "epoch": 0.39, "learning_rate": 3.5080512439503665e-06, "loss": 1.198, "step": 20505 }, { "epoch": 0.39, "learning_rate": 3.507911445892538e-06, "loss": 1.068, "step": 20506 }, { "epoch": 0.39, "learning_rate": 3.5077716440711984e-06, "loss": 0.9888, "step": 20507 }, { "epoch": 0.39, "learning_rate": 3.5076318384868713e-06, "loss": 0.8993, "step": 20508 }, { "epoch": 0.39, "learning_rate": 3.5074920291400765e-06, "loss": 0.9761, "step": 20509 }, { "epoch": 0.39, "learning_rate": 3.5073522160313376e-06, "loss": 0.9706, "step": 20510 }, { "epoch": 0.39, "learning_rate": 3.507212399161178e-06, "loss": 0.9215, "step": 20511 }, { "epoch": 0.39, "learning_rate": 3.507072578530117e-06, "loss": 1.2513, "step": 20512 }, { "epoch": 0.39, "learning_rate": 3.5069327541386778e-06, "loss": 1.0168, "step": 20513 }, { "epoch": 0.39, "learning_rate": 3.506792925987383e-06, "loss": 1.0367, "step": 20514 }, { "epoch": 0.39, "learning_rate": 3.506653094076754e-06, "loss": 0.6556, "step": 20515 }, { "epoch": 0.39, "learning_rate": 3.506513258407313e-06, "loss": 0.9748, "step": 20516 }, { "epoch": 0.39, "learning_rate": 3.506373418979583e-06, "loss": 0.7693, "step": 20517 }, { "epoch": 0.39, "learning_rate": 3.506233575794085e-06, "loss": 1.0082, "step": 20518 }, { "epoch": 0.39, "learning_rate": 3.5060937288513413e-06, "loss": 0.9981, "step": 20519 }, { "epoch": 0.39, "learning_rate": 3.5059538781518753e-06, "loss": 0.6547, "step": 20520 }, { "epoch": 0.39, "learning_rate": 3.505814023696208e-06, "loss": 0.8729, "step": 20521 }, { "epoch": 0.39, "learning_rate": 3.505674165484862e-06, "loss": 1.0126, "step": 20522 }, { "epoch": 0.39, "learning_rate": 3.5055343035183594e-06, "loss": 0.8466, "step": 20523 }, { "epoch": 0.39, "learning_rate": 3.5053944377972227e-06, "loss": 1.0905, "step": 20524 }, { "epoch": 0.39, "learning_rate": 3.5052545683219734e-06, "loss": 1.1173, "step": 20525 }, { "epoch": 0.39, "learning_rate": 3.5051146950931353e-06, "loss": 1.0098, "step": 20526 }, { "epoch": 0.39, "learning_rate": 3.5049748181112292e-06, "loss": 0.7932, "step": 20527 }, { "epoch": 0.39, "learning_rate": 3.5048349373767783e-06, "loss": 0.9146, "step": 20528 }, { "epoch": 0.39, "learning_rate": 3.5046950528903044e-06, "loss": 0.9611, "step": 20529 }, { "epoch": 0.39, "learning_rate": 3.504555164652329e-06, "loss": 0.8308, "step": 20530 }, { "epoch": 0.39, "learning_rate": 3.504415272663377e-06, "loss": 0.9651, "step": 20531 }, { "epoch": 0.39, "learning_rate": 3.5042753769239686e-06, "loss": 0.8397, "step": 20532 }, { "epoch": 0.39, "learning_rate": 3.5041354774346265e-06, "loss": 0.855, "step": 20533 }, { "epoch": 0.39, "learning_rate": 3.503995574195873e-06, "loss": 0.8751, "step": 20534 }, { "epoch": 0.39, "learning_rate": 3.503855667208232e-06, "loss": 0.9111, "step": 20535 }, { "epoch": 0.39, "learning_rate": 3.5037157564722234e-06, "loss": 0.988, "step": 20536 }, { "epoch": 0.39, "learning_rate": 3.5035758419883715e-06, "loss": 1.2529, "step": 20537 }, { "epoch": 0.39, "learning_rate": 3.503435923757198e-06, "loss": 0.9142, "step": 20538 }, { "epoch": 0.39, "learning_rate": 3.503296001779226e-06, "loss": 1.061, "step": 20539 }, { "epoch": 0.39, "learning_rate": 3.503156076054977e-06, "loss": 0.977, "step": 20540 }, { "epoch": 0.39, "learning_rate": 3.503016146584974e-06, "loss": 0.8488, "step": 20541 }, { "epoch": 0.39, "learning_rate": 3.5028762133697404e-06, "loss": 1.0638, "step": 20542 }, { "epoch": 0.39, "learning_rate": 3.5027362764097965e-06, "loss": 1.1173, "step": 20543 }, { "epoch": 0.39, "learning_rate": 3.502596335705667e-06, "loss": 0.9862, "step": 20544 }, { "epoch": 0.39, "learning_rate": 3.5024563912578722e-06, "loss": 0.9601, "step": 20545 }, { "epoch": 0.39, "learning_rate": 3.502316443066937e-06, "loss": 0.7828, "step": 20546 }, { "epoch": 0.39, "learning_rate": 3.502176491133383e-06, "loss": 0.8258, "step": 20547 }, { "epoch": 0.39, "learning_rate": 3.502036535457733e-06, "loss": 0.8998, "step": 20548 }, { "epoch": 0.39, "learning_rate": 3.5018965760405087e-06, "loss": 0.884, "step": 20549 }, { "epoch": 0.39, "learning_rate": 3.5017566128822338e-06, "loss": 1.085, "step": 20550 }, { "epoch": 0.39, "learning_rate": 3.5016166459834296e-06, "loss": 0.9566, "step": 20551 }, { "epoch": 0.39, "learning_rate": 3.5014766753446196e-06, "loss": 0.9282, "step": 20552 }, { "epoch": 0.39, "learning_rate": 3.5013367009663274e-06, "loss": 0.9046, "step": 20553 }, { "epoch": 0.39, "learning_rate": 3.501196722849074e-06, "loss": 0.847, "step": 20554 }, { "epoch": 0.39, "learning_rate": 3.5010567409933825e-06, "loss": 1.0203, "step": 20555 }, { "epoch": 0.39, "learning_rate": 3.5009167553997764e-06, "loss": 1.1371, "step": 20556 }, { "epoch": 0.39, "learning_rate": 3.5007767660687776e-06, "loss": 0.8584, "step": 20557 }, { "epoch": 0.39, "learning_rate": 3.5006367730009087e-06, "loss": 1.109, "step": 20558 }, { "epoch": 0.39, "learning_rate": 3.500496776196693e-06, "loss": 1.0171, "step": 20559 }, { "epoch": 0.39, "learning_rate": 3.500356775656653e-06, "loss": 0.8723, "step": 20560 }, { "epoch": 0.39, "learning_rate": 3.5002167713813117e-06, "loss": 0.7693, "step": 20561 }, { "epoch": 0.39, "learning_rate": 3.5000767633711917e-06, "loss": 1.1426, "step": 20562 }, { "epoch": 0.39, "learning_rate": 3.4999367516268156e-06, "loss": 0.8022, "step": 20563 }, { "epoch": 0.39, "learning_rate": 3.4997967361487063e-06, "loss": 1.1131, "step": 20564 }, { "epoch": 0.39, "learning_rate": 3.499656716937386e-06, "loss": 0.8754, "step": 20565 }, { "epoch": 0.39, "learning_rate": 3.499516693993379e-06, "loss": 0.7708, "step": 20566 }, { "epoch": 0.39, "learning_rate": 3.499376667317207e-06, "loss": 1.0441, "step": 20567 }, { "epoch": 0.39, "learning_rate": 3.4992366369093934e-06, "loss": 0.952, "step": 20568 }, { "epoch": 0.39, "learning_rate": 3.4990966027704606e-06, "loss": 1.0078, "step": 20569 }, { "epoch": 0.39, "learning_rate": 3.4989565649009316e-06, "loss": 0.7823, "step": 20570 }, { "epoch": 0.39, "learning_rate": 3.498816523301329e-06, "loss": 0.7383, "step": 20571 }, { "epoch": 0.39, "learning_rate": 3.498676477972177e-06, "loss": 0.8459, "step": 20572 }, { "epoch": 0.39, "learning_rate": 3.4985364289139973e-06, "loss": 0.873, "step": 20573 }, { "epoch": 0.39, "learning_rate": 3.498396376127314e-06, "loss": 1.1841, "step": 20574 }, { "epoch": 0.39, "learning_rate": 3.4982563196126484e-06, "loss": 1.378, "step": 20575 }, { "epoch": 0.39, "learning_rate": 3.498116259370524e-06, "loss": 0.8191, "step": 20576 }, { "epoch": 0.39, "learning_rate": 3.4979761954014648e-06, "loss": 0.9137, "step": 20577 }, { "epoch": 0.39, "learning_rate": 3.497836127705993e-06, "loss": 1.1451, "step": 20578 }, { "epoch": 0.39, "learning_rate": 3.497696056284631e-06, "loss": 0.8808, "step": 20579 }, { "epoch": 0.39, "learning_rate": 3.4975559811379034e-06, "loss": 1.1262, "step": 20580 }, { "epoch": 0.39, "learning_rate": 3.4974159022663318e-06, "loss": 0.952, "step": 20581 }, { "epoch": 0.39, "learning_rate": 3.4972758196704406e-06, "loss": 0.9944, "step": 20582 }, { "epoch": 0.39, "learning_rate": 3.4971357333507507e-06, "loss": 0.7696, "step": 20583 }, { "epoch": 0.39, "learning_rate": 3.4969956433077873e-06, "loss": 1.0405, "step": 20584 }, { "epoch": 0.39, "learning_rate": 3.4968555495420726e-06, "loss": 0.7865, "step": 20585 }, { "epoch": 0.39, "learning_rate": 3.4967154520541297e-06, "loss": 0.9282, "step": 20586 }, { "epoch": 0.39, "learning_rate": 3.4965753508444824e-06, "loss": 1.0241, "step": 20587 }, { "epoch": 0.39, "learning_rate": 3.496435245913653e-06, "loss": 1.1391, "step": 20588 }, { "epoch": 0.39, "learning_rate": 3.496295137262165e-06, "loss": 1.0159, "step": 20589 }, { "epoch": 0.39, "learning_rate": 3.496155024890541e-06, "loss": 0.8491, "step": 20590 }, { "epoch": 0.39, "learning_rate": 3.4960149087993055e-06, "loss": 0.8427, "step": 20591 }, { "epoch": 0.39, "learning_rate": 3.49587478898898e-06, "loss": 0.7163, "step": 20592 }, { "epoch": 0.39, "learning_rate": 3.4957346654600894e-06, "loss": 0.9084, "step": 20593 }, { "epoch": 0.39, "learning_rate": 3.495594538213156e-06, "loss": 0.9222, "step": 20594 }, { "epoch": 0.39, "learning_rate": 3.495454407248703e-06, "loss": 0.8964, "step": 20595 }, { "epoch": 0.39, "learning_rate": 3.4953142725672532e-06, "loss": 0.8692, "step": 20596 }, { "epoch": 0.39, "learning_rate": 3.495174134169331e-06, "loss": 0.9019, "step": 20597 }, { "epoch": 0.39, "learning_rate": 3.4950339920554595e-06, "loss": 0.9042, "step": 20598 }, { "epoch": 0.39, "learning_rate": 3.4948938462261604e-06, "loss": 1.0139, "step": 20599 }, { "epoch": 0.39, "learning_rate": 3.494753696681959e-06, "loss": 1.165, "step": 20600 }, { "epoch": 0.39, "learning_rate": 3.4946135434233776e-06, "loss": 0.9616, "step": 20601 }, { "epoch": 0.39, "learning_rate": 3.4944733864509396e-06, "loss": 0.9585, "step": 20602 }, { "epoch": 0.39, "learning_rate": 3.494333225765169e-06, "loss": 1.0659, "step": 20603 }, { "epoch": 0.39, "learning_rate": 3.494193061366588e-06, "loss": 0.7363, "step": 20604 }, { "epoch": 0.39, "learning_rate": 3.494052893255721e-06, "loss": 0.7776, "step": 20605 }, { "epoch": 0.39, "learning_rate": 3.4939127214330905e-06, "loss": 1.1033, "step": 20606 }, { "epoch": 0.39, "learning_rate": 3.4937725458992205e-06, "loss": 0.9876, "step": 20607 }, { "epoch": 0.39, "learning_rate": 3.4936323666546347e-06, "loss": 0.6741, "step": 20608 }, { "epoch": 0.39, "learning_rate": 3.4934921836998557e-06, "loss": 1.0609, "step": 20609 }, { "epoch": 0.39, "learning_rate": 3.493351997035408e-06, "loss": 0.7138, "step": 20610 }, { "epoch": 0.39, "learning_rate": 3.4932118066618136e-06, "loss": 0.9604, "step": 20611 }, { "epoch": 0.39, "learning_rate": 3.493071612579597e-06, "loss": 1.2694, "step": 20612 }, { "epoch": 0.39, "learning_rate": 3.4929314147892813e-06, "loss": 0.8723, "step": 20613 }, { "epoch": 0.39, "learning_rate": 3.4927912132913904e-06, "loss": 1.0197, "step": 20614 }, { "epoch": 0.39, "learning_rate": 3.492651008086448e-06, "loss": 0.9406, "step": 20615 }, { "epoch": 0.39, "learning_rate": 3.492510799174976e-06, "loss": 0.9802, "step": 20616 }, { "epoch": 0.39, "learning_rate": 3.4923705865575e-06, "loss": 0.9015, "step": 20617 }, { "epoch": 0.39, "learning_rate": 3.4922303702345426e-06, "loss": 1.0135, "step": 20618 }, { "epoch": 0.39, "learning_rate": 3.4920901502066274e-06, "loss": 0.9407, "step": 20619 }, { "epoch": 0.39, "learning_rate": 3.491949926474278e-06, "loss": 1.0086, "step": 20620 }, { "epoch": 0.39, "learning_rate": 3.491809699038018e-06, "loss": 0.8797, "step": 20621 }, { "epoch": 0.39, "learning_rate": 3.49166946789837e-06, "loss": 1.0327, "step": 20622 }, { "epoch": 0.39, "learning_rate": 3.4915292330558597e-06, "loss": 0.8403, "step": 20623 }, { "epoch": 0.39, "learning_rate": 3.49138899451101e-06, "loss": 1.1697, "step": 20624 }, { "epoch": 0.39, "learning_rate": 3.4912487522643433e-06, "loss": 0.7618, "step": 20625 }, { "epoch": 0.39, "learning_rate": 3.4911085063163847e-06, "loss": 1.1075, "step": 20626 }, { "epoch": 0.39, "learning_rate": 3.4909682566676565e-06, "loss": 0.8068, "step": 20627 }, { "epoch": 0.39, "learning_rate": 3.4908280033186836e-06, "loss": 0.7761, "step": 20628 }, { "epoch": 0.39, "learning_rate": 3.4906877462699893e-06, "loss": 0.827, "step": 20629 }, { "epoch": 0.39, "learning_rate": 3.4905474855220985e-06, "loss": 0.8818, "step": 20630 }, { "epoch": 0.39, "learning_rate": 3.4904072210755324e-06, "loss": 1.1333, "step": 20631 }, { "epoch": 0.39, "learning_rate": 3.4902669529308166e-06, "loss": 0.8857, "step": 20632 }, { "epoch": 0.39, "learning_rate": 3.4901266810884747e-06, "loss": 1.0422, "step": 20633 }, { "epoch": 0.39, "learning_rate": 3.489986405549029e-06, "loss": 0.8611, "step": 20634 }, { "epoch": 0.39, "learning_rate": 3.489846126313005e-06, "loss": 0.782, "step": 20635 }, { "epoch": 0.39, "learning_rate": 3.489705843380926e-06, "loss": 0.8077, "step": 20636 }, { "epoch": 0.39, "learning_rate": 3.489565556753316e-06, "loss": 0.9851, "step": 20637 }, { "epoch": 0.39, "learning_rate": 3.4894252664306984e-06, "loss": 0.9754, "step": 20638 }, { "epoch": 0.39, "learning_rate": 3.4892849724135976e-06, "loss": 1.0662, "step": 20639 }, { "epoch": 0.39, "learning_rate": 3.4891446747025357e-06, "loss": 0.909, "step": 20640 }, { "epoch": 0.39, "learning_rate": 3.4890043732980396e-06, "loss": 0.7887, "step": 20641 }, { "epoch": 0.39, "learning_rate": 3.48886406820063e-06, "loss": 1.1054, "step": 20642 }, { "epoch": 0.39, "learning_rate": 3.4887237594108326e-06, "loss": 1.012, "step": 20643 }, { "epoch": 0.39, "learning_rate": 3.4885834469291712e-06, "loss": 1.1095, "step": 20644 }, { "epoch": 0.39, "learning_rate": 3.4884431307561708e-06, "loss": 0.9425, "step": 20645 }, { "epoch": 0.39, "learning_rate": 3.488302810892352e-06, "loss": 0.6906, "step": 20646 }, { "epoch": 0.39, "learning_rate": 3.4881624873382417e-06, "loss": 0.8815, "step": 20647 }, { "epoch": 0.39, "learning_rate": 3.488022160094363e-06, "loss": 0.967, "step": 20648 }, { "epoch": 0.39, "learning_rate": 3.4878818291612396e-06, "loss": 0.984, "step": 20649 }, { "epoch": 0.39, "learning_rate": 3.487741494539396e-06, "loss": 1.0818, "step": 20650 }, { "epoch": 0.39, "learning_rate": 3.4876011562293564e-06, "loss": 0.959, "step": 20651 }, { "epoch": 0.39, "learning_rate": 3.4874608142316436e-06, "loss": 1.0189, "step": 20652 }, { "epoch": 0.39, "learning_rate": 3.487320468546783e-06, "loss": 0.8817, "step": 20653 }, { "epoch": 0.39, "learning_rate": 3.487180119175298e-06, "loss": 0.8384, "step": 20654 }, { "epoch": 0.39, "learning_rate": 3.487039766117711e-06, "loss": 0.9131, "step": 20655 }, { "epoch": 0.39, "learning_rate": 3.4868994093745494e-06, "loss": 1.0093, "step": 20656 }, { "epoch": 0.39, "learning_rate": 3.486759048946336e-06, "loss": 1.0919, "step": 20657 }, { "epoch": 0.39, "learning_rate": 3.486618684833594e-06, "loss": 0.8184, "step": 20658 }, { "epoch": 0.39, "learning_rate": 3.486478317036848e-06, "loss": 0.8441, "step": 20659 }, { "epoch": 0.39, "learning_rate": 3.4863379455566225e-06, "loss": 0.9123, "step": 20660 }, { "epoch": 0.39, "learning_rate": 3.4861975703934413e-06, "loss": 0.9515, "step": 20661 }, { "epoch": 0.39, "learning_rate": 3.4860571915478285e-06, "loss": 0.9234, "step": 20662 }, { "epoch": 0.39, "learning_rate": 3.4859168090203083e-06, "loss": 0.8643, "step": 20663 }, { "epoch": 0.39, "learning_rate": 3.485776422811405e-06, "loss": 0.8757, "step": 20664 }, { "epoch": 0.39, "learning_rate": 3.4856360329216425e-06, "loss": 0.8958, "step": 20665 }, { "epoch": 0.39, "learning_rate": 3.485495639351546e-06, "loss": 0.8958, "step": 20666 }, { "epoch": 0.39, "learning_rate": 3.4853552421016386e-06, "loss": 0.9655, "step": 20667 }, { "epoch": 0.39, "learning_rate": 3.4852148411724445e-06, "loss": 0.973, "step": 20668 }, { "epoch": 0.39, "learning_rate": 3.4850744365644885e-06, "loss": 1.2026, "step": 20669 }, { "epoch": 0.39, "learning_rate": 3.4849340282782953e-06, "loss": 0.9444, "step": 20670 }, { "epoch": 0.39, "learning_rate": 3.484793616314388e-06, "loss": 0.8409, "step": 20671 }, { "epoch": 0.39, "learning_rate": 3.4846532006732924e-06, "loss": 0.9852, "step": 20672 }, { "epoch": 0.39, "learning_rate": 3.4845127813555314e-06, "loss": 0.9765, "step": 20673 }, { "epoch": 0.39, "learning_rate": 3.4843723583616296e-06, "loss": 1.0066, "step": 20674 }, { "epoch": 0.39, "learning_rate": 3.4842319316921127e-06, "loss": 0.967, "step": 20675 }, { "epoch": 0.39, "learning_rate": 3.4840915013475023e-06, "loss": 0.9, "step": 20676 }, { "epoch": 0.39, "learning_rate": 3.483951067328325e-06, "loss": 0.9508, "step": 20677 }, { "epoch": 0.39, "learning_rate": 3.4838106296351052e-06, "loss": 0.7762, "step": 20678 }, { "epoch": 0.39, "learning_rate": 3.4836701882683664e-06, "loss": 0.9236, "step": 20679 }, { "epoch": 0.39, "learning_rate": 3.483529743228633e-06, "loss": 1.1136, "step": 20680 }, { "epoch": 0.39, "learning_rate": 3.4833892945164304e-06, "loss": 1.1432, "step": 20681 }, { "epoch": 0.39, "learning_rate": 3.483248842132282e-06, "loss": 0.8629, "step": 20682 }, { "epoch": 0.39, "learning_rate": 3.483108386076712e-06, "loss": 0.9188, "step": 20683 }, { "epoch": 0.39, "learning_rate": 3.482967926350246e-06, "loss": 1.0882, "step": 20684 }, { "epoch": 0.39, "learning_rate": 3.482827462953407e-06, "loss": 0.7726, "step": 20685 }, { "epoch": 0.39, "learning_rate": 3.482686995886721e-06, "loss": 0.9475, "step": 20686 }, { "epoch": 0.39, "learning_rate": 3.482546525150713e-06, "loss": 1.1069, "step": 20687 }, { "epoch": 0.39, "learning_rate": 3.4824060507459044e-06, "loss": 0.9398, "step": 20688 }, { "epoch": 0.39, "learning_rate": 3.4822655726728226e-06, "loss": 0.9968, "step": 20689 }, { "epoch": 0.39, "learning_rate": 3.4821250909319915e-06, "loss": 0.8763, "step": 20690 }, { "epoch": 0.39, "learning_rate": 3.4819846055239354e-06, "loss": 0.915, "step": 20691 }, { "epoch": 0.39, "learning_rate": 3.481844116449179e-06, "loss": 1.0272, "step": 20692 }, { "epoch": 0.39, "learning_rate": 3.4817036237082468e-06, "loss": 0.9517, "step": 20693 }, { "epoch": 0.39, "learning_rate": 3.4815631273016628e-06, "loss": 1.046, "step": 20694 }, { "epoch": 0.39, "learning_rate": 3.4814226272299523e-06, "loss": 1.1026, "step": 20695 }, { "epoch": 0.39, "learning_rate": 3.4812821234936407e-06, "loss": 0.8578, "step": 20696 }, { "epoch": 0.39, "learning_rate": 3.4811416160932505e-06, "loss": 0.7401, "step": 20697 }, { "epoch": 0.39, "learning_rate": 3.4810011050293085e-06, "loss": 0.8721, "step": 20698 }, { "epoch": 0.39, "learning_rate": 3.480860590302338e-06, "loss": 0.83, "step": 20699 }, { "epoch": 0.39, "learning_rate": 3.4807200719128644e-06, "loss": 1.0294, "step": 20700 }, { "epoch": 0.39, "learning_rate": 3.480579549861412e-06, "loss": 0.8593, "step": 20701 }, { "epoch": 0.39, "learning_rate": 3.4804390241485055e-06, "loss": 0.8922, "step": 20702 }, { "epoch": 0.39, "learning_rate": 3.48029849477467e-06, "loss": 1.0928, "step": 20703 }, { "epoch": 0.39, "learning_rate": 3.480157961740429e-06, "loss": 0.9257, "step": 20704 }, { "epoch": 0.39, "learning_rate": 3.480017425046309e-06, "loss": 0.9875, "step": 20705 }, { "epoch": 0.39, "learning_rate": 3.4798768846928343e-06, "loss": 0.9397, "step": 20706 }, { "epoch": 0.39, "learning_rate": 3.4797363406805296e-06, "loss": 1.1217, "step": 20707 }, { "epoch": 0.39, "learning_rate": 3.4795957930099183e-06, "loss": 0.7755, "step": 20708 }, { "epoch": 0.39, "learning_rate": 3.479455241681527e-06, "loss": 0.8945, "step": 20709 }, { "epoch": 0.39, "learning_rate": 3.4793146866958795e-06, "loss": 0.8809, "step": 20710 }, { "epoch": 0.39, "learning_rate": 3.4791741280535014e-06, "loss": 0.9311, "step": 20711 }, { "epoch": 0.39, "learning_rate": 3.4790335657549166e-06, "loss": 1.0898, "step": 20712 }, { "epoch": 0.39, "learning_rate": 3.4788929998006515e-06, "loss": 1.0897, "step": 20713 }, { "epoch": 0.39, "learning_rate": 3.478752430191229e-06, "loss": 0.8119, "step": 20714 }, { "epoch": 0.39, "learning_rate": 3.4786118569271752e-06, "loss": 0.8462, "step": 20715 }, { "epoch": 0.39, "learning_rate": 3.4784712800090152e-06, "loss": 0.8001, "step": 20716 }, { "epoch": 0.39, "learning_rate": 3.4783306994372734e-06, "loss": 0.9389, "step": 20717 }, { "epoch": 0.39, "learning_rate": 3.478190115212474e-06, "loss": 0.9878, "step": 20718 }, { "epoch": 0.39, "learning_rate": 3.478049527335143e-06, "loss": 1.1443, "step": 20719 }, { "epoch": 0.39, "learning_rate": 3.477908935805805e-06, "loss": 1.1298, "step": 20720 }, { "epoch": 0.39, "learning_rate": 3.4777683406249853e-06, "loss": 1.0234, "step": 20721 }, { "epoch": 0.39, "learning_rate": 3.477627741793209e-06, "loss": 0.7959, "step": 20722 }, { "epoch": 0.39, "learning_rate": 3.4774871393109998e-06, "loss": 0.9099, "step": 20723 }, { "epoch": 0.39, "learning_rate": 3.4773465331788843e-06, "loss": 1.2214, "step": 20724 }, { "epoch": 0.39, "learning_rate": 3.477205923397386e-06, "loss": 1.0277, "step": 20725 }, { "epoch": 0.39, "learning_rate": 3.4770653099670317e-06, "loss": 0.8489, "step": 20726 }, { "epoch": 0.39, "learning_rate": 3.4769246928883443e-06, "loss": 0.7817, "step": 20727 }, { "epoch": 0.39, "learning_rate": 3.476784072161851e-06, "loss": 1.0002, "step": 20728 }, { "epoch": 0.39, "learning_rate": 3.4766434477880757e-06, "loss": 0.9132, "step": 20729 }, { "epoch": 0.39, "learning_rate": 3.476502819767544e-06, "loss": 0.8696, "step": 20730 }, { "epoch": 0.39, "learning_rate": 3.4763621881007803e-06, "loss": 1.045, "step": 20731 }, { "epoch": 0.39, "learning_rate": 3.47622155278831e-06, "loss": 0.8282, "step": 20732 }, { "epoch": 0.39, "learning_rate": 3.4760809138306583e-06, "loss": 0.9673, "step": 20733 }, { "epoch": 0.39, "learning_rate": 3.475940271228351e-06, "loss": 0.9532, "step": 20734 }, { "epoch": 0.39, "learning_rate": 3.4757996249819125e-06, "loss": 0.8637, "step": 20735 }, { "epoch": 0.39, "learning_rate": 3.475658975091868e-06, "loss": 1.0841, "step": 20736 }, { "epoch": 0.39, "learning_rate": 3.475518321558743e-06, "loss": 0.8625, "step": 20737 }, { "epoch": 0.39, "learning_rate": 3.475377664383062e-06, "loss": 1.0677, "step": 20738 }, { "epoch": 0.39, "learning_rate": 3.4752370035653503e-06, "loss": 0.8401, "step": 20739 }, { "epoch": 0.39, "learning_rate": 3.4750963391061344e-06, "loss": 0.7856, "step": 20740 }, { "epoch": 0.39, "learning_rate": 3.4749556710059386e-06, "loss": 0.8872, "step": 20741 }, { "epoch": 0.39, "learning_rate": 3.474814999265288e-06, "loss": 0.9002, "step": 20742 }, { "epoch": 0.39, "learning_rate": 3.4746743238847086e-06, "loss": 0.8607, "step": 20743 }, { "epoch": 0.39, "learning_rate": 3.4745336448647245e-06, "loss": 1.0507, "step": 20744 }, { "epoch": 0.39, "learning_rate": 3.4743929622058614e-06, "loss": 0.8306, "step": 20745 }, { "epoch": 0.39, "learning_rate": 3.4742522759086454e-06, "loss": 0.8623, "step": 20746 }, { "epoch": 0.39, "learning_rate": 3.474111585973601e-06, "loss": 1.1105, "step": 20747 }, { "epoch": 0.39, "learning_rate": 3.473970892401254e-06, "loss": 0.7844, "step": 20748 }, { "epoch": 0.39, "learning_rate": 3.47383019519213e-06, "loss": 1.0928, "step": 20749 }, { "epoch": 0.39, "learning_rate": 3.4736894943467538e-06, "loss": 1.1072, "step": 20750 }, { "epoch": 0.39, "learning_rate": 3.47354878986565e-06, "loss": 0.9355, "step": 20751 }, { "epoch": 0.39, "learning_rate": 3.4734080817493455e-06, "loss": 0.876, "step": 20752 }, { "epoch": 0.39, "learning_rate": 3.4732673699983642e-06, "loss": 0.8329, "step": 20753 }, { "epoch": 0.39, "learning_rate": 3.473126654613234e-06, "loss": 0.9698, "step": 20754 }, { "epoch": 0.39, "learning_rate": 3.4729859355944777e-06, "loss": 0.8703, "step": 20755 }, { "epoch": 0.39, "learning_rate": 3.4728452129426216e-06, "loss": 1.2141, "step": 20756 }, { "epoch": 0.39, "learning_rate": 3.472704486658192e-06, "loss": 1.0627, "step": 20757 }, { "epoch": 0.39, "learning_rate": 3.4725637567417135e-06, "loss": 0.9355, "step": 20758 }, { "epoch": 0.39, "learning_rate": 3.472423023193711e-06, "loss": 0.9449, "step": 20759 }, { "epoch": 0.39, "learning_rate": 3.472282286014711e-06, "loss": 0.7084, "step": 20760 }, { "epoch": 0.39, "learning_rate": 3.4721415452052395e-06, "loss": 0.8306, "step": 20761 }, { "epoch": 0.39, "learning_rate": 3.4720008007658206e-06, "loss": 1.0005, "step": 20762 }, { "epoch": 0.39, "learning_rate": 3.4718600526969803e-06, "loss": 1.1082, "step": 20763 }, { "epoch": 0.39, "learning_rate": 3.4717193009992455e-06, "loss": 0.9666, "step": 20764 }, { "epoch": 0.39, "learning_rate": 3.47157854567314e-06, "loss": 1.0397, "step": 20765 }, { "epoch": 0.39, "learning_rate": 3.4714377867191894e-06, "loss": 0.8008, "step": 20766 }, { "epoch": 0.39, "learning_rate": 3.4712970241379206e-06, "loss": 0.9005, "step": 20767 }, { "epoch": 0.39, "learning_rate": 3.471156257929858e-06, "loss": 0.9272, "step": 20768 }, { "epoch": 0.39, "learning_rate": 3.471015488095528e-06, "loss": 1.1765, "step": 20769 }, { "epoch": 0.39, "learning_rate": 3.470874714635456e-06, "loss": 0.9468, "step": 20770 }, { "epoch": 0.39, "learning_rate": 3.4707339375501676e-06, "loss": 0.8412, "step": 20771 }, { "epoch": 0.39, "learning_rate": 3.4705931568401885e-06, "loss": 0.9158, "step": 20772 }, { "epoch": 0.39, "learning_rate": 3.4704523725060442e-06, "loss": 0.9747, "step": 20773 }, { "epoch": 0.39, "learning_rate": 3.47031158454826e-06, "loss": 1.1138, "step": 20774 }, { "epoch": 0.39, "learning_rate": 3.470170792967362e-06, "loss": 1.0682, "step": 20775 }, { "epoch": 0.39, "learning_rate": 3.4700299977638773e-06, "loss": 0.9734, "step": 20776 }, { "epoch": 0.39, "learning_rate": 3.46988919893833e-06, "loss": 1.0001, "step": 20777 }, { "epoch": 0.39, "learning_rate": 3.4697483964912454e-06, "loss": 0.833, "step": 20778 }, { "epoch": 0.39, "learning_rate": 3.4696075904231506e-06, "loss": 0.8046, "step": 20779 }, { "epoch": 0.39, "learning_rate": 3.4694667807345704e-06, "loss": 0.8749, "step": 20780 }, { "epoch": 0.39, "learning_rate": 3.4693259674260303e-06, "loss": 1.0825, "step": 20781 }, { "epoch": 0.39, "learning_rate": 3.4691851504980582e-06, "loss": 1.1487, "step": 20782 }, { "epoch": 0.39, "learning_rate": 3.4690443299511777e-06, "loss": 0.7658, "step": 20783 }, { "epoch": 0.39, "learning_rate": 3.4689035057859156e-06, "loss": 0.8227, "step": 20784 }, { "epoch": 0.39, "learning_rate": 3.4687626780027982e-06, "loss": 0.6574, "step": 20785 }, { "epoch": 0.39, "learning_rate": 3.4686218466023497e-06, "loss": 0.91, "step": 20786 }, { "epoch": 0.39, "learning_rate": 3.468481011585097e-06, "loss": 0.9173, "step": 20787 }, { "epoch": 0.39, "learning_rate": 3.468340172951566e-06, "loss": 1.0947, "step": 20788 }, { "epoch": 0.39, "learning_rate": 3.4681993307022822e-06, "loss": 1.0307, "step": 20789 }, { "epoch": 0.39, "learning_rate": 3.468058484837772e-06, "loss": 0.9336, "step": 20790 }, { "epoch": 0.39, "learning_rate": 3.467917635358562e-06, "loss": 0.8937, "step": 20791 }, { "epoch": 0.39, "learning_rate": 3.467776782265176e-06, "loss": 0.7899, "step": 20792 }, { "epoch": 0.39, "learning_rate": 3.4676359255581416e-06, "loss": 0.8142, "step": 20793 }, { "epoch": 0.39, "learning_rate": 3.467495065237984e-06, "loss": 1.212, "step": 20794 }, { "epoch": 0.39, "learning_rate": 3.46735420130523e-06, "loss": 0.7562, "step": 20795 }, { "epoch": 0.39, "learning_rate": 3.4672133337604048e-06, "loss": 0.8245, "step": 20796 }, { "epoch": 0.39, "learning_rate": 3.4670724626040354e-06, "loss": 0.964, "step": 20797 }, { "epoch": 0.39, "learning_rate": 3.466931587836646e-06, "loss": 1.0231, "step": 20798 }, { "epoch": 0.39, "learning_rate": 3.4667907094587637e-06, "loss": 0.9673, "step": 20799 }, { "epoch": 0.39, "learning_rate": 3.466649827470916e-06, "loss": 1.0591, "step": 20800 }, { "epoch": 0.39, "learning_rate": 3.466508941873626e-06, "loss": 0.8486, "step": 20801 }, { "epoch": 0.39, "learning_rate": 3.466368052667421e-06, "loss": 1.0257, "step": 20802 }, { "epoch": 0.39, "learning_rate": 3.4662271598528287e-06, "loss": 0.9278, "step": 20803 }, { "epoch": 0.39, "learning_rate": 3.4660862634303728e-06, "loss": 0.9164, "step": 20804 }, { "epoch": 0.39, "learning_rate": 3.4659453634005806e-06, "loss": 0.8928, "step": 20805 }, { "epoch": 0.39, "learning_rate": 3.4658044597639785e-06, "loss": 1.1069, "step": 20806 }, { "epoch": 0.39, "learning_rate": 3.4656635525210918e-06, "loss": 0.8286, "step": 20807 }, { "epoch": 0.39, "learning_rate": 3.4655226416724467e-06, "loss": 0.9855, "step": 20808 }, { "epoch": 0.39, "learning_rate": 3.4653817272185703e-06, "loss": 1.0262, "step": 20809 }, { "epoch": 0.39, "learning_rate": 3.4652408091599876e-06, "loss": 0.8425, "step": 20810 }, { "epoch": 0.39, "learning_rate": 3.465099887497225e-06, "loss": 1.0006, "step": 20811 }, { "epoch": 0.39, "learning_rate": 3.46495896223081e-06, "loss": 1.0415, "step": 20812 }, { "epoch": 0.39, "learning_rate": 3.4648180333612675e-06, "loss": 0.9034, "step": 20813 }, { "epoch": 0.39, "learning_rate": 3.4646771008891245e-06, "loss": 0.9757, "step": 20814 }, { "epoch": 0.39, "learning_rate": 3.4645361648149058e-06, "loss": 0.851, "step": 20815 }, { "epoch": 0.39, "learning_rate": 3.464395225139139e-06, "loss": 0.8142, "step": 20816 }, { "epoch": 0.39, "learning_rate": 3.46425428186235e-06, "loss": 0.9963, "step": 20817 }, { "epoch": 0.39, "learning_rate": 3.4641133349850653e-06, "loss": 0.9052, "step": 20818 }, { "epoch": 0.39, "learning_rate": 3.4639723845078106e-06, "loss": 1.1031, "step": 20819 }, { "epoch": 0.39, "learning_rate": 3.4638314304311127e-06, "loss": 0.8991, "step": 20820 }, { "epoch": 0.39, "learning_rate": 3.4636904727554976e-06, "loss": 0.8737, "step": 20821 }, { "epoch": 0.39, "learning_rate": 3.463549511481492e-06, "loss": 0.8321, "step": 20822 }, { "epoch": 0.39, "learning_rate": 3.4634085466096224e-06, "loss": 0.9579, "step": 20823 }, { "epoch": 0.39, "learning_rate": 3.4632675781404146e-06, "loss": 1.0033, "step": 20824 }, { "epoch": 0.39, "learning_rate": 3.4631266060743946e-06, "loss": 1.2043, "step": 20825 }, { "epoch": 0.39, "learning_rate": 3.4629856304120903e-06, "loss": 1.1659, "step": 20826 }, { "epoch": 0.39, "learning_rate": 3.462844651154027e-06, "loss": 0.8331, "step": 20827 }, { "epoch": 0.39, "learning_rate": 3.462703668300731e-06, "loss": 0.9533, "step": 20828 }, { "epoch": 0.39, "learning_rate": 3.462562681852729e-06, "loss": 0.8677, "step": 20829 }, { "epoch": 0.39, "learning_rate": 3.4624216918105475e-06, "loss": 0.9066, "step": 20830 }, { "epoch": 0.39, "learning_rate": 3.4622806981747128e-06, "loss": 1.1323, "step": 20831 }, { "epoch": 0.39, "learning_rate": 3.462139700945752e-06, "loss": 0.9327, "step": 20832 }, { "epoch": 0.39, "learning_rate": 3.4619987001241907e-06, "loss": 0.6954, "step": 20833 }, { "epoch": 0.39, "learning_rate": 3.4618576957105554e-06, "loss": 1.0749, "step": 20834 }, { "epoch": 0.39, "learning_rate": 3.4617166877053738e-06, "loss": 0.7036, "step": 20835 }, { "epoch": 0.39, "learning_rate": 3.4615756761091706e-06, "loss": 1.1244, "step": 20836 }, { "epoch": 0.39, "learning_rate": 3.4614346609224735e-06, "loss": 1.0073, "step": 20837 }, { "epoch": 0.39, "learning_rate": 3.4612936421458098e-06, "loss": 1.0429, "step": 20838 }, { "epoch": 0.39, "learning_rate": 3.461152619779704e-06, "loss": 0.9676, "step": 20839 }, { "epoch": 0.39, "learning_rate": 3.461011593824685e-06, "loss": 0.9771, "step": 20840 }, { "epoch": 0.39, "learning_rate": 3.4608705642812773e-06, "loss": 0.8739, "step": 20841 }, { "epoch": 0.39, "learning_rate": 3.4607295311500085e-06, "loss": 0.999, "step": 20842 }, { "epoch": 0.39, "learning_rate": 3.460588494431405e-06, "loss": 1.1025, "step": 20843 }, { "epoch": 0.39, "learning_rate": 3.4604474541259935e-06, "loss": 1.0364, "step": 20844 }, { "epoch": 0.39, "learning_rate": 3.460306410234301e-06, "loss": 0.8734, "step": 20845 }, { "epoch": 0.39, "learning_rate": 3.4601653627568534e-06, "loss": 0.9416, "step": 20846 }, { "epoch": 0.39, "learning_rate": 3.460024311694178e-06, "loss": 1.0302, "step": 20847 }, { "epoch": 0.39, "learning_rate": 3.459883257046801e-06, "loss": 0.7956, "step": 20848 }, { "epoch": 0.39, "learning_rate": 3.45974219881525e-06, "loss": 0.9843, "step": 20849 }, { "epoch": 0.39, "learning_rate": 3.4596011370000505e-06, "loss": 1.0725, "step": 20850 }, { "epoch": 0.39, "learning_rate": 3.4594600716017294e-06, "loss": 1.0101, "step": 20851 }, { "epoch": 0.39, "learning_rate": 3.459319002620814e-06, "loss": 0.9457, "step": 20852 }, { "epoch": 0.39, "learning_rate": 3.4591779300578316e-06, "loss": 0.885, "step": 20853 }, { "epoch": 0.39, "learning_rate": 3.4590368539133078e-06, "loss": 0.8251, "step": 20854 }, { "epoch": 0.39, "learning_rate": 3.458895774187769e-06, "loss": 0.9594, "step": 20855 }, { "epoch": 0.39, "learning_rate": 3.4587546908817448e-06, "loss": 1.2118, "step": 20856 }, { "epoch": 0.39, "learning_rate": 3.458613603995758e-06, "loss": 1.0772, "step": 20857 }, { "epoch": 0.39, "learning_rate": 3.4584725135303376e-06, "loss": 0.9059, "step": 20858 }, { "epoch": 0.39, "learning_rate": 3.458331419486012e-06, "loss": 0.7354, "step": 20859 }, { "epoch": 0.39, "learning_rate": 3.4581903218633046e-06, "loss": 1.0436, "step": 20860 }, { "epoch": 0.39, "learning_rate": 3.458049220662744e-06, "loss": 0.8276, "step": 20861 }, { "epoch": 0.39, "learning_rate": 3.4579081158848575e-06, "loss": 1.047, "step": 20862 }, { "epoch": 0.39, "learning_rate": 3.4577670075301715e-06, "loss": 1.0949, "step": 20863 }, { "epoch": 0.39, "learning_rate": 3.4576258955992125e-06, "loss": 0.9999, "step": 20864 }, { "epoch": 0.39, "learning_rate": 3.4574847800925076e-06, "loss": 0.9705, "step": 20865 }, { "epoch": 0.39, "learning_rate": 3.4573436610105843e-06, "loss": 0.8841, "step": 20866 }, { "epoch": 0.39, "learning_rate": 3.4572025383539685e-06, "loss": 0.9784, "step": 20867 }, { "epoch": 0.39, "learning_rate": 3.4570614121231888e-06, "loss": 0.9239, "step": 20868 }, { "epoch": 0.39, "learning_rate": 3.4569202823187707e-06, "loss": 0.9327, "step": 20869 }, { "epoch": 0.39, "learning_rate": 3.4567791489412415e-06, "loss": 0.9186, "step": 20870 }, { "epoch": 0.39, "learning_rate": 3.456638011991128e-06, "loss": 0.7599, "step": 20871 }, { "epoch": 0.39, "learning_rate": 3.4564968714689577e-06, "loss": 0.8592, "step": 20872 }, { "epoch": 0.39, "learning_rate": 3.4563557273752573e-06, "loss": 0.7271, "step": 20873 }, { "epoch": 0.39, "learning_rate": 3.4562145797105553e-06, "loss": 1.2004, "step": 20874 }, { "epoch": 0.39, "learning_rate": 3.4560734284753756e-06, "loss": 0.9293, "step": 20875 }, { "epoch": 0.39, "learning_rate": 3.4559322736702477e-06, "loss": 0.8871, "step": 20876 }, { "epoch": 0.39, "learning_rate": 3.455791115295698e-06, "loss": 0.9501, "step": 20877 }, { "epoch": 0.39, "learning_rate": 3.455649953352253e-06, "loss": 0.9082, "step": 20878 }, { "epoch": 0.39, "learning_rate": 3.455508787840441e-06, "loss": 0.8263, "step": 20879 }, { "epoch": 0.39, "learning_rate": 3.455367618760789e-06, "loss": 0.8557, "step": 20880 }, { "epoch": 0.39, "learning_rate": 3.455226446113823e-06, "loss": 1.0726, "step": 20881 }, { "epoch": 0.39, "learning_rate": 3.4550852699000703e-06, "loss": 0.8551, "step": 20882 }, { "epoch": 0.39, "learning_rate": 3.454944090120059e-06, "loss": 0.9714, "step": 20883 }, { "epoch": 0.39, "learning_rate": 3.454802906774316e-06, "loss": 0.9148, "step": 20884 }, { "epoch": 0.39, "learning_rate": 3.454661719863367e-06, "loss": 1.0519, "step": 20885 }, { "epoch": 0.39, "learning_rate": 3.4545205293877416e-06, "loss": 0.7509, "step": 20886 }, { "epoch": 0.39, "learning_rate": 3.454379335347966e-06, "loss": 1.0465, "step": 20887 }, { "epoch": 0.39, "learning_rate": 3.4542381377445666e-06, "loss": 1.1437, "step": 20888 }, { "epoch": 0.39, "learning_rate": 3.454096936578071e-06, "loss": 0.9613, "step": 20889 }, { "epoch": 0.39, "learning_rate": 3.4539557318490073e-06, "loss": 0.7754, "step": 20890 }, { "epoch": 0.39, "learning_rate": 3.4538145235579018e-06, "loss": 0.8038, "step": 20891 }, { "epoch": 0.39, "learning_rate": 3.4536733117052823e-06, "loss": 0.725, "step": 20892 }, { "epoch": 0.39, "learning_rate": 3.453532096291676e-06, "loss": 0.8972, "step": 20893 }, { "epoch": 0.39, "learning_rate": 3.4533908773176095e-06, "loss": 1.0381, "step": 20894 }, { "epoch": 0.39, "learning_rate": 3.4532496547836115e-06, "loss": 0.7293, "step": 20895 }, { "epoch": 0.39, "learning_rate": 3.4531084286902083e-06, "loss": 1.0135, "step": 20896 }, { "epoch": 0.39, "learning_rate": 3.452967199037927e-06, "loss": 0.9443, "step": 20897 }, { "epoch": 0.39, "learning_rate": 3.4528259658272957e-06, "loss": 0.8272, "step": 20898 }, { "epoch": 0.39, "learning_rate": 3.4526847290588412e-06, "loss": 0.9581, "step": 20899 }, { "epoch": 0.39, "learning_rate": 3.452543488733091e-06, "loss": 1.1022, "step": 20900 }, { "epoch": 0.39, "learning_rate": 3.4524022448505734e-06, "loss": 0.8691, "step": 20901 }, { "epoch": 0.39, "learning_rate": 3.452260997411815e-06, "loss": 1.1459, "step": 20902 }, { "epoch": 0.39, "learning_rate": 3.4521197464173427e-06, "loss": 0.8635, "step": 20903 }, { "epoch": 0.39, "learning_rate": 3.4519784918676846e-06, "loss": 0.8317, "step": 20904 }, { "epoch": 0.39, "learning_rate": 3.451837233763368e-06, "loss": 1.0784, "step": 20905 }, { "epoch": 0.39, "learning_rate": 3.45169597210492e-06, "loss": 0.9572, "step": 20906 }, { "epoch": 0.39, "learning_rate": 3.451554706892869e-06, "loss": 1.0087, "step": 20907 }, { "epoch": 0.39, "learning_rate": 3.4514134381277414e-06, "loss": 0.7148, "step": 20908 }, { "epoch": 0.39, "learning_rate": 3.4512721658100655e-06, "loss": 0.8147, "step": 20909 }, { "epoch": 0.39, "learning_rate": 3.4511308899403688e-06, "loss": 0.9805, "step": 20910 }, { "epoch": 0.39, "learning_rate": 3.450989610519178e-06, "loss": 1.0078, "step": 20911 }, { "epoch": 0.39, "learning_rate": 3.4508483275470216e-06, "loss": 1.1076, "step": 20912 }, { "epoch": 0.39, "learning_rate": 3.4507070410244258e-06, "loss": 0.8718, "step": 20913 }, { "epoch": 0.39, "learning_rate": 3.45056575095192e-06, "loss": 0.7791, "step": 20914 }, { "epoch": 0.39, "learning_rate": 3.4504244573300304e-06, "loss": 1.034, "step": 20915 }, { "epoch": 0.39, "learning_rate": 3.4502831601592855e-06, "loss": 0.8172, "step": 20916 }, { "epoch": 0.39, "learning_rate": 3.450141859440212e-06, "loss": 0.8422, "step": 20917 }, { "epoch": 0.39, "learning_rate": 3.4500005551733377e-06, "loss": 1.2591, "step": 20918 }, { "epoch": 0.39, "learning_rate": 3.449859247359191e-06, "loss": 1.2448, "step": 20919 }, { "epoch": 0.39, "learning_rate": 3.4497179359982983e-06, "loss": 1.0037, "step": 20920 }, { "epoch": 0.39, "learning_rate": 3.4495766210911884e-06, "loss": 0.8957, "step": 20921 }, { "epoch": 0.39, "learning_rate": 3.4494353026383887e-06, "loss": 0.9131, "step": 20922 }, { "epoch": 0.39, "learning_rate": 3.4492939806404267e-06, "loss": 0.9484, "step": 20923 }, { "epoch": 0.39, "learning_rate": 3.449152655097829e-06, "loss": 0.9539, "step": 20924 }, { "epoch": 0.39, "learning_rate": 3.4490113260111263e-06, "loss": 1.1146, "step": 20925 }, { "epoch": 0.39, "learning_rate": 3.4488699933808434e-06, "loss": 0.9817, "step": 20926 }, { "epoch": 0.39, "learning_rate": 3.4487286572075085e-06, "loss": 0.8002, "step": 20927 }, { "epoch": 0.39, "learning_rate": 3.4485873174916505e-06, "loss": 0.8901, "step": 20928 }, { "epoch": 0.39, "learning_rate": 3.448445974233796e-06, "loss": 0.9523, "step": 20929 }, { "epoch": 0.39, "learning_rate": 3.4483046274344746e-06, "loss": 1.006, "step": 20930 }, { "epoch": 0.39, "learning_rate": 3.448163277094212e-06, "loss": 0.8347, "step": 20931 }, { "epoch": 0.39, "learning_rate": 3.448021923213536e-06, "loss": 1.0098, "step": 20932 }, { "epoch": 0.39, "learning_rate": 3.447880565792976e-06, "loss": 0.8831, "step": 20933 }, { "epoch": 0.39, "learning_rate": 3.447739204833059e-06, "loss": 1.0509, "step": 20934 }, { "epoch": 0.39, "learning_rate": 3.4475978403343125e-06, "loss": 1.0314, "step": 20935 }, { "epoch": 0.39, "learning_rate": 3.447456472297266e-06, "loss": 0.9869, "step": 20936 }, { "epoch": 0.4, "learning_rate": 3.4473151007224447e-06, "loss": 1.2188, "step": 20937 }, { "epoch": 0.4, "learning_rate": 3.4471737256103784e-06, "loss": 1.1248, "step": 20938 }, { "epoch": 0.4, "learning_rate": 3.4470323469615946e-06, "loss": 0.9684, "step": 20939 }, { "epoch": 0.4, "learning_rate": 3.44689096477662e-06, "loss": 0.9189, "step": 20940 }, { "epoch": 0.4, "learning_rate": 3.446749579055984e-06, "loss": 0.9647, "step": 20941 }, { "epoch": 0.4, "learning_rate": 3.446608189800215e-06, "loss": 0.8016, "step": 20942 }, { "epoch": 0.4, "learning_rate": 3.4464667970098397e-06, "loss": 1.2115, "step": 20943 }, { "epoch": 0.4, "learning_rate": 3.4463254006853858e-06, "loss": 1.0378, "step": 20944 }, { "epoch": 0.4, "learning_rate": 3.4461840008273828e-06, "loss": 1.0357, "step": 20945 }, { "epoch": 0.4, "learning_rate": 3.446042597436357e-06, "loss": 0.9492, "step": 20946 }, { "epoch": 0.4, "learning_rate": 3.4459011905128376e-06, "loss": 0.804, "step": 20947 }, { "epoch": 0.4, "learning_rate": 3.4457597800573517e-06, "loss": 1.0994, "step": 20948 }, { "epoch": 0.4, "learning_rate": 3.445618366070428e-06, "loss": 0.9651, "step": 20949 }, { "epoch": 0.4, "learning_rate": 3.4454769485525942e-06, "loss": 1.1993, "step": 20950 }, { "epoch": 0.4, "learning_rate": 3.4453355275043786e-06, "loss": 0.8166, "step": 20951 }, { "epoch": 0.4, "learning_rate": 3.4451941029263094e-06, "loss": 0.8012, "step": 20952 }, { "epoch": 0.4, "learning_rate": 3.445052674818914e-06, "loss": 0.8047, "step": 20953 }, { "epoch": 0.4, "learning_rate": 3.4449112431827207e-06, "loss": 0.8341, "step": 20954 }, { "epoch": 0.4, "learning_rate": 3.444769808018258e-06, "loss": 0.849, "step": 20955 }, { "epoch": 0.4, "learning_rate": 3.4446283693260542e-06, "loss": 1.2408, "step": 20956 }, { "epoch": 0.4, "learning_rate": 3.4444869271066367e-06, "loss": 0.7729, "step": 20957 }, { "epoch": 0.4, "learning_rate": 3.4443454813605336e-06, "loss": 0.9963, "step": 20958 }, { "epoch": 0.4, "learning_rate": 3.444204032088274e-06, "loss": 0.9027, "step": 20959 }, { "epoch": 0.4, "learning_rate": 3.444062579290386e-06, "loss": 0.8186, "step": 20960 }, { "epoch": 0.4, "learning_rate": 3.443921122967396e-06, "loss": 0.9953, "step": 20961 }, { "epoch": 0.4, "learning_rate": 3.443779663119834e-06, "loss": 0.9836, "step": 20962 }, { "epoch": 0.4, "learning_rate": 3.4436381997482275e-06, "loss": 0.9783, "step": 20963 }, { "epoch": 0.4, "learning_rate": 3.4434967328531055e-06, "loss": 0.9301, "step": 20964 }, { "epoch": 0.4, "learning_rate": 3.4433552624349947e-06, "loss": 0.9291, "step": 20965 }, { "epoch": 0.4, "learning_rate": 3.4432137884944254e-06, "loss": 0.9094, "step": 20966 }, { "epoch": 0.4, "learning_rate": 3.443072311031924e-06, "loss": 0.839, "step": 20967 }, { "epoch": 0.4, "learning_rate": 3.4429308300480195e-06, "loss": 0.9906, "step": 20968 }, { "epoch": 0.4, "learning_rate": 3.4427893455432404e-06, "loss": 1.0173, "step": 20969 }, { "epoch": 0.4, "learning_rate": 3.4426478575181145e-06, "loss": 0.7985, "step": 20970 }, { "epoch": 0.4, "learning_rate": 3.4425063659731707e-06, "loss": 0.8744, "step": 20971 }, { "epoch": 0.4, "learning_rate": 3.4423648709089376e-06, "loss": 1.0748, "step": 20972 }, { "epoch": 0.4, "learning_rate": 3.442223372325942e-06, "loss": 0.8069, "step": 20973 }, { "epoch": 0.4, "learning_rate": 3.4420818702247133e-06, "loss": 1.0273, "step": 20974 }, { "epoch": 0.4, "learning_rate": 3.44194036460578e-06, "loss": 0.9301, "step": 20975 }, { "epoch": 0.4, "learning_rate": 3.44179885546967e-06, "loss": 0.8846, "step": 20976 }, { "epoch": 0.4, "learning_rate": 3.4416573428169125e-06, "loss": 0.819, "step": 20977 }, { "epoch": 0.4, "learning_rate": 3.4415158266480353e-06, "loss": 0.9828, "step": 20978 }, { "epoch": 0.4, "learning_rate": 3.441374306963567e-06, "loss": 0.7664, "step": 20979 }, { "epoch": 0.4, "learning_rate": 3.4412327837640354e-06, "loss": 0.8378, "step": 20980 }, { "epoch": 0.4, "learning_rate": 3.4410912570499698e-06, "loss": 1.1933, "step": 20981 }, { "epoch": 0.4, "learning_rate": 3.4409497268218974e-06, "loss": 1.0263, "step": 20982 }, { "epoch": 0.4, "learning_rate": 3.4408081930803484e-06, "loss": 0.8521, "step": 20983 }, { "epoch": 0.4, "learning_rate": 3.4406666558258506e-06, "loss": 0.8985, "step": 20984 }, { "epoch": 0.4, "learning_rate": 3.440525115058932e-06, "loss": 0.86, "step": 20985 }, { "epoch": 0.4, "learning_rate": 3.4403835707801216e-06, "loss": 0.9542, "step": 20986 }, { "epoch": 0.4, "learning_rate": 3.440242022989948e-06, "loss": 1.1835, "step": 20987 }, { "epoch": 0.4, "learning_rate": 3.440100471688939e-06, "loss": 1.0031, "step": 20988 }, { "epoch": 0.4, "learning_rate": 3.4399589168776237e-06, "loss": 1.0306, "step": 20989 }, { "epoch": 0.4, "learning_rate": 3.439817358556531e-06, "loss": 0.8387, "step": 20990 }, { "epoch": 0.4, "learning_rate": 3.4396757967261886e-06, "loss": 0.8584, "step": 20991 }, { "epoch": 0.4, "learning_rate": 3.439534231387126e-06, "loss": 0.9488, "step": 20992 }, { "epoch": 0.4, "learning_rate": 3.4393926625398716e-06, "loss": 0.9523, "step": 20993 }, { "epoch": 0.4, "learning_rate": 3.4392510901849535e-06, "loss": 1.1423, "step": 20994 }, { "epoch": 0.4, "learning_rate": 3.4391095143229e-06, "loss": 0.9391, "step": 20995 }, { "epoch": 0.4, "learning_rate": 3.4389679349542414e-06, "loss": 0.8502, "step": 20996 }, { "epoch": 0.4, "learning_rate": 3.438826352079505e-06, "loss": 1.0134, "step": 20997 }, { "epoch": 0.4, "learning_rate": 3.4386847656992197e-06, "loss": 0.8165, "step": 20998 }, { "epoch": 0.4, "learning_rate": 3.438543175813914e-06, "loss": 0.7541, "step": 20999 }, { "epoch": 0.4, "learning_rate": 3.4384015824241174e-06, "loss": 0.9465, "step": 21000 }, { "epoch": 0.4, "learning_rate": 3.4382599855303576e-06, "loss": 0.9706, "step": 21001 }, { "epoch": 0.4, "learning_rate": 3.4381183851331644e-06, "loss": 0.8835, "step": 21002 }, { "epoch": 0.4, "learning_rate": 3.437976781233065e-06, "loss": 1.0265, "step": 21003 }, { "epoch": 0.4, "learning_rate": 3.4378351738305894e-06, "loss": 0.7902, "step": 21004 }, { "epoch": 0.4, "learning_rate": 3.4376935629262664e-06, "loss": 1.0976, "step": 21005 }, { "epoch": 0.4, "learning_rate": 3.4375519485206242e-06, "loss": 1.0564, "step": 21006 }, { "epoch": 0.4, "learning_rate": 3.4374103306141915e-06, "loss": 0.9008, "step": 21007 }, { "epoch": 0.4, "learning_rate": 3.437268709207498e-06, "loss": 1.0558, "step": 21008 }, { "epoch": 0.4, "learning_rate": 3.4371270843010716e-06, "loss": 0.885, "step": 21009 }, { "epoch": 0.4, "learning_rate": 3.4369854558954406e-06, "loss": 0.788, "step": 21010 }, { "epoch": 0.4, "learning_rate": 3.4368438239911354e-06, "loss": 0.95, "step": 21011 }, { "epoch": 0.4, "learning_rate": 3.436702188588684e-06, "loss": 1.2037, "step": 21012 }, { "epoch": 0.4, "learning_rate": 3.436560549688615e-06, "loss": 1.1458, "step": 21013 }, { "epoch": 0.4, "learning_rate": 3.436418907291459e-06, "loss": 1.1487, "step": 21014 }, { "epoch": 0.4, "learning_rate": 3.4362772613977417e-06, "loss": 0.7841, "step": 21015 }, { "epoch": 0.4, "learning_rate": 3.4361356120079947e-06, "loss": 0.9029, "step": 21016 }, { "epoch": 0.4, "learning_rate": 3.435993959122746e-06, "loss": 0.885, "step": 21017 }, { "epoch": 0.4, "learning_rate": 3.435852302742524e-06, "loss": 1.0854, "step": 21018 }, { "epoch": 0.4, "learning_rate": 3.4357106428678588e-06, "loss": 1.1823, "step": 21019 }, { "epoch": 0.4, "learning_rate": 3.4355689794992793e-06, "loss": 0.9568, "step": 21020 }, { "epoch": 0.4, "learning_rate": 3.435427312637313e-06, "loss": 0.8226, "step": 21021 }, { "epoch": 0.4, "learning_rate": 3.43528564228249e-06, "loss": 0.9146, "step": 21022 }, { "epoch": 0.4, "learning_rate": 3.4351439684353396e-06, "loss": 0.8061, "step": 21023 }, { "epoch": 0.4, "learning_rate": 3.4350022910963886e-06, "loss": 0.8726, "step": 21024 }, { "epoch": 0.4, "learning_rate": 3.434860610266169e-06, "loss": 1.0545, "step": 21025 }, { "epoch": 0.4, "learning_rate": 3.4347189259452086e-06, "loss": 0.8833, "step": 21026 }, { "epoch": 0.4, "learning_rate": 3.4345772381340365e-06, "loss": 0.9581, "step": 21027 }, { "epoch": 0.4, "learning_rate": 3.4344355468331815e-06, "loss": 0.9844, "step": 21028 }, { "epoch": 0.4, "learning_rate": 3.434293852043173e-06, "loss": 0.9018, "step": 21029 }, { "epoch": 0.4, "learning_rate": 3.4341521537645396e-06, "loss": 1.0739, "step": 21030 }, { "epoch": 0.4, "learning_rate": 3.4340104519978103e-06, "loss": 1.1519, "step": 21031 }, { "epoch": 0.4, "learning_rate": 3.433868746743515e-06, "loss": 0.9587, "step": 21032 }, { "epoch": 0.4, "learning_rate": 3.4337270380021827e-06, "loss": 0.9073, "step": 21033 }, { "epoch": 0.4, "learning_rate": 3.433585325774341e-06, "loss": 1.0243, "step": 21034 }, { "epoch": 0.4, "learning_rate": 3.4334436100605222e-06, "loss": 0.7298, "step": 21035 }, { "epoch": 0.4, "learning_rate": 3.4333018908612526e-06, "loss": 0.8151, "step": 21036 }, { "epoch": 0.4, "learning_rate": 3.433160168177062e-06, "loss": 0.9835, "step": 21037 }, { "epoch": 0.4, "learning_rate": 3.4330184420084807e-06, "loss": 1.0128, "step": 21038 }, { "epoch": 0.4, "learning_rate": 3.4328767123560367e-06, "loss": 0.8094, "step": 21039 }, { "epoch": 0.4, "learning_rate": 3.4327349792202596e-06, "loss": 0.9596, "step": 21040 }, { "epoch": 0.4, "learning_rate": 3.4325932426016795e-06, "loss": 0.7957, "step": 21041 }, { "epoch": 0.4, "learning_rate": 3.432451502500824e-06, "loss": 0.9791, "step": 21042 }, { "epoch": 0.4, "learning_rate": 3.4323097589182237e-06, "loss": 0.9781, "step": 21043 }, { "epoch": 0.4, "learning_rate": 3.4321680118544073e-06, "loss": 0.9865, "step": 21044 }, { "epoch": 0.4, "learning_rate": 3.4320262613099033e-06, "loss": 1.0086, "step": 21045 }, { "epoch": 0.4, "learning_rate": 3.4318845072852425e-06, "loss": 0.9757, "step": 21046 }, { "epoch": 0.4, "learning_rate": 3.4317427497809534e-06, "loss": 0.8086, "step": 21047 }, { "epoch": 0.4, "learning_rate": 3.4316009887975655e-06, "loss": 0.6396, "step": 21048 }, { "epoch": 0.4, "learning_rate": 3.431459224335608e-06, "loss": 1.0267, "step": 21049 }, { "epoch": 0.4, "learning_rate": 3.431317456395611e-06, "loss": 1.0955, "step": 21050 }, { "epoch": 0.4, "learning_rate": 3.431175684978102e-06, "loss": 0.7352, "step": 21051 }, { "epoch": 0.4, "learning_rate": 3.431033910083612e-06, "loss": 1.0153, "step": 21052 }, { "epoch": 0.4, "learning_rate": 3.43089213171267e-06, "loss": 0.8884, "step": 21053 }, { "epoch": 0.4, "learning_rate": 3.430750349865805e-06, "loss": 0.8069, "step": 21054 }, { "epoch": 0.4, "learning_rate": 3.4306085645435478e-06, "loss": 0.8485, "step": 21055 }, { "epoch": 0.4, "learning_rate": 3.4304667757464256e-06, "loss": 1.2046, "step": 21056 }, { "epoch": 0.4, "learning_rate": 3.4303249834749696e-06, "loss": 1.0731, "step": 21057 }, { "epoch": 0.4, "learning_rate": 3.430183187729708e-06, "loss": 0.9669, "step": 21058 }, { "epoch": 0.4, "learning_rate": 3.4300413885111712e-06, "loss": 0.9547, "step": 21059 }, { "epoch": 0.4, "learning_rate": 3.4298995858198886e-06, "loss": 0.859, "step": 21060 }, { "epoch": 0.4, "learning_rate": 3.4297577796563896e-06, "loss": 0.8542, "step": 21061 }, { "epoch": 0.4, "learning_rate": 3.4296159700212032e-06, "loss": 0.9354, "step": 21062 }, { "epoch": 0.4, "learning_rate": 3.4294741569148593e-06, "loss": 0.9506, "step": 21063 }, { "epoch": 0.4, "learning_rate": 3.4293323403378877e-06, "loss": 0.9271, "step": 21064 }, { "epoch": 0.4, "learning_rate": 3.429190520290817e-06, "loss": 0.954, "step": 21065 }, { "epoch": 0.4, "learning_rate": 3.4290486967741777e-06, "loss": 0.8893, "step": 21066 }, { "epoch": 0.4, "learning_rate": 3.4289068697884997e-06, "loss": 0.8588, "step": 21067 }, { "epoch": 0.4, "learning_rate": 3.428765039334311e-06, "loss": 1.0174, "step": 21068 }, { "epoch": 0.4, "learning_rate": 3.428623205412143e-06, "loss": 0.977, "step": 21069 }, { "epoch": 0.4, "learning_rate": 3.428481368022524e-06, "loss": 0.9609, "step": 21070 }, { "epoch": 0.4, "learning_rate": 3.4283395271659835e-06, "loss": 1.1224, "step": 21071 }, { "epoch": 0.4, "learning_rate": 3.428197682843052e-06, "loss": 1.0507, "step": 21072 }, { "epoch": 0.4, "learning_rate": 3.428055835054259e-06, "loss": 0.7119, "step": 21073 }, { "epoch": 0.4, "learning_rate": 3.4279139838001343e-06, "loss": 0.8158, "step": 21074 }, { "epoch": 0.4, "learning_rate": 3.427772129081206e-06, "loss": 0.9054, "step": 21075 }, { "epoch": 0.4, "learning_rate": 3.4276302708980065e-06, "loss": 0.951, "step": 21076 }, { "epoch": 0.4, "learning_rate": 3.427488409251063e-06, "loss": 1.1556, "step": 21077 }, { "epoch": 0.4, "learning_rate": 3.4273465441409065e-06, "loss": 0.7357, "step": 21078 }, { "epoch": 0.4, "learning_rate": 3.4272046755680666e-06, "loss": 0.8463, "step": 21079 }, { "epoch": 0.4, "learning_rate": 3.4270628035330726e-06, "loss": 0.8198, "step": 21080 }, { "epoch": 0.4, "learning_rate": 3.4269209280364545e-06, "loss": 1.0437, "step": 21081 }, { "epoch": 0.4, "learning_rate": 3.426779049078743e-06, "loss": 0.9742, "step": 21082 }, { "epoch": 0.4, "learning_rate": 3.4266371666604658e-06, "loss": 0.9285, "step": 21083 }, { "epoch": 0.4, "learning_rate": 3.4264952807821544e-06, "loss": 0.7618, "step": 21084 }, { "epoch": 0.4, "learning_rate": 3.426353391444338e-06, "loss": 0.8783, "step": 21085 }, { "epoch": 0.4, "learning_rate": 3.4262114986475464e-06, "loss": 0.8829, "step": 21086 }, { "epoch": 0.4, "learning_rate": 3.426069602392309e-06, "loss": 1.1663, "step": 21087 }, { "epoch": 0.4, "learning_rate": 3.4259277026791565e-06, "loss": 0.9033, "step": 21088 }, { "epoch": 0.4, "learning_rate": 3.4257857995086184e-06, "loss": 0.7355, "step": 21089 }, { "epoch": 0.4, "learning_rate": 3.425643892881224e-06, "loss": 0.7184, "step": 21090 }, { "epoch": 0.4, "learning_rate": 3.425501982797505e-06, "loss": 0.9865, "step": 21091 }, { "epoch": 0.4, "learning_rate": 3.425360069257989e-06, "loss": 1.0082, "step": 21092 }, { "epoch": 0.4, "learning_rate": 3.4252181522632066e-06, "loss": 1.3608, "step": 21093 }, { "epoch": 0.4, "learning_rate": 3.425076231813689e-06, "loss": 1.0994, "step": 21094 }, { "epoch": 0.4, "learning_rate": 3.4249343079099637e-06, "loss": 1.0388, "step": 21095 }, { "epoch": 0.4, "learning_rate": 3.424792380552563e-06, "loss": 0.691, "step": 21096 }, { "epoch": 0.4, "learning_rate": 3.4246504497420163e-06, "loss": 0.7924, "step": 21097 }, { "epoch": 0.4, "learning_rate": 3.424508515478852e-06, "loss": 1.0046, "step": 21098 }, { "epoch": 0.4, "learning_rate": 3.424366577763602e-06, "loss": 1.1315, "step": 21099 }, { "epoch": 0.4, "learning_rate": 3.424224636596795e-06, "loss": 0.9948, "step": 21100 }, { "epoch": 0.4, "learning_rate": 3.424082691978962e-06, "loss": 0.8342, "step": 21101 }, { "epoch": 0.4, "learning_rate": 3.4239407439106325e-06, "loss": 0.8705, "step": 21102 }, { "epoch": 0.4, "learning_rate": 3.423798792392337e-06, "loss": 1.0643, "step": 21103 }, { "epoch": 0.4, "learning_rate": 3.423656837424605e-06, "loss": 0.878, "step": 21104 }, { "epoch": 0.4, "learning_rate": 3.4235148790079657e-06, "loss": 1.0709, "step": 21105 }, { "epoch": 0.4, "learning_rate": 3.4233729171429512e-06, "loss": 1.1758, "step": 21106 }, { "epoch": 0.4, "learning_rate": 3.4232309518300904e-06, "loss": 1.03, "step": 21107 }, { "epoch": 0.4, "learning_rate": 3.4230889830699127e-06, "loss": 0.92, "step": 21108 }, { "epoch": 0.4, "learning_rate": 3.4229470108629503e-06, "loss": 0.9542, "step": 21109 }, { "epoch": 0.4, "learning_rate": 3.4228050352097307e-06, "loss": 0.7187, "step": 21110 }, { "epoch": 0.4, "learning_rate": 3.4226630561107865e-06, "loss": 0.6967, "step": 21111 }, { "epoch": 0.4, "learning_rate": 3.4225210735666468e-06, "loss": 1.1917, "step": 21112 }, { "epoch": 0.4, "learning_rate": 3.4223790875778413e-06, "loss": 1.0437, "step": 21113 }, { "epoch": 0.4, "learning_rate": 3.4222370981449004e-06, "loss": 0.9865, "step": 21114 }, { "epoch": 0.4, "learning_rate": 3.422095105268354e-06, "loss": 0.9322, "step": 21115 }, { "epoch": 0.4, "learning_rate": 3.4219531089487334e-06, "loss": 0.7766, "step": 21116 }, { "epoch": 0.4, "learning_rate": 3.421811109186568e-06, "loss": 0.9535, "step": 21117 }, { "epoch": 0.4, "learning_rate": 3.4216691059823886e-06, "loss": 0.9274, "step": 21118 }, { "epoch": 0.4, "learning_rate": 3.421527099336725e-06, "loss": 1.1005, "step": 21119 }, { "epoch": 0.4, "learning_rate": 3.421385089250107e-06, "loss": 0.7225, "step": 21120 }, { "epoch": 0.4, "learning_rate": 3.421243075723065e-06, "loss": 0.9271, "step": 21121 }, { "epoch": 0.4, "learning_rate": 3.4211010587561298e-06, "loss": 0.9567, "step": 21122 }, { "epoch": 0.4, "learning_rate": 3.420959038349832e-06, "loss": 0.8023, "step": 21123 }, { "epoch": 0.4, "learning_rate": 3.4208170145047016e-06, "loss": 0.7996, "step": 21124 }, { "epoch": 0.4, "learning_rate": 3.4206749872212684e-06, "loss": 1.0584, "step": 21125 }, { "epoch": 0.4, "learning_rate": 3.4205329565000626e-06, "loss": 0.9385, "step": 21126 }, { "epoch": 0.4, "learning_rate": 3.4203909223416154e-06, "loss": 0.7559, "step": 21127 }, { "epoch": 0.4, "learning_rate": 3.4202488847464564e-06, "loss": 0.9351, "step": 21128 }, { "epoch": 0.4, "learning_rate": 3.4201068437151165e-06, "loss": 1.0097, "step": 21129 }, { "epoch": 0.4, "learning_rate": 3.419964799248126e-06, "loss": 1.0351, "step": 21130 }, { "epoch": 0.4, "learning_rate": 3.4198227513460146e-06, "loss": 1.0109, "step": 21131 }, { "epoch": 0.4, "learning_rate": 3.4196807000093135e-06, "loss": 0.9747, "step": 21132 }, { "epoch": 0.4, "learning_rate": 3.4195386452385536e-06, "loss": 0.6066, "step": 21133 }, { "epoch": 0.4, "learning_rate": 3.419396587034264e-06, "loss": 0.7864, "step": 21134 }, { "epoch": 0.4, "learning_rate": 3.4192545253969757e-06, "loss": 0.6768, "step": 21135 }, { "epoch": 0.4, "learning_rate": 3.4191124603272185e-06, "loss": 0.8244, "step": 21136 }, { "epoch": 0.4, "learning_rate": 3.4189703918255247e-06, "loss": 1.0414, "step": 21137 }, { "epoch": 0.4, "learning_rate": 3.4188283198924226e-06, "loss": 1.1368, "step": 21138 }, { "epoch": 0.4, "learning_rate": 3.418686244528445e-06, "loss": 0.9016, "step": 21139 }, { "epoch": 0.4, "learning_rate": 3.41854416573412e-06, "loss": 1.0279, "step": 21140 }, { "epoch": 0.4, "learning_rate": 3.4184020835099797e-06, "loss": 0.7284, "step": 21141 }, { "epoch": 0.4, "learning_rate": 3.418259997856554e-06, "loss": 0.8714, "step": 21142 }, { "epoch": 0.4, "learning_rate": 3.4181179087743737e-06, "loss": 1.1077, "step": 21143 }, { "epoch": 0.4, "learning_rate": 3.4179758162639694e-06, "loss": 1.0822, "step": 21144 }, { "epoch": 0.4, "learning_rate": 3.4178337203258714e-06, "loss": 0.8056, "step": 21145 }, { "epoch": 0.4, "learning_rate": 3.4176916209606107e-06, "loss": 0.8896, "step": 21146 }, { "epoch": 0.4, "learning_rate": 3.4175495181687173e-06, "loss": 0.9106, "step": 21147 }, { "epoch": 0.4, "learning_rate": 3.417407411950723e-06, "loss": 0.8091, "step": 21148 }, { "epoch": 0.4, "learning_rate": 3.4172653023071566e-06, "loss": 1.3039, "step": 21149 }, { "epoch": 0.4, "learning_rate": 3.417123189238549e-06, "loss": 1.0713, "step": 21150 }, { "epoch": 0.4, "learning_rate": 3.4169810727454335e-06, "loss": 1.0137, "step": 21151 }, { "epoch": 0.4, "learning_rate": 3.4168389528283376e-06, "loss": 0.9256, "step": 21152 }, { "epoch": 0.4, "learning_rate": 3.416696829487793e-06, "loss": 0.8918, "step": 21153 }, { "epoch": 0.4, "learning_rate": 3.416554702724331e-06, "loss": 0.9355, "step": 21154 }, { "epoch": 0.4, "learning_rate": 3.4164125725384816e-06, "loss": 0.9337, "step": 21155 }, { "epoch": 0.4, "learning_rate": 3.416270438930776e-06, "loss": 1.2392, "step": 21156 }, { "epoch": 0.4, "learning_rate": 3.4161283019017443e-06, "loss": 0.8389, "step": 21157 }, { "epoch": 0.4, "learning_rate": 3.4159861614519176e-06, "loss": 0.9715, "step": 21158 }, { "epoch": 0.4, "learning_rate": 3.415844017581827e-06, "loss": 0.9799, "step": 21159 }, { "epoch": 0.4, "learning_rate": 3.415701870292003e-06, "loss": 0.8713, "step": 21160 }, { "epoch": 0.4, "learning_rate": 3.415559719582976e-06, "loss": 0.8851, "step": 21161 }, { "epoch": 0.4, "learning_rate": 3.4154175654552773e-06, "loss": 0.9218, "step": 21162 }, { "epoch": 0.4, "learning_rate": 3.4152754079094377e-06, "loss": 0.9204, "step": 21163 }, { "epoch": 0.4, "learning_rate": 3.415133246945987e-06, "loss": 0.9993, "step": 21164 }, { "epoch": 0.4, "learning_rate": 3.4149910825654576e-06, "loss": 1.0212, "step": 21165 }, { "epoch": 0.4, "learning_rate": 3.414848914768379e-06, "loss": 0.9879, "step": 21166 }, { "epoch": 0.4, "learning_rate": 3.4147067435552827e-06, "loss": 0.8154, "step": 21167 }, { "epoch": 0.4, "learning_rate": 3.4145645689267e-06, "loss": 1.2453, "step": 21168 }, { "epoch": 0.4, "learning_rate": 3.414422390883161e-06, "loss": 1.1301, "step": 21169 }, { "epoch": 0.4, "learning_rate": 3.414280209425196e-06, "loss": 0.9207, "step": 21170 }, { "epoch": 0.4, "learning_rate": 3.4141380245533373e-06, "loss": 0.8507, "step": 21171 }, { "epoch": 0.4, "learning_rate": 3.413995836268115e-06, "loss": 0.9781, "step": 21172 }, { "epoch": 0.4, "learning_rate": 3.413853644570061e-06, "loss": 1.2109, "step": 21173 }, { "epoch": 0.4, "learning_rate": 3.4137114494597055e-06, "loss": 1.0804, "step": 21174 }, { "epoch": 0.4, "learning_rate": 3.413569250937579e-06, "loss": 1.0499, "step": 21175 }, { "epoch": 0.4, "learning_rate": 3.4134270490042127e-06, "loss": 1.038, "step": 21176 }, { "epoch": 0.4, "learning_rate": 3.413284843660138e-06, "loss": 0.8436, "step": 21177 }, { "epoch": 0.4, "learning_rate": 3.413142634905886e-06, "loss": 0.7879, "step": 21178 }, { "epoch": 0.4, "learning_rate": 3.4130004227419867e-06, "loss": 0.8425, "step": 21179 }, { "epoch": 0.4, "learning_rate": 3.412858207168973e-06, "loss": 0.8768, "step": 21180 }, { "epoch": 0.4, "learning_rate": 3.4127159881873738e-06, "loss": 1.1078, "step": 21181 }, { "epoch": 0.4, "learning_rate": 3.412573765797721e-06, "loss": 0.8618, "step": 21182 }, { "epoch": 0.4, "learning_rate": 3.4124315400005457e-06, "loss": 0.8829, "step": 21183 }, { "epoch": 0.4, "learning_rate": 3.4122893107963794e-06, "loss": 0.9847, "step": 21184 }, { "epoch": 0.4, "learning_rate": 3.412147078185753e-06, "loss": 0.8836, "step": 21185 }, { "epoch": 0.4, "learning_rate": 3.4120048421691975e-06, "loss": 0.9337, "step": 21186 }, { "epoch": 0.4, "learning_rate": 3.4118626027472435e-06, "loss": 1.3856, "step": 21187 }, { "epoch": 0.4, "learning_rate": 3.4117203599204226e-06, "loss": 0.9832, "step": 21188 }, { "epoch": 0.4, "learning_rate": 3.411578113689266e-06, "loss": 1.0054, "step": 21189 }, { "epoch": 0.4, "learning_rate": 3.4114358640543043e-06, "loss": 0.8738, "step": 21190 }, { "epoch": 0.4, "learning_rate": 3.4112936110160687e-06, "loss": 0.7764, "step": 21191 }, { "epoch": 0.4, "learning_rate": 3.4111513545750913e-06, "loss": 0.7896, "step": 21192 }, { "epoch": 0.4, "learning_rate": 3.4110090947319023e-06, "loss": 1.2385, "step": 21193 }, { "epoch": 0.4, "learning_rate": 3.4108668314870337e-06, "loss": 1.2143, "step": 21194 }, { "epoch": 0.4, "learning_rate": 3.4107245648410164e-06, "loss": 0.9571, "step": 21195 }, { "epoch": 0.4, "learning_rate": 3.4105822947943813e-06, "loss": 0.9075, "step": 21196 }, { "epoch": 0.4, "learning_rate": 3.41044002134766e-06, "loss": 0.7915, "step": 21197 }, { "epoch": 0.4, "learning_rate": 3.4102977445013826e-06, "loss": 0.7389, "step": 21198 }, { "epoch": 0.4, "learning_rate": 3.410155464256082e-06, "loss": 0.782, "step": 21199 }, { "epoch": 0.4, "learning_rate": 3.4100131806122883e-06, "loss": 1.0675, "step": 21200 }, { "epoch": 0.4, "learning_rate": 3.4098708935705342e-06, "loss": 0.8012, "step": 21201 }, { "epoch": 0.4, "learning_rate": 3.4097286031313497e-06, "loss": 0.9222, "step": 21202 }, { "epoch": 0.4, "learning_rate": 3.4095863092952665e-06, "loss": 0.9106, "step": 21203 }, { "epoch": 0.4, "learning_rate": 3.409444012062816e-06, "loss": 0.7685, "step": 21204 }, { "epoch": 0.4, "learning_rate": 3.409301711434529e-06, "loss": 0.9241, "step": 21205 }, { "epoch": 0.4, "learning_rate": 3.4091594074109373e-06, "loss": 1.1241, "step": 21206 }, { "epoch": 0.4, "learning_rate": 3.4090170999925733e-06, "loss": 0.9067, "step": 21207 }, { "epoch": 0.4, "learning_rate": 3.4088747891799666e-06, "loss": 0.9904, "step": 21208 }, { "epoch": 0.4, "learning_rate": 3.408732474973649e-06, "loss": 0.9234, "step": 21209 }, { "epoch": 0.4, "learning_rate": 3.408590157374153e-06, "loss": 0.8497, "step": 21210 }, { "epoch": 0.4, "learning_rate": 3.408447836382008e-06, "loss": 1.0388, "step": 21211 }, { "epoch": 0.4, "learning_rate": 3.408305511997747e-06, "loss": 1.1327, "step": 21212 }, { "epoch": 0.4, "learning_rate": 3.408163184221902e-06, "loss": 0.9043, "step": 21213 }, { "epoch": 0.4, "learning_rate": 3.408020853055003e-06, "loss": 0.9242, "step": 21214 }, { "epoch": 0.4, "learning_rate": 3.4078785184975817e-06, "loss": 1.0029, "step": 21215 }, { "epoch": 0.4, "learning_rate": 3.4077361805501707e-06, "loss": 0.9058, "step": 21216 }, { "epoch": 0.4, "learning_rate": 3.4075938392132994e-06, "loss": 0.8411, "step": 21217 }, { "epoch": 0.4, "learning_rate": 3.4074514944875013e-06, "loss": 0.8281, "step": 21218 }, { "epoch": 0.4, "learning_rate": 3.4073091463733064e-06, "loss": 0.9955, "step": 21219 }, { "epoch": 0.4, "learning_rate": 3.4071667948712477e-06, "loss": 1.1303, "step": 21220 }, { "epoch": 0.4, "learning_rate": 3.407024439981856e-06, "loss": 0.8984, "step": 21221 }, { "epoch": 0.4, "learning_rate": 3.4068820817056624e-06, "loss": 0.824, "step": 21222 }, { "epoch": 0.4, "learning_rate": 3.4067397200431995e-06, "loss": 0.6006, "step": 21223 }, { "epoch": 0.4, "learning_rate": 3.406597354994998e-06, "loss": 0.7186, "step": 21224 }, { "epoch": 0.4, "learning_rate": 3.406454986561589e-06, "loss": 1.0394, "step": 21225 }, { "epoch": 0.4, "learning_rate": 3.406312614743506e-06, "loss": 0.81, "step": 21226 }, { "epoch": 0.4, "learning_rate": 3.406170239541279e-06, "loss": 1.0092, "step": 21227 }, { "epoch": 0.4, "learning_rate": 3.406027860955441e-06, "loss": 0.845, "step": 21228 }, { "epoch": 0.4, "learning_rate": 3.4058854789865214e-06, "loss": 0.9988, "step": 21229 }, { "epoch": 0.4, "learning_rate": 3.405743093635054e-06, "loss": 0.9557, "step": 21230 }, { "epoch": 0.4, "learning_rate": 3.4056007049015692e-06, "loss": 1.0191, "step": 21231 }, { "epoch": 0.4, "learning_rate": 3.405458312786599e-06, "loss": 1.0059, "step": 21232 }, { "epoch": 0.4, "learning_rate": 3.4053159172906757e-06, "loss": 1.0133, "step": 21233 }, { "epoch": 0.4, "learning_rate": 3.4051735184143307e-06, "loss": 0.8941, "step": 21234 }, { "epoch": 0.4, "learning_rate": 3.405031116158095e-06, "loss": 0.9288, "step": 21235 }, { "epoch": 0.4, "learning_rate": 3.404888710522501e-06, "loss": 1.0502, "step": 21236 }, { "epoch": 0.4, "learning_rate": 3.4047463015080808e-06, "loss": 1.2723, "step": 21237 }, { "epoch": 0.4, "learning_rate": 3.4046038891153655e-06, "loss": 0.9945, "step": 21238 }, { "epoch": 0.4, "learning_rate": 3.404461473344886e-06, "loss": 0.7968, "step": 21239 }, { "epoch": 0.4, "learning_rate": 3.404319054197176e-06, "loss": 0.82, "step": 21240 }, { "epoch": 0.4, "learning_rate": 3.404176631672766e-06, "loss": 0.7325, "step": 21241 }, { "epoch": 0.4, "learning_rate": 3.4040342057721885e-06, "loss": 0.98, "step": 21242 }, { "epoch": 0.4, "learning_rate": 3.403891776495975e-06, "loss": 0.9386, "step": 21243 }, { "epoch": 0.4, "learning_rate": 3.403749343844657e-06, "loss": 1.0193, "step": 21244 }, { "epoch": 0.4, "learning_rate": 3.403606907818767e-06, "loss": 0.8993, "step": 21245 }, { "epoch": 0.4, "learning_rate": 3.403464468418836e-06, "loss": 1.0161, "step": 21246 }, { "epoch": 0.4, "learning_rate": 3.403322025645397e-06, "loss": 1.061, "step": 21247 }, { "epoch": 0.4, "learning_rate": 3.4031795794989808e-06, "loss": 0.9036, "step": 21248 }, { "epoch": 0.4, "learning_rate": 3.4030371299801202e-06, "loss": 0.9958, "step": 21249 }, { "epoch": 0.4, "learning_rate": 3.402894677089347e-06, "loss": 1.084, "step": 21250 }, { "epoch": 0.4, "learning_rate": 3.4027522208271914e-06, "loss": 0.8913, "step": 21251 }, { "epoch": 0.4, "learning_rate": 3.402609761194188e-06, "loss": 0.8645, "step": 21252 }, { "epoch": 0.4, "learning_rate": 3.402467298190867e-06, "loss": 0.8189, "step": 21253 }, { "epoch": 0.4, "learning_rate": 3.40232483181776e-06, "loss": 0.9067, "step": 21254 }, { "epoch": 0.4, "learning_rate": 3.4021823620754007e-06, "loss": 1.0511, "step": 21255 }, { "epoch": 0.4, "learning_rate": 3.4020398889643195e-06, "loss": 1.0732, "step": 21256 }, { "epoch": 0.4, "learning_rate": 3.4018974124850495e-06, "loss": 0.8457, "step": 21257 }, { "epoch": 0.4, "learning_rate": 3.401754932638122e-06, "loss": 0.8974, "step": 21258 }, { "epoch": 0.4, "learning_rate": 3.4016124494240695e-06, "loss": 0.9816, "step": 21259 }, { "epoch": 0.4, "learning_rate": 3.4014699628434234e-06, "loss": 0.8901, "step": 21260 }, { "epoch": 0.4, "learning_rate": 3.401327472896716e-06, "loss": 0.6544, "step": 21261 }, { "epoch": 0.4, "learning_rate": 3.40118497958448e-06, "loss": 0.9847, "step": 21262 }, { "epoch": 0.4, "learning_rate": 3.4010424829072463e-06, "loss": 0.8313, "step": 21263 }, { "epoch": 0.4, "learning_rate": 3.4008999828655483e-06, "loss": 1.0023, "step": 21264 }, { "epoch": 0.4, "learning_rate": 3.400757479459917e-06, "loss": 0.764, "step": 21265 }, { "epoch": 0.4, "learning_rate": 3.4006149726908843e-06, "loss": 0.8517, "step": 21266 }, { "epoch": 0.4, "learning_rate": 3.4004724625589835e-06, "loss": 0.9322, "step": 21267 }, { "epoch": 0.4, "learning_rate": 3.4003299490647463e-06, "loss": 0.9874, "step": 21268 }, { "epoch": 0.4, "learning_rate": 3.400187432208704e-06, "loss": 1.0762, "step": 21269 }, { "epoch": 0.4, "learning_rate": 3.4000449119913903e-06, "loss": 0.9019, "step": 21270 }, { "epoch": 0.4, "learning_rate": 3.3999023884133364e-06, "loss": 0.9625, "step": 21271 }, { "epoch": 0.4, "learning_rate": 3.3997598614750737e-06, "loss": 0.926, "step": 21272 }, { "epoch": 0.4, "learning_rate": 3.3996173311771365e-06, "loss": 1.088, "step": 21273 }, { "epoch": 0.4, "learning_rate": 3.3994747975200547e-06, "loss": 1.1632, "step": 21274 }, { "epoch": 0.4, "learning_rate": 3.3993322605043615e-06, "loss": 1.298, "step": 21275 }, { "epoch": 0.4, "learning_rate": 3.39918972013059e-06, "loss": 1.127, "step": 21276 }, { "epoch": 0.4, "learning_rate": 3.3990471763992714e-06, "loss": 0.857, "step": 21277 }, { "epoch": 0.4, "learning_rate": 3.3989046293109385e-06, "loss": 0.7549, "step": 21278 }, { "epoch": 0.4, "learning_rate": 3.398762078866123e-06, "loss": 1.106, "step": 21279 }, { "epoch": 0.4, "learning_rate": 3.3986195250653574e-06, "loss": 1.124, "step": 21280 }, { "epoch": 0.4, "learning_rate": 3.398476967909174e-06, "loss": 1.0177, "step": 21281 }, { "epoch": 0.4, "learning_rate": 3.398334407398105e-06, "loss": 0.9393, "step": 21282 }, { "epoch": 0.4, "learning_rate": 3.3981918435326826e-06, "loss": 0.8764, "step": 21283 }, { "epoch": 0.4, "learning_rate": 3.3980492763134402e-06, "loss": 0.8651, "step": 21284 }, { "epoch": 0.4, "learning_rate": 3.3979067057409092e-06, "loss": 1.0441, "step": 21285 }, { "epoch": 0.4, "learning_rate": 3.397764131815622e-06, "loss": 0.8322, "step": 21286 }, { "epoch": 0.4, "learning_rate": 3.3976215545381115e-06, "loss": 1.166, "step": 21287 }, { "epoch": 0.4, "learning_rate": 3.3974789739089082e-06, "loss": 0.9644, "step": 21288 }, { "epoch": 0.4, "learning_rate": 3.3973363899285466e-06, "loss": 0.9061, "step": 21289 }, { "epoch": 0.4, "learning_rate": 3.3971938025975593e-06, "loss": 0.9486, "step": 21290 }, { "epoch": 0.4, "learning_rate": 3.3970512119164767e-06, "loss": 0.8575, "step": 21291 }, { "epoch": 0.4, "learning_rate": 3.396908617885833e-06, "loss": 0.837, "step": 21292 }, { "epoch": 0.4, "learning_rate": 3.3967660205061604e-06, "loss": 0.9392, "step": 21293 }, { "epoch": 0.4, "learning_rate": 3.39662341977799e-06, "loss": 1.011, "step": 21294 }, { "epoch": 0.4, "learning_rate": 3.3964808157018557e-06, "loss": 0.6971, "step": 21295 }, { "epoch": 0.4, "learning_rate": 3.39633820827829e-06, "loss": 0.7154, "step": 21296 }, { "epoch": 0.4, "learning_rate": 3.3961955975078236e-06, "loss": 1.0184, "step": 21297 }, { "epoch": 0.4, "learning_rate": 3.3960529833909915e-06, "loss": 0.9243, "step": 21298 }, { "epoch": 0.4, "learning_rate": 3.395910365928325e-06, "loss": 1.1584, "step": 21299 }, { "epoch": 0.4, "learning_rate": 3.3957677451203566e-06, "loss": 0.9921, "step": 21300 }, { "epoch": 0.4, "learning_rate": 3.3956251209676185e-06, "loss": 0.9787, "step": 21301 }, { "epoch": 0.4, "learning_rate": 3.395482493470643e-06, "loss": 0.8217, "step": 21302 }, { "epoch": 0.4, "learning_rate": 3.3953398626299645e-06, "loss": 0.9998, "step": 21303 }, { "epoch": 0.4, "learning_rate": 3.395197228446114e-06, "loss": 0.8183, "step": 21304 }, { "epoch": 0.4, "learning_rate": 3.3950545909196247e-06, "loss": 1.1481, "step": 21305 }, { "epoch": 0.4, "learning_rate": 3.3949119500510285e-06, "loss": 0.918, "step": 21306 }, { "epoch": 0.4, "learning_rate": 3.3947693058408594e-06, "loss": 1.1269, "step": 21307 }, { "epoch": 0.4, "learning_rate": 3.394626658289649e-06, "loss": 1.1013, "step": 21308 }, { "epoch": 0.4, "learning_rate": 3.394484007397929e-06, "loss": 1.0292, "step": 21309 }, { "epoch": 0.4, "learning_rate": 3.3943413531662334e-06, "loss": 0.7715, "step": 21310 }, { "epoch": 0.4, "learning_rate": 3.3941986955950958e-06, "loss": 0.9147, "step": 21311 }, { "epoch": 0.4, "learning_rate": 3.3940560346850466e-06, "loss": 1.2757, "step": 21312 }, { "epoch": 0.4, "learning_rate": 3.39391337043662e-06, "loss": 1.0537, "step": 21313 }, { "epoch": 0.4, "learning_rate": 3.3937707028503485e-06, "loss": 1.0168, "step": 21314 }, { "epoch": 0.4, "learning_rate": 3.393628031926764e-06, "loss": 0.9827, "step": 21315 }, { "epoch": 0.4, "learning_rate": 3.3934853576664e-06, "loss": 0.8188, "step": 21316 }, { "epoch": 0.4, "learning_rate": 3.3933426800697887e-06, "loss": 0.9946, "step": 21317 }, { "epoch": 0.4, "learning_rate": 3.393199999137464e-06, "loss": 0.8735, "step": 21318 }, { "epoch": 0.4, "learning_rate": 3.3930573148699576e-06, "loss": 1.1107, "step": 21319 }, { "epoch": 0.4, "learning_rate": 3.3929146272678026e-06, "loss": 0.8332, "step": 21320 }, { "epoch": 0.4, "learning_rate": 3.392771936331532e-06, "loss": 0.9238, "step": 21321 }, { "epoch": 0.4, "learning_rate": 3.392629242061678e-06, "loss": 1.0861, "step": 21322 }, { "epoch": 0.4, "learning_rate": 3.392486544458774e-06, "loss": 0.9523, "step": 21323 }, { "epoch": 0.4, "learning_rate": 3.3923438435233525e-06, "loss": 0.9992, "step": 21324 }, { "epoch": 0.4, "learning_rate": 3.392201139255946e-06, "loss": 0.9113, "step": 21325 }, { "epoch": 0.4, "learning_rate": 3.3920584316570885e-06, "loss": 0.944, "step": 21326 }, { "epoch": 0.4, "learning_rate": 3.391915720727312e-06, "loss": 0.8629, "step": 21327 }, { "epoch": 0.4, "learning_rate": 3.3917730064671497e-06, "loss": 0.8663, "step": 21328 }, { "epoch": 0.4, "learning_rate": 3.391630288877134e-06, "loss": 0.9668, "step": 21329 }, { "epoch": 0.4, "learning_rate": 3.3914875679577973e-06, "loss": 1.1315, "step": 21330 }, { "epoch": 0.4, "learning_rate": 3.3913448437096745e-06, "loss": 1.0258, "step": 21331 }, { "epoch": 0.4, "learning_rate": 3.3912021161332974e-06, "loss": 0.9969, "step": 21332 }, { "epoch": 0.4, "learning_rate": 3.3910593852291986e-06, "loss": 0.877, "step": 21333 }, { "epoch": 0.4, "learning_rate": 3.390916650997911e-06, "loss": 0.9905, "step": 21334 }, { "epoch": 0.4, "learning_rate": 3.390773913439969e-06, "loss": 0.8735, "step": 21335 }, { "epoch": 0.4, "learning_rate": 3.3906311725559037e-06, "loss": 0.8148, "step": 21336 }, { "epoch": 0.4, "learning_rate": 3.390488428346249e-06, "loss": 1.0614, "step": 21337 }, { "epoch": 0.4, "learning_rate": 3.390345680811538e-06, "loss": 1.0314, "step": 21338 }, { "epoch": 0.4, "learning_rate": 3.3902029299523036e-06, "loss": 0.9491, "step": 21339 }, { "epoch": 0.4, "learning_rate": 3.390060175769079e-06, "loss": 0.9957, "step": 21340 }, { "epoch": 0.4, "learning_rate": 3.389917418262396e-06, "loss": 0.9058, "step": 21341 }, { "epoch": 0.4, "learning_rate": 3.3897746574327894e-06, "loss": 0.99, "step": 21342 }, { "epoch": 0.4, "learning_rate": 3.3896318932807915e-06, "loss": 1.0571, "step": 21343 }, { "epoch": 0.4, "learning_rate": 3.389489125806935e-06, "loss": 1.0501, "step": 21344 }, { "epoch": 0.4, "learning_rate": 3.3893463550117534e-06, "loss": 0.9026, "step": 21345 }, { "epoch": 0.4, "learning_rate": 3.38920358089578e-06, "loss": 0.7733, "step": 21346 }, { "epoch": 0.4, "learning_rate": 3.3890608034595485e-06, "loss": 0.9132, "step": 21347 }, { "epoch": 0.4, "learning_rate": 3.3889180227035903e-06, "loss": 1.032, "step": 21348 }, { "epoch": 0.4, "learning_rate": 3.388775238628439e-06, "loss": 1.2426, "step": 21349 }, { "epoch": 0.4, "learning_rate": 3.388632451234629e-06, "loss": 1.2142, "step": 21350 }, { "epoch": 0.4, "learning_rate": 3.3884896605226926e-06, "loss": 0.8969, "step": 21351 }, { "epoch": 0.4, "learning_rate": 3.3883468664931623e-06, "loss": 0.8818, "step": 21352 }, { "epoch": 0.4, "learning_rate": 3.3882040691465734e-06, "loss": 1.0755, "step": 21353 }, { "epoch": 0.4, "learning_rate": 3.3880612684834567e-06, "loss": 0.8611, "step": 21354 }, { "epoch": 0.4, "learning_rate": 3.3879184645043466e-06, "loss": 1.0219, "step": 21355 }, { "epoch": 0.4, "learning_rate": 3.387775657209777e-06, "loss": 1.0732, "step": 21356 }, { "epoch": 0.4, "learning_rate": 3.3876328466002794e-06, "loss": 0.892, "step": 21357 }, { "epoch": 0.4, "learning_rate": 3.387490032676388e-06, "loss": 0.9804, "step": 21358 }, { "epoch": 0.4, "learning_rate": 3.387347215438636e-06, "loss": 0.8491, "step": 21359 }, { "epoch": 0.4, "learning_rate": 3.3872043948875567e-06, "loss": 0.8491, "step": 21360 }, { "epoch": 0.4, "learning_rate": 3.3870615710236837e-06, "loss": 0.9532, "step": 21361 }, { "epoch": 0.4, "learning_rate": 3.3869187438475505e-06, "loss": 1.1873, "step": 21362 }, { "epoch": 0.4, "learning_rate": 3.386775913359689e-06, "loss": 1.1092, "step": 21363 }, { "epoch": 0.4, "learning_rate": 3.386633079560634e-06, "loss": 0.9825, "step": 21364 }, { "epoch": 0.4, "learning_rate": 3.3864902424509176e-06, "loss": 1.084, "step": 21365 }, { "epoch": 0.4, "learning_rate": 3.3863474020310737e-06, "loss": 0.785, "step": 21366 }, { "epoch": 0.4, "learning_rate": 3.3862045583016366e-06, "loss": 0.89, "step": 21367 }, { "epoch": 0.4, "learning_rate": 3.386061711263139e-06, "loss": 0.9659, "step": 21368 }, { "epoch": 0.4, "learning_rate": 3.385918860916114e-06, "loss": 1.1542, "step": 21369 }, { "epoch": 0.4, "learning_rate": 3.3857760072610947e-06, "loss": 0.8429, "step": 21370 }, { "epoch": 0.4, "learning_rate": 3.385633150298615e-06, "loss": 1.0099, "step": 21371 }, { "epoch": 0.4, "learning_rate": 3.3854902900292076e-06, "loss": 0.8085, "step": 21372 }, { "epoch": 0.4, "learning_rate": 3.3853474264534077e-06, "loss": 0.9704, "step": 21373 }, { "epoch": 0.4, "learning_rate": 3.3852045595717476e-06, "loss": 0.9455, "step": 21374 }, { "epoch": 0.4, "learning_rate": 3.3850616893847603e-06, "loss": 1.0429, "step": 21375 }, { "epoch": 0.4, "learning_rate": 3.3849188158929804e-06, "loss": 0.9197, "step": 21376 }, { "epoch": 0.4, "learning_rate": 3.3847759390969402e-06, "loss": 0.9773, "step": 21377 }, { "epoch": 0.4, "learning_rate": 3.384633058997174e-06, "loss": 0.9437, "step": 21378 }, { "epoch": 0.4, "learning_rate": 3.384490175594215e-06, "loss": 0.8477, "step": 21379 }, { "epoch": 0.4, "learning_rate": 3.3843472888885964e-06, "loss": 0.7936, "step": 21380 }, { "epoch": 0.4, "learning_rate": 3.3842043988808526e-06, "loss": 1.0211, "step": 21381 }, { "epoch": 0.4, "learning_rate": 3.3840615055715164e-06, "loss": 1.0389, "step": 21382 }, { "epoch": 0.4, "learning_rate": 3.3839186089611224e-06, "loss": 0.735, "step": 21383 }, { "epoch": 0.4, "learning_rate": 3.383775709050203e-06, "loss": 0.8912, "step": 21384 }, { "epoch": 0.4, "learning_rate": 3.383632805839292e-06, "loss": 0.8429, "step": 21385 }, { "epoch": 0.4, "learning_rate": 3.3834898993289234e-06, "loss": 1.0193, "step": 21386 }, { "epoch": 0.4, "learning_rate": 3.38334698951963e-06, "loss": 1.1431, "step": 21387 }, { "epoch": 0.4, "learning_rate": 3.383204076411947e-06, "loss": 0.975, "step": 21388 }, { "epoch": 0.4, "learning_rate": 3.3830611600064065e-06, "loss": 0.8437, "step": 21389 }, { "epoch": 0.4, "learning_rate": 3.382918240303543e-06, "loss": 0.8227, "step": 21390 }, { "epoch": 0.4, "learning_rate": 3.3827753173038898e-06, "loss": 0.9968, "step": 21391 }, { "epoch": 0.4, "learning_rate": 3.3826323910079806e-06, "loss": 0.7974, "step": 21392 }, { "epoch": 0.4, "learning_rate": 3.3824894614163485e-06, "loss": 1.1095, "step": 21393 }, { "epoch": 0.4, "learning_rate": 3.382346528529528e-06, "loss": 0.9919, "step": 21394 }, { "epoch": 0.4, "learning_rate": 3.3822035923480534e-06, "loss": 1.0182, "step": 21395 }, { "epoch": 0.4, "learning_rate": 3.382060652872457e-06, "loss": 0.8804, "step": 21396 }, { "epoch": 0.4, "learning_rate": 3.381917710103274e-06, "loss": 0.8821, "step": 21397 }, { "epoch": 0.4, "learning_rate": 3.3817747640410365e-06, "loss": 0.8115, "step": 21398 }, { "epoch": 0.4, "learning_rate": 3.381631814686279e-06, "loss": 0.9114, "step": 21399 }, { "epoch": 0.4, "learning_rate": 3.3814888620395355e-06, "loss": 1.2437, "step": 21400 }, { "epoch": 0.4, "learning_rate": 3.38134590610134e-06, "loss": 1.033, "step": 21401 }, { "epoch": 0.4, "learning_rate": 3.381202946872225e-06, "loss": 0.8663, "step": 21402 }, { "epoch": 0.4, "learning_rate": 3.3810599843527263e-06, "loss": 0.8842, "step": 21403 }, { "epoch": 0.4, "learning_rate": 3.380917018543376e-06, "loss": 0.7686, "step": 21404 }, { "epoch": 0.4, "learning_rate": 3.3807740494447085e-06, "loss": 0.9579, "step": 21405 }, { "epoch": 0.4, "learning_rate": 3.380631077057258e-06, "loss": 1.0472, "step": 21406 }, { "epoch": 0.4, "learning_rate": 3.380488101381558e-06, "loss": 0.8182, "step": 21407 }, { "epoch": 0.4, "learning_rate": 3.380345122418142e-06, "loss": 0.7984, "step": 21408 }, { "epoch": 0.4, "learning_rate": 3.380202140167545e-06, "loss": 0.9238, "step": 21409 }, { "epoch": 0.4, "learning_rate": 3.3800591546302996e-06, "loss": 0.8906, "step": 21410 }, { "epoch": 0.4, "learning_rate": 3.379916165806941e-06, "loss": 0.8161, "step": 21411 }, { "epoch": 0.4, "learning_rate": 3.3797731736980024e-06, "loss": 1.1198, "step": 21412 }, { "epoch": 0.4, "learning_rate": 3.379630178304017e-06, "loss": 1.054, "step": 21413 }, { "epoch": 0.4, "learning_rate": 3.379487179625519e-06, "loss": 1.0184, "step": 21414 }, { "epoch": 0.4, "learning_rate": 3.3793441776630443e-06, "loss": 0.8517, "step": 21415 }, { "epoch": 0.4, "learning_rate": 3.3792011724171245e-06, "loss": 0.8643, "step": 21416 }, { "epoch": 0.4, "learning_rate": 3.379058163888295e-06, "loss": 0.9225, "step": 21417 }, { "epoch": 0.4, "learning_rate": 3.378915152077089e-06, "loss": 0.9989, "step": 21418 }, { "epoch": 0.4, "learning_rate": 3.378772136984041e-06, "loss": 1.0953, "step": 21419 }, { "epoch": 0.4, "learning_rate": 3.3786291186096843e-06, "loss": 1.1044, "step": 21420 }, { "epoch": 0.4, "learning_rate": 3.3784860969545535e-06, "loss": 0.8197, "step": 21421 }, { "epoch": 0.4, "learning_rate": 3.378343072019183e-06, "loss": 1.0023, "step": 21422 }, { "epoch": 0.4, "learning_rate": 3.3782000438041057e-06, "loss": 0.8707, "step": 21423 }, { "epoch": 0.4, "learning_rate": 3.378057012309857e-06, "loss": 0.8565, "step": 21424 }, { "epoch": 0.4, "learning_rate": 3.3779139775369703e-06, "loss": 1.0457, "step": 21425 }, { "epoch": 0.4, "learning_rate": 3.377770939485979e-06, "loss": 1.0134, "step": 21426 }, { "epoch": 0.4, "learning_rate": 3.3776278981574184e-06, "loss": 1.0464, "step": 21427 }, { "epoch": 0.4, "learning_rate": 3.3774848535518223e-06, "loss": 0.9573, "step": 21428 }, { "epoch": 0.4, "learning_rate": 3.377341805669725e-06, "loss": 0.8796, "step": 21429 }, { "epoch": 0.4, "learning_rate": 3.3771987545116604e-06, "loss": 0.9117, "step": 21430 }, { "epoch": 0.4, "learning_rate": 3.3770557000781613e-06, "loss": 1.1222, "step": 21431 }, { "epoch": 0.4, "learning_rate": 3.376912642369764e-06, "loss": 1.0859, "step": 21432 }, { "epoch": 0.4, "learning_rate": 3.376769581387002e-06, "loss": 0.9642, "step": 21433 }, { "epoch": 0.4, "learning_rate": 3.3766265171304087e-06, "loss": 0.957, "step": 21434 }, { "epoch": 0.4, "learning_rate": 3.376483449600518e-06, "loss": 0.8457, "step": 21435 }, { "epoch": 0.4, "learning_rate": 3.3763403787978664e-06, "loss": 0.955, "step": 21436 }, { "epoch": 0.4, "learning_rate": 3.3761973047229866e-06, "loss": 1.0077, "step": 21437 }, { "epoch": 0.4, "learning_rate": 3.3760542273764124e-06, "loss": 0.8686, "step": 21438 }, { "epoch": 0.4, "learning_rate": 3.375911146758679e-06, "loss": 0.82, "step": 21439 }, { "epoch": 0.4, "learning_rate": 3.3757680628703203e-06, "loss": 0.9267, "step": 21440 }, { "epoch": 0.4, "learning_rate": 3.3756249757118698e-06, "loss": 0.9179, "step": 21441 }, { "epoch": 0.4, "learning_rate": 3.375481885283863e-06, "loss": 0.7462, "step": 21442 }, { "epoch": 0.4, "learning_rate": 3.3753387915868336e-06, "loss": 0.9265, "step": 21443 }, { "epoch": 0.4, "learning_rate": 3.375195694621316e-06, "loss": 1.0139, "step": 21444 }, { "epoch": 0.4, "learning_rate": 3.375052594387845e-06, "loss": 0.8679, "step": 21445 }, { "epoch": 0.4, "learning_rate": 3.374909490886954e-06, "loss": 1.0208, "step": 21446 }, { "epoch": 0.4, "learning_rate": 3.3747663841191774e-06, "loss": 0.8564, "step": 21447 }, { "epoch": 0.4, "learning_rate": 3.3746232740850504e-06, "loss": 0.8204, "step": 21448 }, { "epoch": 0.4, "learning_rate": 3.3744801607851064e-06, "loss": 1.0273, "step": 21449 }, { "epoch": 0.4, "learning_rate": 3.374337044219881e-06, "loss": 0.963, "step": 21450 }, { "epoch": 0.4, "learning_rate": 3.3741939243899073e-06, "loss": 0.919, "step": 21451 }, { "epoch": 0.4, "learning_rate": 3.3740508012957205e-06, "loss": 0.7308, "step": 21452 }, { "epoch": 0.4, "learning_rate": 3.3739076749378553e-06, "loss": 0.9092, "step": 21453 }, { "epoch": 0.4, "learning_rate": 3.3737645453168456e-06, "loss": 0.8094, "step": 21454 }, { "epoch": 0.4, "learning_rate": 3.373621412433225e-06, "loss": 0.8245, "step": 21455 }, { "epoch": 0.4, "learning_rate": 3.3734782762875282e-06, "loss": 1.0535, "step": 21456 }, { "epoch": 0.4, "learning_rate": 3.3733351368802925e-06, "loss": 0.9785, "step": 21457 }, { "epoch": 0.4, "learning_rate": 3.373191994212049e-06, "loss": 0.8825, "step": 21458 }, { "epoch": 0.4, "learning_rate": 3.3730488482833333e-06, "loss": 0.9618, "step": 21459 }, { "epoch": 0.4, "learning_rate": 3.372905699094681e-06, "loss": 0.8707, "step": 21460 }, { "epoch": 0.4, "learning_rate": 3.372762546646624e-06, "loss": 1.0746, "step": 21461 }, { "epoch": 0.4, "learning_rate": 3.372619390939699e-06, "loss": 0.9679, "step": 21462 }, { "epoch": 0.4, "learning_rate": 3.3724762319744396e-06, "loss": 1.0603, "step": 21463 }, { "epoch": 0.4, "learning_rate": 3.372333069751381e-06, "loss": 0.9587, "step": 21464 }, { "epoch": 0.4, "learning_rate": 3.372189904271058e-06, "loss": 1.0601, "step": 21465 }, { "epoch": 0.4, "learning_rate": 3.3720467355340046e-06, "loss": 0.7917, "step": 21466 }, { "epoch": 0.41, "learning_rate": 3.371903563540755e-06, "loss": 0.86, "step": 21467 }, { "epoch": 0.41, "learning_rate": 3.3717603882918443e-06, "loss": 0.8624, "step": 21468 }, { "epoch": 0.41, "learning_rate": 3.371617209787807e-06, "loss": 0.9127, "step": 21469 }, { "epoch": 0.41, "learning_rate": 3.371474028029178e-06, "loss": 0.973, "step": 21470 }, { "epoch": 0.41, "learning_rate": 3.371330843016491e-06, "loss": 1.0121, "step": 21471 }, { "epoch": 0.41, "learning_rate": 3.3711876547502826e-06, "loss": 0.9093, "step": 21472 }, { "epoch": 0.41, "learning_rate": 3.371044463231085e-06, "loss": 0.9545, "step": 21473 }, { "epoch": 0.41, "learning_rate": 3.3709012684594346e-06, "loss": 0.9182, "step": 21474 }, { "epoch": 0.41, "learning_rate": 3.370758070435866e-06, "loss": 0.8304, "step": 21475 }, { "epoch": 0.41, "learning_rate": 3.370614869160913e-06, "loss": 0.9833, "step": 21476 }, { "epoch": 0.41, "learning_rate": 3.37047166463511e-06, "loss": 0.8492, "step": 21477 }, { "epoch": 0.41, "learning_rate": 3.370328456858994e-06, "loss": 0.9555, "step": 21478 }, { "epoch": 0.41, "learning_rate": 3.370185245833097e-06, "loss": 0.853, "step": 21479 }, { "epoch": 0.41, "learning_rate": 3.370042031557955e-06, "loss": 1.1298, "step": 21480 }, { "epoch": 0.41, "learning_rate": 3.369898814034104e-06, "loss": 1.0029, "step": 21481 }, { "epoch": 0.41, "learning_rate": 3.3697555932620767e-06, "loss": 0.8171, "step": 21482 }, { "epoch": 0.41, "learning_rate": 3.3696123692424087e-06, "loss": 0.9099, "step": 21483 }, { "epoch": 0.41, "learning_rate": 3.3694691419756344e-06, "loss": 0.8992, "step": 21484 }, { "epoch": 0.41, "learning_rate": 3.369325911462289e-06, "loss": 0.8805, "step": 21485 }, { "epoch": 0.41, "learning_rate": 3.3691826777029078e-06, "loss": 1.143, "step": 21486 }, { "epoch": 0.41, "learning_rate": 3.3690394406980252e-06, "loss": 1.002, "step": 21487 }, { "epoch": 0.41, "learning_rate": 3.3688962004481755e-06, "loss": 0.8809, "step": 21488 }, { "epoch": 0.41, "learning_rate": 3.3687529569538945e-06, "loss": 0.8413, "step": 21489 }, { "epoch": 0.41, "learning_rate": 3.368609710215716e-06, "loss": 0.8883, "step": 21490 }, { "epoch": 0.41, "learning_rate": 3.368466460234176e-06, "loss": 1.0541, "step": 21491 }, { "epoch": 0.41, "learning_rate": 3.3683232070098082e-06, "loss": 1.0422, "step": 21492 }, { "epoch": 0.41, "learning_rate": 3.3681799505431494e-06, "loss": 0.9935, "step": 21493 }, { "epoch": 0.41, "learning_rate": 3.3680366908347324e-06, "loss": 1.0517, "step": 21494 }, { "epoch": 0.41, "learning_rate": 3.3678934278850935e-06, "loss": 0.6992, "step": 21495 }, { "epoch": 0.41, "learning_rate": 3.3677501616947666e-06, "loss": 0.9029, "step": 21496 }, { "epoch": 0.41, "learning_rate": 3.3676068922642867e-06, "loss": 1.0557, "step": 21497 }, { "epoch": 0.41, "learning_rate": 3.36746361959419e-06, "loss": 0.7659, "step": 21498 }, { "epoch": 0.41, "learning_rate": 3.367320343685011e-06, "loss": 0.9133, "step": 21499 }, { "epoch": 0.41, "learning_rate": 3.3671770645372844e-06, "loss": 1.1292, "step": 21500 }, { "epoch": 0.41, "learning_rate": 3.367033782151545e-06, "loss": 0.806, "step": 21501 }, { "epoch": 0.41, "learning_rate": 3.3668904965283285e-06, "loss": 0.8436, "step": 21502 }, { "epoch": 0.41, "learning_rate": 3.3667472076681685e-06, "loss": 0.9048, "step": 21503 }, { "epoch": 0.41, "learning_rate": 3.366603915571601e-06, "loss": 0.8616, "step": 21504 }, { "epoch": 0.41, "learning_rate": 3.366460620239162e-06, "loss": 1.0258, "step": 21505 }, { "epoch": 0.41, "learning_rate": 3.3663173216713853e-06, "loss": 1.0922, "step": 21506 }, { "epoch": 0.41, "learning_rate": 3.366174019868806e-06, "loss": 0.8485, "step": 21507 }, { "epoch": 0.41, "learning_rate": 3.36603071483196e-06, "loss": 0.7042, "step": 21508 }, { "epoch": 0.41, "learning_rate": 3.3658874065613813e-06, "loss": 0.8521, "step": 21509 }, { "epoch": 0.41, "learning_rate": 3.3657440950576052e-06, "loss": 0.9759, "step": 21510 }, { "epoch": 0.41, "learning_rate": 3.3656007803211677e-06, "loss": 1.0171, "step": 21511 }, { "epoch": 0.41, "learning_rate": 3.3654574623526036e-06, "loss": 1.129, "step": 21512 }, { "epoch": 0.41, "learning_rate": 3.3653141411524474e-06, "loss": 1.0974, "step": 21513 }, { "epoch": 0.41, "learning_rate": 3.3651708167212354e-06, "loss": 1.0815, "step": 21514 }, { "epoch": 0.41, "learning_rate": 3.365027489059502e-06, "loss": 0.9733, "step": 21515 }, { "epoch": 0.41, "learning_rate": 3.3648841581677825e-06, "loss": 0.8339, "step": 21516 }, { "epoch": 0.41, "learning_rate": 3.364740824046612e-06, "loss": 0.8419, "step": 21517 }, { "epoch": 0.41, "learning_rate": 3.364597486696525e-06, "loss": 1.1284, "step": 21518 }, { "epoch": 0.41, "learning_rate": 3.364454146118058e-06, "loss": 0.8314, "step": 21519 }, { "epoch": 0.41, "learning_rate": 3.364310802311746e-06, "loss": 0.8837, "step": 21520 }, { "epoch": 0.41, "learning_rate": 3.3641674552781234e-06, "loss": 0.8583, "step": 21521 }, { "epoch": 0.41, "learning_rate": 3.364024105017727e-06, "loss": 0.9289, "step": 21522 }, { "epoch": 0.41, "learning_rate": 3.36388075153109e-06, "loss": 0.739, "step": 21523 }, { "epoch": 0.41, "learning_rate": 3.3637373948187492e-06, "loss": 0.9166, "step": 21524 }, { "epoch": 0.41, "learning_rate": 3.3635940348812396e-06, "loss": 1.1028, "step": 21525 }, { "epoch": 0.41, "learning_rate": 3.363450671719096e-06, "loss": 0.7104, "step": 21526 }, { "epoch": 0.41, "learning_rate": 3.363307305332854e-06, "loss": 1.1512, "step": 21527 }, { "epoch": 0.41, "learning_rate": 3.36316393572305e-06, "loss": 0.8656, "step": 21528 }, { "epoch": 0.41, "learning_rate": 3.3630205628902173e-06, "loss": 0.9299, "step": 21529 }, { "epoch": 0.41, "learning_rate": 3.3628771868348925e-06, "loss": 0.8934, "step": 21530 }, { "epoch": 0.41, "learning_rate": 3.362733807557611e-06, "loss": 1.1529, "step": 21531 }, { "epoch": 0.41, "learning_rate": 3.3625904250589074e-06, "loss": 0.6049, "step": 21532 }, { "epoch": 0.41, "learning_rate": 3.362447039339318e-06, "loss": 1.0148, "step": 21533 }, { "epoch": 0.41, "learning_rate": 3.3623036503993776e-06, "loss": 0.8097, "step": 21534 }, { "epoch": 0.41, "learning_rate": 3.3621602582396225e-06, "loss": 0.9566, "step": 21535 }, { "epoch": 0.41, "learning_rate": 3.3620168628605865e-06, "loss": 0.9246, "step": 21536 }, { "epoch": 0.41, "learning_rate": 3.361873464262807e-06, "loss": 1.0936, "step": 21537 }, { "epoch": 0.41, "learning_rate": 3.3617300624468174e-06, "loss": 1.0132, "step": 21538 }, { "epoch": 0.41, "learning_rate": 3.3615866574131538e-06, "loss": 0.8963, "step": 21539 }, { "epoch": 0.41, "learning_rate": 3.361443249162353e-06, "loss": 0.8442, "step": 21540 }, { "epoch": 0.41, "learning_rate": 3.3612998376949495e-06, "loss": 0.9308, "step": 21541 }, { "epoch": 0.41, "learning_rate": 3.3611564230114787e-06, "loss": 0.9451, "step": 21542 }, { "epoch": 0.41, "learning_rate": 3.3610130051124764e-06, "loss": 1.011, "step": 21543 }, { "epoch": 0.41, "learning_rate": 3.360869583998477e-06, "loss": 1.1835, "step": 21544 }, { "epoch": 0.41, "learning_rate": 3.360726159670018e-06, "loss": 0.9428, "step": 21545 }, { "epoch": 0.41, "learning_rate": 3.3605827321276336e-06, "loss": 0.9921, "step": 21546 }, { "epoch": 0.41, "learning_rate": 3.3604393013718595e-06, "loss": 0.8172, "step": 21547 }, { "epoch": 0.41, "learning_rate": 3.3602958674032315e-06, "loss": 0.9738, "step": 21548 }, { "epoch": 0.41, "learning_rate": 3.3601524302222856e-06, "loss": 0.9493, "step": 21549 }, { "epoch": 0.41, "learning_rate": 3.3600089898295564e-06, "loss": 1.2451, "step": 21550 }, { "epoch": 0.41, "learning_rate": 3.3598655462255797e-06, "loss": 0.9399, "step": 21551 }, { "epoch": 0.41, "learning_rate": 3.3597220994108915e-06, "loss": 0.8876, "step": 21552 }, { "epoch": 0.41, "learning_rate": 3.359578649386027e-06, "loss": 0.899, "step": 21553 }, { "epoch": 0.41, "learning_rate": 3.359435196151523e-06, "loss": 0.8877, "step": 21554 }, { "epoch": 0.41, "learning_rate": 3.359291739707915e-06, "loss": 0.8694, "step": 21555 }, { "epoch": 0.41, "learning_rate": 3.359148280055737e-06, "loss": 1.1115, "step": 21556 }, { "epoch": 0.41, "learning_rate": 3.3590048171955252e-06, "loss": 0.9773, "step": 21557 }, { "epoch": 0.41, "learning_rate": 3.3588613511278167e-06, "loss": 0.9713, "step": 21558 }, { "epoch": 0.41, "learning_rate": 3.3587178818531457e-06, "loss": 1.0133, "step": 21559 }, { "epoch": 0.41, "learning_rate": 3.358574409372048e-06, "loss": 0.8086, "step": 21560 }, { "epoch": 0.41, "learning_rate": 3.3584309336850605e-06, "loss": 0.7862, "step": 21561 }, { "epoch": 0.41, "learning_rate": 3.3582874547927183e-06, "loss": 1.0772, "step": 21562 }, { "epoch": 0.41, "learning_rate": 3.3581439726955567e-06, "loss": 0.8194, "step": 21563 }, { "epoch": 0.41, "learning_rate": 3.3580004873941126e-06, "loss": 0.9482, "step": 21564 }, { "epoch": 0.41, "learning_rate": 3.3578569988889206e-06, "loss": 1.0244, "step": 21565 }, { "epoch": 0.41, "learning_rate": 3.3577135071805163e-06, "loss": 0.795, "step": 21566 }, { "epoch": 0.41, "learning_rate": 3.357570012269436e-06, "loss": 0.9868, "step": 21567 }, { "epoch": 0.41, "learning_rate": 3.357426514156216e-06, "loss": 0.9751, "step": 21568 }, { "epoch": 0.41, "learning_rate": 3.3572830128413915e-06, "loss": 1.0603, "step": 21569 }, { "epoch": 0.41, "learning_rate": 3.3571395083254993e-06, "loss": 0.8653, "step": 21570 }, { "epoch": 0.41, "learning_rate": 3.3569960006090735e-06, "loss": 0.9789, "step": 21571 }, { "epoch": 0.41, "learning_rate": 3.3568524896926514e-06, "loss": 0.8994, "step": 21572 }, { "epoch": 0.41, "learning_rate": 3.356708975576768e-06, "loss": 0.6754, "step": 21573 }, { "epoch": 0.41, "learning_rate": 3.3565654582619594e-06, "loss": 1.1152, "step": 21574 }, { "epoch": 0.41, "learning_rate": 3.3564219377487615e-06, "loss": 1.1752, "step": 21575 }, { "epoch": 0.41, "learning_rate": 3.356278414037712e-06, "loss": 1.0742, "step": 21576 }, { "epoch": 0.41, "learning_rate": 3.3561348871293436e-06, "loss": 0.8884, "step": 21577 }, { "epoch": 0.41, "learning_rate": 3.3559913570241942e-06, "loss": 0.8455, "step": 21578 }, { "epoch": 0.41, "learning_rate": 3.3558478237228e-06, "loss": 0.8307, "step": 21579 }, { "epoch": 0.41, "learning_rate": 3.355704287225695e-06, "loss": 0.7482, "step": 21580 }, { "epoch": 0.41, "learning_rate": 3.355560747533416e-06, "loss": 1.1385, "step": 21581 }, { "epoch": 0.41, "learning_rate": 3.355417204646501e-06, "loss": 0.9325, "step": 21582 }, { "epoch": 0.41, "learning_rate": 3.3552736585654837e-06, "loss": 0.8679, "step": 21583 }, { "epoch": 0.41, "learning_rate": 3.3551301092909013e-06, "loss": 0.8497, "step": 21584 }, { "epoch": 0.41, "learning_rate": 3.3549865568232885e-06, "loss": 0.7108, "step": 21585 }, { "epoch": 0.41, "learning_rate": 3.3548430011631827e-06, "loss": 0.8094, "step": 21586 }, { "epoch": 0.41, "learning_rate": 3.354699442311119e-06, "loss": 0.9584, "step": 21587 }, { "epoch": 0.41, "learning_rate": 3.3545558802676337e-06, "loss": 1.0522, "step": 21588 }, { "epoch": 0.41, "learning_rate": 3.354412315033263e-06, "loss": 0.8852, "step": 21589 }, { "epoch": 0.41, "learning_rate": 3.3542687466085433e-06, "loss": 0.9163, "step": 21590 }, { "epoch": 0.41, "learning_rate": 3.35412517499401e-06, "loss": 0.8812, "step": 21591 }, { "epoch": 0.41, "learning_rate": 3.3539816001901997e-06, "loss": 0.812, "step": 21592 }, { "epoch": 0.41, "learning_rate": 3.353838022197648e-06, "loss": 1.0247, "step": 21593 }, { "epoch": 0.41, "learning_rate": 3.3536944410168913e-06, "loss": 1.0099, "step": 21594 }, { "epoch": 0.41, "learning_rate": 3.353550856648466e-06, "loss": 0.9732, "step": 21595 }, { "epoch": 0.41, "learning_rate": 3.3534072690929076e-06, "loss": 1.0567, "step": 21596 }, { "epoch": 0.41, "learning_rate": 3.3532636783507533e-06, "loss": 0.6758, "step": 21597 }, { "epoch": 0.41, "learning_rate": 3.3531200844225383e-06, "loss": 0.8008, "step": 21598 }, { "epoch": 0.41, "learning_rate": 3.3529764873087984e-06, "loss": 0.9711, "step": 21599 }, { "epoch": 0.41, "learning_rate": 3.352832887010071e-06, "loss": 1.1118, "step": 21600 }, { "epoch": 0.41, "learning_rate": 3.352689283526892e-06, "loss": 0.9257, "step": 21601 }, { "epoch": 0.41, "learning_rate": 3.3525456768597962e-06, "loss": 0.9573, "step": 21602 }, { "epoch": 0.41, "learning_rate": 3.3524020670093227e-06, "loss": 0.9122, "step": 21603 }, { "epoch": 0.41, "learning_rate": 3.352258453976005e-06, "loss": 0.9008, "step": 21604 }, { "epoch": 0.41, "learning_rate": 3.35211483776038e-06, "loss": 1.1475, "step": 21605 }, { "epoch": 0.41, "learning_rate": 3.3519712183629856e-06, "loss": 1.0176, "step": 21606 }, { "epoch": 0.41, "learning_rate": 3.351827595784356e-06, "loss": 0.893, "step": 21607 }, { "epoch": 0.41, "learning_rate": 3.3516839700250282e-06, "loss": 0.9337, "step": 21608 }, { "epoch": 0.41, "learning_rate": 3.3515403410855386e-06, "loss": 0.8884, "step": 21609 }, { "epoch": 0.41, "learning_rate": 3.3513967089664236e-06, "loss": 1.1031, "step": 21610 }, { "epoch": 0.41, "learning_rate": 3.351253073668219e-06, "loss": 0.7648, "step": 21611 }, { "epoch": 0.41, "learning_rate": 3.351109435191462e-06, "loss": 1.0256, "step": 21612 }, { "epoch": 0.41, "learning_rate": 3.3509657935366886e-06, "loss": 1.1111, "step": 21613 }, { "epoch": 0.41, "learning_rate": 3.3508221487044346e-06, "loss": 0.8431, "step": 21614 }, { "epoch": 0.41, "learning_rate": 3.350678500695237e-06, "loss": 0.8735, "step": 21615 }, { "epoch": 0.41, "learning_rate": 3.3505348495096314e-06, "loss": 0.9412, "step": 21616 }, { "epoch": 0.41, "learning_rate": 3.350391195148155e-06, "loss": 0.9385, "step": 21617 }, { "epoch": 0.41, "learning_rate": 3.350247537611345e-06, "loss": 1.0154, "step": 21618 }, { "epoch": 0.41, "learning_rate": 3.3501038768997358e-06, "loss": 1.052, "step": 21619 }, { "epoch": 0.41, "learning_rate": 3.3499602130138648e-06, "loss": 0.857, "step": 21620 }, { "epoch": 0.41, "learning_rate": 3.3498165459542685e-06, "loss": 0.8189, "step": 21621 }, { "epoch": 0.41, "learning_rate": 3.3496728757214835e-06, "loss": 0.7963, "step": 21622 }, { "epoch": 0.41, "learning_rate": 3.3495292023160455e-06, "loss": 0.9653, "step": 21623 }, { "epoch": 0.41, "learning_rate": 3.349385525738492e-06, "loss": 1.2509, "step": 21624 }, { "epoch": 0.41, "learning_rate": 3.3492418459893587e-06, "loss": 1.201, "step": 21625 }, { "epoch": 0.41, "learning_rate": 3.3490981630691827e-06, "loss": 0.9883, "step": 21626 }, { "epoch": 0.41, "learning_rate": 3.3489544769785006e-06, "loss": 0.8988, "step": 21627 }, { "epoch": 0.41, "learning_rate": 3.3488107877178476e-06, "loss": 0.8834, "step": 21628 }, { "epoch": 0.41, "learning_rate": 3.3486670952877616e-06, "loss": 0.8566, "step": 21629 }, { "epoch": 0.41, "learning_rate": 3.3485233996887785e-06, "loss": 1.0501, "step": 21630 }, { "epoch": 0.41, "learning_rate": 3.3483797009214347e-06, "loss": 1.093, "step": 21631 }, { "epoch": 0.41, "learning_rate": 3.3482359989862677e-06, "loss": 1.0179, "step": 21632 }, { "epoch": 0.41, "learning_rate": 3.3480922938838133e-06, "loss": 0.8009, "step": 21633 }, { "epoch": 0.41, "learning_rate": 3.347948585614609e-06, "loss": 0.685, "step": 21634 }, { "epoch": 0.41, "learning_rate": 3.3478048741791903e-06, "loss": 0.837, "step": 21635 }, { "epoch": 0.41, "learning_rate": 3.3476611595780928e-06, "loss": 0.7493, "step": 21636 }, { "epoch": 0.41, "learning_rate": 3.3475174418118554e-06, "loss": 1.0485, "step": 21637 }, { "epoch": 0.41, "learning_rate": 3.347373720881015e-06, "loss": 0.8813, "step": 21638 }, { "epoch": 0.41, "learning_rate": 3.3472299967861053e-06, "loss": 0.8138, "step": 21639 }, { "epoch": 0.41, "learning_rate": 3.347086269527666e-06, "loss": 0.8815, "step": 21640 }, { "epoch": 0.41, "learning_rate": 3.3469425391062327e-06, "loss": 0.8079, "step": 21641 }, { "epoch": 0.41, "learning_rate": 3.346798805522341e-06, "loss": 0.8798, "step": 21642 }, { "epoch": 0.41, "learning_rate": 3.346655068776529e-06, "loss": 1.1079, "step": 21643 }, { "epoch": 0.41, "learning_rate": 3.346511328869333e-06, "loss": 0.9506, "step": 21644 }, { "epoch": 0.41, "learning_rate": 3.346367585801289e-06, "loss": 1.0402, "step": 21645 }, { "epoch": 0.41, "learning_rate": 3.3462238395729352e-06, "loss": 0.9761, "step": 21646 }, { "epoch": 0.41, "learning_rate": 3.3460800901848074e-06, "loss": 0.8604, "step": 21647 }, { "epoch": 0.41, "learning_rate": 3.3459363376374423e-06, "loss": 0.9125, "step": 21648 }, { "epoch": 0.41, "learning_rate": 3.345792581931377e-06, "loss": 1.0493, "step": 21649 }, { "epoch": 0.41, "learning_rate": 3.3456488230671477e-06, "loss": 1.1311, "step": 21650 }, { "epoch": 0.41, "learning_rate": 3.3455050610452917e-06, "loss": 1.0364, "step": 21651 }, { "epoch": 0.41, "learning_rate": 3.3453612958663462e-06, "loss": 0.9247, "step": 21652 }, { "epoch": 0.41, "learning_rate": 3.3452175275308473e-06, "loss": 0.8921, "step": 21653 }, { "epoch": 0.41, "learning_rate": 3.345073756039332e-06, "loss": 0.7568, "step": 21654 }, { "epoch": 0.41, "learning_rate": 3.3449299813923374e-06, "loss": 0.8275, "step": 21655 }, { "epoch": 0.41, "learning_rate": 3.3447862035904e-06, "loss": 1.1258, "step": 21656 }, { "epoch": 0.41, "learning_rate": 3.3446424226340563e-06, "loss": 0.9641, "step": 21657 }, { "epoch": 0.41, "learning_rate": 3.3444986385238444e-06, "loss": 0.905, "step": 21658 }, { "epoch": 0.41, "learning_rate": 3.3443548512603008e-06, "loss": 0.7014, "step": 21659 }, { "epoch": 0.41, "learning_rate": 3.3442110608439616e-06, "loss": 0.9144, "step": 21660 }, { "epoch": 0.41, "learning_rate": 3.344067267275364e-06, "loss": 1.0823, "step": 21661 }, { "epoch": 0.41, "learning_rate": 3.3439234705550455e-06, "loss": 0.9974, "step": 21662 }, { "epoch": 0.41, "learning_rate": 3.3437796706835423e-06, "loss": 0.8995, "step": 21663 }, { "epoch": 0.41, "learning_rate": 3.343635867661391e-06, "loss": 0.8393, "step": 21664 }, { "epoch": 0.41, "learning_rate": 3.3434920614891303e-06, "loss": 0.8234, "step": 21665 }, { "epoch": 0.41, "learning_rate": 3.3433482521672957e-06, "loss": 0.9467, "step": 21666 }, { "epoch": 0.41, "learning_rate": 3.3432044396964247e-06, "loss": 0.8419, "step": 21667 }, { "epoch": 0.41, "learning_rate": 3.3430606240770547e-06, "loss": 1.0016, "step": 21668 }, { "epoch": 0.41, "learning_rate": 3.3429168053097215e-06, "loss": 0.8718, "step": 21669 }, { "epoch": 0.41, "learning_rate": 3.342772983394963e-06, "loss": 1.0166, "step": 21670 }, { "epoch": 0.41, "learning_rate": 3.342629158333316e-06, "loss": 0.8443, "step": 21671 }, { "epoch": 0.41, "learning_rate": 3.342485330125317e-06, "loss": 0.7305, "step": 21672 }, { "epoch": 0.41, "learning_rate": 3.342341498771504e-06, "loss": 1.11, "step": 21673 }, { "epoch": 0.41, "learning_rate": 3.3421976642724142e-06, "loss": 0.8227, "step": 21674 }, { "epoch": 0.41, "learning_rate": 3.342053826628584e-06, "loss": 0.997, "step": 21675 }, { "epoch": 0.41, "learning_rate": 3.34190998584055e-06, "loss": 0.8545, "step": 21676 }, { "epoch": 0.41, "learning_rate": 3.341766141908851e-06, "loss": 0.8795, "step": 21677 }, { "epoch": 0.41, "learning_rate": 3.3416222948340218e-06, "loss": 0.8864, "step": 21678 }, { "epoch": 0.41, "learning_rate": 3.341478444616601e-06, "loss": 0.887, "step": 21679 }, { "epoch": 0.41, "learning_rate": 3.341334591257126e-06, "loss": 0.6639, "step": 21680 }, { "epoch": 0.41, "learning_rate": 3.3411907347561335e-06, "loss": 1.05, "step": 21681 }, { "epoch": 0.41, "learning_rate": 3.34104687511416e-06, "loss": 0.9687, "step": 21682 }, { "epoch": 0.41, "learning_rate": 3.340903012331744e-06, "loss": 0.8912, "step": 21683 }, { "epoch": 0.41, "learning_rate": 3.3407591464094215e-06, "loss": 0.9212, "step": 21684 }, { "epoch": 0.41, "learning_rate": 3.3406152773477296e-06, "loss": 0.7618, "step": 21685 }, { "epoch": 0.41, "learning_rate": 3.3404714051472067e-06, "loss": 0.9226, "step": 21686 }, { "epoch": 0.41, "learning_rate": 3.3403275298083894e-06, "loss": 1.1163, "step": 21687 }, { "epoch": 0.41, "learning_rate": 3.340183651331814e-06, "loss": 0.7916, "step": 21688 }, { "epoch": 0.41, "learning_rate": 3.3400397697180196e-06, "loss": 0.9131, "step": 21689 }, { "epoch": 0.41, "learning_rate": 3.3398958849675423e-06, "loss": 0.8006, "step": 21690 }, { "epoch": 0.41, "learning_rate": 3.3397519970809188e-06, "loss": 0.8153, "step": 21691 }, { "epoch": 0.41, "learning_rate": 3.339608106058688e-06, "loss": 0.8778, "step": 21692 }, { "epoch": 0.41, "learning_rate": 3.339464211901385e-06, "loss": 0.9875, "step": 21693 }, { "epoch": 0.41, "learning_rate": 3.33932031460955e-06, "loss": 1.0709, "step": 21694 }, { "epoch": 0.41, "learning_rate": 3.339176414183718e-06, "loss": 0.8395, "step": 21695 }, { "epoch": 0.41, "learning_rate": 3.339032510624427e-06, "loss": 1.0226, "step": 21696 }, { "epoch": 0.41, "learning_rate": 3.3388886039322146e-06, "loss": 1.1429, "step": 21697 }, { "epoch": 0.41, "learning_rate": 3.3387446941076173e-06, "loss": 0.8757, "step": 21698 }, { "epoch": 0.41, "learning_rate": 3.338600781151173e-06, "loss": 0.9566, "step": 21699 }, { "epoch": 0.41, "learning_rate": 3.338456865063419e-06, "loss": 1.2881, "step": 21700 }, { "epoch": 0.41, "learning_rate": 3.338312945844894e-06, "loss": 1.0112, "step": 21701 }, { "epoch": 0.41, "learning_rate": 3.3381690234961327e-06, "loss": 0.9353, "step": 21702 }, { "epoch": 0.41, "learning_rate": 3.338025098017675e-06, "loss": 0.7884, "step": 21703 }, { "epoch": 0.41, "learning_rate": 3.337881169410057e-06, "loss": 0.8514, "step": 21704 }, { "epoch": 0.41, "learning_rate": 3.337737237673816e-06, "loss": 0.9443, "step": 21705 }, { "epoch": 0.41, "learning_rate": 3.3375933028094904e-06, "loss": 0.9917, "step": 21706 }, { "epoch": 0.41, "learning_rate": 3.3374493648176167e-06, "loss": 0.9836, "step": 21707 }, { "epoch": 0.41, "learning_rate": 3.3373054236987324e-06, "loss": 0.8898, "step": 21708 }, { "epoch": 0.41, "learning_rate": 3.3371614794533758e-06, "loss": 0.9119, "step": 21709 }, { "epoch": 0.41, "learning_rate": 3.3370175320820843e-06, "loss": 0.9823, "step": 21710 }, { "epoch": 0.41, "learning_rate": 3.3368735815853946e-06, "loss": 1.1208, "step": 21711 }, { "epoch": 0.41, "learning_rate": 3.3367296279638445e-06, "loss": 1.098, "step": 21712 }, { "epoch": 0.41, "learning_rate": 3.336585671217971e-06, "loss": 1.1267, "step": 21713 }, { "epoch": 0.41, "learning_rate": 3.3364417113483132e-06, "loss": 0.9083, "step": 21714 }, { "epoch": 0.41, "learning_rate": 3.336297748355408e-06, "loss": 1.0096, "step": 21715 }, { "epoch": 0.41, "learning_rate": 3.3361537822397923e-06, "loss": 0.866, "step": 21716 }, { "epoch": 0.41, "learning_rate": 3.3360098130020035e-06, "loss": 0.9709, "step": 21717 }, { "epoch": 0.41, "learning_rate": 3.33586584064258e-06, "loss": 0.9846, "step": 21718 }, { "epoch": 0.41, "learning_rate": 3.335721865162059e-06, "loss": 0.9337, "step": 21719 }, { "epoch": 0.41, "learning_rate": 3.335577886560978e-06, "loss": 0.7233, "step": 21720 }, { "epoch": 0.41, "learning_rate": 3.3354339048398747e-06, "loss": 0.9431, "step": 21721 }, { "epoch": 0.41, "learning_rate": 3.3352899199992876e-06, "loss": 1.0735, "step": 21722 }, { "epoch": 0.41, "learning_rate": 3.335145932039753e-06, "loss": 0.7453, "step": 21723 }, { "epoch": 0.41, "learning_rate": 3.3350019409618094e-06, "loss": 1.0234, "step": 21724 }, { "epoch": 0.41, "learning_rate": 3.334857946765994e-06, "loss": 1.1097, "step": 21725 }, { "epoch": 0.41, "learning_rate": 3.3347139494528447e-06, "loss": 0.8313, "step": 21726 }, { "epoch": 0.41, "learning_rate": 3.334569949022899e-06, "loss": 0.6454, "step": 21727 }, { "epoch": 0.41, "learning_rate": 3.3344259454766947e-06, "loss": 0.8461, "step": 21728 }, { "epoch": 0.41, "learning_rate": 3.334281938814769e-06, "loss": 0.7301, "step": 21729 }, { "epoch": 0.41, "learning_rate": 3.3341379290376606e-06, "loss": 0.7483, "step": 21730 }, { "epoch": 0.41, "learning_rate": 3.3339939161459075e-06, "loss": 1.0337, "step": 21731 }, { "epoch": 0.41, "learning_rate": 3.3338499001400454e-06, "loss": 1.0609, "step": 21732 }, { "epoch": 0.41, "learning_rate": 3.3337058810206142e-06, "loss": 0.9377, "step": 21733 }, { "epoch": 0.41, "learning_rate": 3.3335618587881503e-06, "loss": 0.897, "step": 21734 }, { "epoch": 0.41, "learning_rate": 3.333417833443192e-06, "loss": 0.6912, "step": 21735 }, { "epoch": 0.41, "learning_rate": 3.333273804986277e-06, "loss": 0.8415, "step": 21736 }, { "epoch": 0.41, "learning_rate": 3.3331297734179436e-06, "loss": 1.1529, "step": 21737 }, { "epoch": 0.41, "learning_rate": 3.3329857387387294e-06, "loss": 0.9694, "step": 21738 }, { "epoch": 0.41, "learning_rate": 3.332841700949171e-06, "loss": 1.034, "step": 21739 }, { "epoch": 0.41, "learning_rate": 3.3326976600498084e-06, "loss": 0.8974, "step": 21740 }, { "epoch": 0.41, "learning_rate": 3.332553616041177e-06, "loss": 0.7396, "step": 21741 }, { "epoch": 0.41, "learning_rate": 3.3324095689238165e-06, "loss": 0.7254, "step": 21742 }, { "epoch": 0.41, "learning_rate": 3.3322655186982642e-06, "loss": 1.1271, "step": 21743 }, { "epoch": 0.41, "learning_rate": 3.3321214653650586e-06, "loss": 1.1087, "step": 21744 }, { "epoch": 0.41, "learning_rate": 3.3319774089247358e-06, "loss": 0.9351, "step": 21745 }, { "epoch": 0.41, "learning_rate": 3.331833349377836e-06, "loss": 0.9715, "step": 21746 }, { "epoch": 0.41, "learning_rate": 3.3316892867248956e-06, "loss": 0.9752, "step": 21747 }, { "epoch": 0.41, "learning_rate": 3.3315452209664522e-06, "loss": 0.9551, "step": 21748 }, { "epoch": 0.41, "learning_rate": 3.3314011521030453e-06, "loss": 0.9106, "step": 21749 }, { "epoch": 0.41, "learning_rate": 3.331257080135212e-06, "loss": 1.3766, "step": 21750 }, { "epoch": 0.41, "learning_rate": 3.33111300506349e-06, "loss": 0.9787, "step": 21751 }, { "epoch": 0.41, "learning_rate": 3.330968926888417e-06, "loss": 0.9693, "step": 21752 }, { "epoch": 0.41, "learning_rate": 3.3308248456105318e-06, "loss": 1.0046, "step": 21753 }, { "epoch": 0.41, "learning_rate": 3.3306807612303728e-06, "loss": 0.8336, "step": 21754 }, { "epoch": 0.41, "learning_rate": 3.330536673748476e-06, "loss": 1.0259, "step": 21755 }, { "epoch": 0.41, "learning_rate": 3.3303925831653817e-06, "loss": 1.0059, "step": 21756 }, { "epoch": 0.41, "learning_rate": 3.3302484894816267e-06, "loss": 0.7808, "step": 21757 }, { "epoch": 0.41, "learning_rate": 3.3301043926977493e-06, "loss": 0.7196, "step": 21758 }, { "epoch": 0.41, "learning_rate": 3.3299602928142878e-06, "loss": 0.9824, "step": 21759 }, { "epoch": 0.41, "learning_rate": 3.3298161898317805e-06, "loss": 1.0322, "step": 21760 }, { "epoch": 0.41, "learning_rate": 3.3296720837507635e-06, "loss": 0.8442, "step": 21761 }, { "epoch": 0.41, "learning_rate": 3.329527974571777e-06, "loss": 1.1339, "step": 21762 }, { "epoch": 0.41, "learning_rate": 3.329383862295359e-06, "loss": 0.9983, "step": 21763 }, { "epoch": 0.41, "learning_rate": 3.329239746922047e-06, "loss": 0.9462, "step": 21764 }, { "epoch": 0.41, "learning_rate": 3.3290956284523785e-06, "loss": 0.8704, "step": 21765 }, { "epoch": 0.41, "learning_rate": 3.328951506886893e-06, "loss": 0.817, "step": 21766 }, { "epoch": 0.41, "learning_rate": 3.328807382226128e-06, "loss": 1.0054, "step": 21767 }, { "epoch": 0.41, "learning_rate": 3.328663254470621e-06, "loss": 1.0541, "step": 21768 }, { "epoch": 0.41, "learning_rate": 3.328519123620911e-06, "loss": 1.1835, "step": 21769 }, { "epoch": 0.41, "learning_rate": 3.3283749896775366e-06, "loss": 0.797, "step": 21770 }, { "epoch": 0.41, "learning_rate": 3.3282308526410344e-06, "loss": 0.8647, "step": 21771 }, { "epoch": 0.41, "learning_rate": 3.3280867125119446e-06, "loss": 1.0758, "step": 21772 }, { "epoch": 0.41, "learning_rate": 3.327942569290804e-06, "loss": 0.9409, "step": 21773 }, { "epoch": 0.41, "learning_rate": 3.3277984229781512e-06, "loss": 0.9676, "step": 21774 }, { "epoch": 0.41, "learning_rate": 3.327654273574524e-06, "loss": 1.208, "step": 21775 }, { "epoch": 0.41, "learning_rate": 3.327510121080462e-06, "loss": 1.0084, "step": 21776 }, { "epoch": 0.41, "learning_rate": 3.3273659654965017e-06, "loss": 0.897, "step": 21777 }, { "epoch": 0.41, "learning_rate": 3.3272218068231837e-06, "loss": 0.8887, "step": 21778 }, { "epoch": 0.41, "learning_rate": 3.3270776450610435e-06, "loss": 0.7166, "step": 21779 }, { "epoch": 0.41, "learning_rate": 3.3269334802106213e-06, "loss": 0.8711, "step": 21780 }, { "epoch": 0.41, "learning_rate": 3.3267893122724548e-06, "loss": 0.8688, "step": 21781 }, { "epoch": 0.41, "learning_rate": 3.3266451412470823e-06, "loss": 1.0034, "step": 21782 }, { "epoch": 0.41, "learning_rate": 3.3265009671350412e-06, "loss": 0.6371, "step": 21783 }, { "epoch": 0.41, "learning_rate": 3.3263567899368725e-06, "loss": 0.8659, "step": 21784 }, { "epoch": 0.41, "learning_rate": 3.3262126096531123e-06, "loss": 0.8539, "step": 21785 }, { "epoch": 0.41, "learning_rate": 3.3260684262842992e-06, "loss": 1.1557, "step": 21786 }, { "epoch": 0.41, "learning_rate": 3.325924239830972e-06, "loss": 1.0323, "step": 21787 }, { "epoch": 0.41, "learning_rate": 3.3257800502936695e-06, "loss": 0.9202, "step": 21788 }, { "epoch": 0.41, "learning_rate": 3.3256358576729286e-06, "loss": 0.7596, "step": 21789 }, { "epoch": 0.41, "learning_rate": 3.3254916619692893e-06, "loss": 0.8293, "step": 21790 }, { "epoch": 0.41, "learning_rate": 3.3253474631832895e-06, "loss": 0.9347, "step": 21791 }, { "epoch": 0.41, "learning_rate": 3.325203261315467e-06, "loss": 0.8655, "step": 21792 }, { "epoch": 0.41, "learning_rate": 3.325059056366362e-06, "loss": 1.2239, "step": 21793 }, { "epoch": 0.41, "learning_rate": 3.324914848336511e-06, "loss": 1.0908, "step": 21794 }, { "epoch": 0.41, "learning_rate": 3.324770637226454e-06, "loss": 0.7576, "step": 21795 }, { "epoch": 0.41, "learning_rate": 3.3246264230367275e-06, "loss": 0.9057, "step": 21796 }, { "epoch": 0.41, "learning_rate": 3.324482205767872e-06, "loss": 0.8759, "step": 21797 }, { "epoch": 0.41, "learning_rate": 3.324337985420425e-06, "loss": 1.0118, "step": 21798 }, { "epoch": 0.41, "learning_rate": 3.324193761994926e-06, "loss": 1.1662, "step": 21799 }, { "epoch": 0.41, "learning_rate": 3.3240495354919115e-06, "loss": 1.1196, "step": 21800 }, { "epoch": 0.41, "learning_rate": 3.323905305911922e-06, "loss": 1.0854, "step": 21801 }, { "epoch": 0.41, "learning_rate": 3.323761073255496e-06, "loss": 1.1219, "step": 21802 }, { "epoch": 0.41, "learning_rate": 3.3236168375231697e-06, "loss": 0.9304, "step": 21803 }, { "epoch": 0.41, "learning_rate": 3.323472598715484e-06, "loss": 0.9839, "step": 21804 }, { "epoch": 0.41, "learning_rate": 3.3233283568329777e-06, "loss": 0.9592, "step": 21805 }, { "epoch": 0.41, "learning_rate": 3.323184111876188e-06, "loss": 1.0515, "step": 21806 }, { "epoch": 0.41, "learning_rate": 3.323039863845654e-06, "loss": 0.8752, "step": 21807 }, { "epoch": 0.41, "learning_rate": 3.322895612741915e-06, "loss": 0.9377, "step": 21808 }, { "epoch": 0.41, "learning_rate": 3.3227513585655086e-06, "loss": 0.8607, "step": 21809 }, { "epoch": 0.41, "learning_rate": 3.3226071013169737e-06, "loss": 0.8345, "step": 21810 }, { "epoch": 0.41, "learning_rate": 3.322462840996849e-06, "loss": 0.9456, "step": 21811 }, { "epoch": 0.41, "learning_rate": 3.3223185776056733e-06, "loss": 0.8663, "step": 21812 }, { "epoch": 0.41, "learning_rate": 3.3221743111439852e-06, "loss": 1.0289, "step": 21813 }, { "epoch": 0.41, "learning_rate": 3.322030041612324e-06, "loss": 0.8782, "step": 21814 }, { "epoch": 0.41, "learning_rate": 3.3218857690112273e-06, "loss": 0.8069, "step": 21815 }, { "epoch": 0.41, "learning_rate": 3.3217414933412344e-06, "loss": 0.7801, "step": 21816 }, { "epoch": 0.41, "learning_rate": 3.321597214602884e-06, "loss": 0.7819, "step": 21817 }, { "epoch": 0.41, "learning_rate": 3.3214529327967148e-06, "loss": 1.1893, "step": 21818 }, { "epoch": 0.41, "learning_rate": 3.3213086479232655e-06, "loss": 0.8964, "step": 21819 }, { "epoch": 0.41, "learning_rate": 3.321164359983076e-06, "loss": 1.0094, "step": 21820 }, { "epoch": 0.41, "learning_rate": 3.321020068976682e-06, "loss": 0.8625, "step": 21821 }, { "epoch": 0.41, "learning_rate": 3.320875774904625e-06, "loss": 0.8599, "step": 21822 }, { "epoch": 0.41, "learning_rate": 3.3207314777674436e-06, "loss": 0.8306, "step": 21823 }, { "epoch": 0.41, "learning_rate": 3.320587177565675e-06, "loss": 1.1036, "step": 21824 }, { "epoch": 0.41, "learning_rate": 3.3204428742998597e-06, "loss": 1.1593, "step": 21825 }, { "epoch": 0.41, "learning_rate": 3.3202985679705365e-06, "loss": 0.8945, "step": 21826 }, { "epoch": 0.41, "learning_rate": 3.3201542585782426e-06, "loss": 0.7363, "step": 21827 }, { "epoch": 0.41, "learning_rate": 3.320009946123518e-06, "loss": 1.0557, "step": 21828 }, { "epoch": 0.41, "learning_rate": 3.3198656306069023e-06, "loss": 0.8256, "step": 21829 }, { "epoch": 0.41, "learning_rate": 3.3197213120289325e-06, "loss": 0.8958, "step": 21830 }, { "epoch": 0.41, "learning_rate": 3.319576990390148e-06, "loss": 1.1724, "step": 21831 }, { "epoch": 0.41, "learning_rate": 3.3194326656910893e-06, "loss": 0.9718, "step": 21832 }, { "epoch": 0.41, "learning_rate": 3.3192883379322932e-06, "loss": 0.8633, "step": 21833 }, { "epoch": 0.41, "learning_rate": 3.3191440071143e-06, "loss": 1.0175, "step": 21834 }, { "epoch": 0.41, "learning_rate": 3.318999673237649e-06, "loss": 0.7883, "step": 21835 }, { "epoch": 0.41, "learning_rate": 3.3188553363028777e-06, "loss": 1.0234, "step": 21836 }, { "epoch": 0.41, "learning_rate": 3.3187109963105246e-06, "loss": 1.1543, "step": 21837 }, { "epoch": 0.41, "learning_rate": 3.318566653261131e-06, "loss": 1.0168, "step": 21838 }, { "epoch": 0.41, "learning_rate": 3.318422307155234e-06, "loss": 0.941, "step": 21839 }, { "epoch": 0.41, "learning_rate": 3.318277957993373e-06, "loss": 0.8348, "step": 21840 }, { "epoch": 0.41, "learning_rate": 3.3181336057760887e-06, "loss": 0.9138, "step": 21841 }, { "epoch": 0.41, "learning_rate": 3.3179892505039173e-06, "loss": 0.8992, "step": 21842 }, { "epoch": 0.41, "learning_rate": 3.3178448921773992e-06, "loss": 0.987, "step": 21843 }, { "epoch": 0.41, "learning_rate": 3.3177005307970746e-06, "loss": 0.8788, "step": 21844 }, { "epoch": 0.41, "learning_rate": 3.317556166363479e-06, "loss": 0.9776, "step": 21845 }, { "epoch": 0.41, "learning_rate": 3.3174117988771547e-06, "loss": 0.5962, "step": 21846 }, { "epoch": 0.41, "learning_rate": 3.317267428338641e-06, "loss": 0.9016, "step": 21847 }, { "epoch": 0.41, "learning_rate": 3.3171230547484747e-06, "loss": 0.8367, "step": 21848 }, { "epoch": 0.41, "learning_rate": 3.316978678107196e-06, "loss": 1.0991, "step": 21849 }, { "epoch": 0.41, "learning_rate": 3.3168342984153446e-06, "loss": 1.2034, "step": 21850 }, { "epoch": 0.41, "learning_rate": 3.3166899156734584e-06, "loss": 0.9383, "step": 21851 }, { "epoch": 0.41, "learning_rate": 3.316545529882077e-06, "loss": 0.7794, "step": 21852 }, { "epoch": 0.41, "learning_rate": 3.3164011410417396e-06, "loss": 1.0267, "step": 21853 }, { "epoch": 0.41, "learning_rate": 3.3162567491529856e-06, "loss": 0.6989, "step": 21854 }, { "epoch": 0.41, "learning_rate": 3.316112354216354e-06, "loss": 0.863, "step": 21855 }, { "epoch": 0.41, "learning_rate": 3.3159679562323842e-06, "loss": 1.0265, "step": 21856 }, { "epoch": 0.41, "learning_rate": 3.3158235552016143e-06, "loss": 1.0554, "step": 21857 }, { "epoch": 0.41, "learning_rate": 3.3156791511245843e-06, "loss": 0.7722, "step": 21858 }, { "epoch": 0.41, "learning_rate": 3.315534744001834e-06, "loss": 0.8868, "step": 21859 }, { "epoch": 0.41, "learning_rate": 3.3153903338339014e-06, "loss": 1.0043, "step": 21860 }, { "epoch": 0.41, "learning_rate": 3.315245920621327e-06, "loss": 1.0732, "step": 21861 }, { "epoch": 0.41, "learning_rate": 3.315101504364649e-06, "loss": 1.0214, "step": 21862 }, { "epoch": 0.41, "learning_rate": 3.3149570850644064e-06, "loss": 1.0352, "step": 21863 }, { "epoch": 0.41, "learning_rate": 3.31481266272114e-06, "loss": 0.9221, "step": 21864 }, { "epoch": 0.41, "learning_rate": 3.314668237335388e-06, "loss": 0.9131, "step": 21865 }, { "epoch": 0.41, "learning_rate": 3.3145238089076883e-06, "loss": 0.8184, "step": 21866 }, { "epoch": 0.41, "learning_rate": 3.3143793774385835e-06, "loss": 0.7887, "step": 21867 }, { "epoch": 0.41, "learning_rate": 3.3142349429286097e-06, "loss": 1.097, "step": 21868 }, { "epoch": 0.41, "learning_rate": 3.3140905053783086e-06, "loss": 0.8094, "step": 21869 }, { "epoch": 0.41, "learning_rate": 3.3139460647882183e-06, "loss": 1.0379, "step": 21870 }, { "epoch": 0.41, "learning_rate": 3.313801621158878e-06, "loss": 0.8959, "step": 21871 }, { "epoch": 0.41, "learning_rate": 3.3136571744908276e-06, "loss": 0.6822, "step": 21872 }, { "epoch": 0.41, "learning_rate": 3.313512724784606e-06, "loss": 0.8769, "step": 21873 }, { "epoch": 0.41, "learning_rate": 3.313368272040753e-06, "loss": 1.0941, "step": 21874 }, { "epoch": 0.41, "learning_rate": 3.3132238162598073e-06, "loss": 0.9738, "step": 21875 }, { "epoch": 0.41, "learning_rate": 3.3130793574423105e-06, "loss": 0.8855, "step": 21876 }, { "epoch": 0.41, "learning_rate": 3.3129348955887986e-06, "loss": 0.8001, "step": 21877 }, { "epoch": 0.41, "learning_rate": 3.312790430699813e-06, "loss": 1.0704, "step": 21878 }, { "epoch": 0.41, "learning_rate": 3.3126459627758935e-06, "loss": 0.816, "step": 21879 }, { "epoch": 0.41, "learning_rate": 3.312501491817578e-06, "loss": 1.051, "step": 21880 }, { "epoch": 0.41, "learning_rate": 3.312357017825408e-06, "loss": 1.1431, "step": 21881 }, { "epoch": 0.41, "learning_rate": 3.312212540799921e-06, "loss": 0.9263, "step": 21882 }, { "epoch": 0.41, "learning_rate": 3.3120680607416576e-06, "loss": 0.8326, "step": 21883 }, { "epoch": 0.41, "learning_rate": 3.3119235776511565e-06, "loss": 1.0251, "step": 21884 }, { "epoch": 0.41, "learning_rate": 3.3117790915289584e-06, "loss": 0.7837, "step": 21885 }, { "epoch": 0.41, "learning_rate": 3.3116346023756017e-06, "loss": 0.8916, "step": 21886 }, { "epoch": 0.41, "learning_rate": 3.3114901101916254e-06, "loss": 1.1736, "step": 21887 }, { "epoch": 0.41, "learning_rate": 3.3113456149775714e-06, "loss": 1.0237, "step": 21888 }, { "epoch": 0.41, "learning_rate": 3.311201116733977e-06, "loss": 0.8303, "step": 21889 }, { "epoch": 0.41, "learning_rate": 3.311056615461382e-06, "loss": 0.8395, "step": 21890 }, { "epoch": 0.41, "learning_rate": 3.3109121111603276e-06, "loss": 0.9343, "step": 21891 }, { "epoch": 0.41, "learning_rate": 3.310767603831352e-06, "loss": 0.8498, "step": 21892 }, { "epoch": 0.41, "learning_rate": 3.3106230934749944e-06, "loss": 1.1931, "step": 21893 }, { "epoch": 0.41, "learning_rate": 3.3104785800917948e-06, "loss": 1.1224, "step": 21894 }, { "epoch": 0.41, "learning_rate": 3.310334063682294e-06, "loss": 1.0792, "step": 21895 }, { "epoch": 0.41, "learning_rate": 3.31018954424703e-06, "loss": 0.7243, "step": 21896 }, { "epoch": 0.41, "learning_rate": 3.3100450217865436e-06, "loss": 0.8984, "step": 21897 }, { "epoch": 0.41, "learning_rate": 3.309900496301374e-06, "loss": 0.8239, "step": 21898 }, { "epoch": 0.41, "learning_rate": 3.3097559677920598e-06, "loss": 1.0667, "step": 21899 }, { "epoch": 0.41, "learning_rate": 3.3096114362591426e-06, "loss": 1.1356, "step": 21900 }, { "epoch": 0.41, "learning_rate": 3.30946690170316e-06, "loss": 0.8008, "step": 21901 }, { "epoch": 0.41, "learning_rate": 3.3093223641246536e-06, "loss": 0.9305, "step": 21902 }, { "epoch": 0.41, "learning_rate": 3.3091778235241628e-06, "loss": 1.0001, "step": 21903 }, { "epoch": 0.41, "learning_rate": 3.309033279902226e-06, "loss": 0.9931, "step": 21904 }, { "epoch": 0.41, "learning_rate": 3.3088887332593842e-06, "loss": 0.952, "step": 21905 }, { "epoch": 0.41, "learning_rate": 3.308744183596177e-06, "loss": 1.1245, "step": 21906 }, { "epoch": 0.41, "learning_rate": 3.308599630913143e-06, "loss": 0.8945, "step": 21907 }, { "epoch": 0.41, "learning_rate": 3.3084550752108226e-06, "loss": 0.8585, "step": 21908 }, { "epoch": 0.41, "learning_rate": 3.3083105164897568e-06, "loss": 0.9602, "step": 21909 }, { "epoch": 0.41, "learning_rate": 3.3081659547504834e-06, "loss": 0.9146, "step": 21910 }, { "epoch": 0.41, "learning_rate": 3.3080213899935433e-06, "loss": 0.7907, "step": 21911 }, { "epoch": 0.41, "learning_rate": 3.307876822219477e-06, "loss": 0.855, "step": 21912 }, { "epoch": 0.41, "learning_rate": 3.307732251428822e-06, "loss": 0.9999, "step": 21913 }, { "epoch": 0.41, "learning_rate": 3.3075876776221207e-06, "loss": 0.6819, "step": 21914 }, { "epoch": 0.41, "learning_rate": 3.3074431007999108e-06, "loss": 0.957, "step": 21915 }, { "epoch": 0.41, "learning_rate": 3.307298520962734e-06, "loss": 0.9783, "step": 21916 }, { "epoch": 0.41, "learning_rate": 3.3071539381111285e-06, "loss": 1.0561, "step": 21917 }, { "epoch": 0.41, "learning_rate": 3.307009352245636e-06, "loss": 1.2029, "step": 21918 }, { "epoch": 0.41, "learning_rate": 3.306864763366794e-06, "loss": 0.985, "step": 21919 }, { "epoch": 0.41, "learning_rate": 3.3067201714751444e-06, "loss": 1.0175, "step": 21920 }, { "epoch": 0.41, "learning_rate": 3.306575576571226e-06, "loss": 0.9136, "step": 21921 }, { "epoch": 0.41, "learning_rate": 3.30643097865558e-06, "loss": 1.0156, "step": 21922 }, { "epoch": 0.41, "learning_rate": 3.3062863777287444e-06, "loss": 1.0028, "step": 21923 }, { "epoch": 0.41, "learning_rate": 3.3061417737912616e-06, "loss": 0.9201, "step": 21924 }, { "epoch": 0.41, "learning_rate": 3.3059971668436684e-06, "loss": 0.9856, "step": 21925 }, { "epoch": 0.41, "learning_rate": 3.3058525568865075e-06, "loss": 0.9287, "step": 21926 }, { "epoch": 0.41, "learning_rate": 3.3057079439203183e-06, "loss": 0.7449, "step": 21927 }, { "epoch": 0.41, "learning_rate": 3.3055633279456397e-06, "loss": 0.8382, "step": 21928 }, { "epoch": 0.41, "learning_rate": 3.305418708963012e-06, "loss": 1.0741, "step": 21929 }, { "epoch": 0.41, "learning_rate": 3.305274086972976e-06, "loss": 0.7889, "step": 21930 }, { "epoch": 0.41, "learning_rate": 3.305129461976071e-06, "loss": 1.16, "step": 21931 }, { "epoch": 0.41, "learning_rate": 3.3049848339728373e-06, "loss": 1.155, "step": 21932 }, { "epoch": 0.41, "learning_rate": 3.3048402029638155e-06, "loss": 0.84, "step": 21933 }, { "epoch": 0.41, "learning_rate": 3.3046955689495446e-06, "loss": 0.7215, "step": 21934 }, { "epoch": 0.41, "learning_rate": 3.3045509319305653e-06, "loss": 0.8567, "step": 21935 }, { "epoch": 0.41, "learning_rate": 3.304406291907417e-06, "loss": 0.6688, "step": 21936 }, { "epoch": 0.41, "learning_rate": 3.3042616488806407e-06, "loss": 0.9105, "step": 21937 }, { "epoch": 0.41, "learning_rate": 3.304117002850776e-06, "loss": 1.0492, "step": 21938 }, { "epoch": 0.41, "learning_rate": 3.303972353818363e-06, "loss": 0.7161, "step": 21939 }, { "epoch": 0.41, "learning_rate": 3.303827701783942e-06, "loss": 0.959, "step": 21940 }, { "epoch": 0.41, "learning_rate": 3.303683046748053e-06, "loss": 0.8611, "step": 21941 }, { "epoch": 0.41, "learning_rate": 3.303538388711236e-06, "loss": 0.8906, "step": 21942 }, { "epoch": 0.41, "learning_rate": 3.303393727674031e-06, "loss": 1.0971, "step": 21943 }, { "epoch": 0.41, "learning_rate": 3.3032490636369787e-06, "loss": 1.1428, "step": 21944 }, { "epoch": 0.41, "learning_rate": 3.3031043966006192e-06, "loss": 0.9486, "step": 21945 }, { "epoch": 0.41, "learning_rate": 3.302959726565493e-06, "loss": 1.0578, "step": 21946 }, { "epoch": 0.41, "learning_rate": 3.302815053532139e-06, "loss": 0.9511, "step": 21947 }, { "epoch": 0.41, "learning_rate": 3.302670377501099e-06, "loss": 0.9016, "step": 21948 }, { "epoch": 0.41, "learning_rate": 3.3025256984729116e-06, "loss": 0.9518, "step": 21949 }, { "epoch": 0.41, "learning_rate": 3.3023810164481174e-06, "loss": 0.976, "step": 21950 }, { "epoch": 0.41, "learning_rate": 3.3022363314272583e-06, "loss": 0.9512, "step": 21951 }, { "epoch": 0.41, "learning_rate": 3.3020916434108724e-06, "loss": 0.9801, "step": 21952 }, { "epoch": 0.41, "learning_rate": 3.301946952399501e-06, "loss": 0.8693, "step": 21953 }, { "epoch": 0.41, "learning_rate": 3.3018022583936855e-06, "loss": 0.8401, "step": 21954 }, { "epoch": 0.41, "learning_rate": 3.3016575613939637e-06, "loss": 0.9489, "step": 21955 }, { "epoch": 0.41, "learning_rate": 3.3015128614008774e-06, "loss": 1.1584, "step": 21956 }, { "epoch": 0.41, "learning_rate": 3.301368158414967e-06, "loss": 1.014, "step": 21957 }, { "epoch": 0.41, "learning_rate": 3.301223452436772e-06, "loss": 1.1432, "step": 21958 }, { "epoch": 0.41, "learning_rate": 3.3010787434668334e-06, "loss": 0.9224, "step": 21959 }, { "epoch": 0.41, "learning_rate": 3.3009340315056913e-06, "loss": 0.8679, "step": 21960 }, { "epoch": 0.41, "learning_rate": 3.3007893165538863e-06, "loss": 0.9464, "step": 21961 }, { "epoch": 0.41, "learning_rate": 3.3006445986119584e-06, "loss": 1.1698, "step": 21962 }, { "epoch": 0.41, "learning_rate": 3.3004998776804477e-06, "loss": 1.0385, "step": 21963 }, { "epoch": 0.41, "learning_rate": 3.3003551537598953e-06, "loss": 0.8654, "step": 21964 }, { "epoch": 0.41, "learning_rate": 3.3002104268508413e-06, "loss": 1.0122, "step": 21965 }, { "epoch": 0.41, "learning_rate": 3.3000656969538265e-06, "loss": 0.8852, "step": 21966 }, { "epoch": 0.41, "learning_rate": 3.299920964069391e-06, "loss": 0.8622, "step": 21967 }, { "epoch": 0.41, "learning_rate": 3.2997762281980743e-06, "loss": 1.0685, "step": 21968 }, { "epoch": 0.41, "learning_rate": 3.2996314893404186e-06, "loss": 0.9743, "step": 21969 }, { "epoch": 0.41, "learning_rate": 3.299486747496963e-06, "loss": 1.1326, "step": 21970 }, { "epoch": 0.41, "learning_rate": 3.2993420026682476e-06, "loss": 1.0062, "step": 21971 }, { "epoch": 0.41, "learning_rate": 3.2991972548548147e-06, "loss": 0.866, "step": 21972 }, { "epoch": 0.41, "learning_rate": 3.2990525040572035e-06, "loss": 0.9356, "step": 21973 }, { "epoch": 0.41, "learning_rate": 3.2989077502759547e-06, "loss": 1.1281, "step": 21974 }, { "epoch": 0.41, "learning_rate": 3.2987629935116096e-06, "loss": 1.0994, "step": 21975 }, { "epoch": 0.41, "learning_rate": 3.2986182337647065e-06, "loss": 1.1108, "step": 21976 }, { "epoch": 0.41, "learning_rate": 3.298473471035788e-06, "loss": 0.8486, "step": 21977 }, { "epoch": 0.41, "learning_rate": 3.298328705325394e-06, "loss": 1.0046, "step": 21978 }, { "epoch": 0.41, "learning_rate": 3.2981839366340658e-06, "loss": 0.8762, "step": 21979 }, { "epoch": 0.41, "learning_rate": 3.2980391649623423e-06, "loss": 1.0543, "step": 21980 }, { "epoch": 0.41, "learning_rate": 3.2978943903107662e-06, "loss": 1.2191, "step": 21981 }, { "epoch": 0.41, "learning_rate": 3.297749612679876e-06, "loss": 1.0728, "step": 21982 }, { "epoch": 0.41, "learning_rate": 3.2976048320702137e-06, "loss": 0.9121, "step": 21983 }, { "epoch": 0.41, "learning_rate": 3.2974600484823185e-06, "loss": 1.0425, "step": 21984 }, { "epoch": 0.41, "learning_rate": 3.2973152619167327e-06, "loss": 0.8619, "step": 21985 }, { "epoch": 0.41, "learning_rate": 3.297170472373996e-06, "loss": 0.8016, "step": 21986 }, { "epoch": 0.41, "learning_rate": 3.297025679854649e-06, "loss": 1.0754, "step": 21987 }, { "epoch": 0.41, "learning_rate": 3.2968808843592324e-06, "loss": 1.1124, "step": 21988 }, { "epoch": 0.41, "learning_rate": 3.296736085888288e-06, "loss": 0.8598, "step": 21989 }, { "epoch": 0.41, "learning_rate": 3.2965912844423554e-06, "loss": 1.0809, "step": 21990 }, { "epoch": 0.41, "learning_rate": 3.296446480021974e-06, "loss": 0.8686, "step": 21991 }, { "epoch": 0.41, "learning_rate": 3.296301672627687e-06, "loss": 0.7924, "step": 21992 }, { "epoch": 0.41, "learning_rate": 3.296156862260033e-06, "loss": 1.0571, "step": 21993 }, { "epoch": 0.41, "learning_rate": 3.2960120489195546e-06, "loss": 1.0306, "step": 21994 }, { "epoch": 0.41, "learning_rate": 3.295867232606792e-06, "loss": 0.7813, "step": 21995 }, { "epoch": 0.41, "learning_rate": 3.295722413322284e-06, "loss": 0.8131, "step": 21996 }, { "epoch": 0.42, "learning_rate": 3.2955775910665742e-06, "loss": 0.7488, "step": 21997 }, { "epoch": 0.42, "learning_rate": 3.295432765840202e-06, "loss": 0.8992, "step": 21998 }, { "epoch": 0.42, "learning_rate": 3.2952879376437076e-06, "loss": 0.9291, "step": 21999 }, { "epoch": 0.42, "learning_rate": 3.2951431064776325e-06, "loss": 0.7822, "step": 22000 }, { "epoch": 0.42, "learning_rate": 3.294998272342518e-06, "loss": 0.9769, "step": 22001 }, { "epoch": 0.42, "learning_rate": 3.2948534352389037e-06, "loss": 0.8195, "step": 22002 }, { "epoch": 0.42, "learning_rate": 3.2947085951673313e-06, "loss": 0.7734, "step": 22003 }, { "epoch": 0.42, "learning_rate": 3.294563752128342e-06, "loss": 0.9219, "step": 22004 }, { "epoch": 0.42, "learning_rate": 3.2944189061224745e-06, "loss": 1.0041, "step": 22005 }, { "epoch": 0.42, "learning_rate": 3.2942740571502723e-06, "loss": 1.2249, "step": 22006 }, { "epoch": 0.42, "learning_rate": 3.2941292052122752e-06, "loss": 0.7803, "step": 22007 }, { "epoch": 0.42, "learning_rate": 3.2939843503090234e-06, "loss": 0.8635, "step": 22008 }, { "epoch": 0.42, "learning_rate": 3.2938394924410588e-06, "loss": 0.906, "step": 22009 }, { "epoch": 0.42, "learning_rate": 3.2936946316089223e-06, "loss": 0.8071, "step": 22010 }, { "epoch": 0.42, "learning_rate": 3.2935497678131534e-06, "loss": 0.8955, "step": 22011 }, { "epoch": 0.42, "learning_rate": 3.2934049010542944e-06, "loss": 0.9561, "step": 22012 }, { "epoch": 0.42, "learning_rate": 3.2932600313328855e-06, "loss": 0.9617, "step": 22013 }, { "epoch": 0.42, "learning_rate": 3.2931151586494684e-06, "loss": 1.0709, "step": 22014 }, { "epoch": 0.42, "learning_rate": 3.2929702830045832e-06, "loss": 0.9247, "step": 22015 }, { "epoch": 0.42, "learning_rate": 3.2928254043987724e-06, "loss": 0.7709, "step": 22016 }, { "epoch": 0.42, "learning_rate": 3.2926805228325746e-06, "loss": 0.8811, "step": 22017 }, { "epoch": 0.42, "learning_rate": 3.2925356383065325e-06, "loss": 1.0362, "step": 22018 }, { "epoch": 0.42, "learning_rate": 3.2923907508211867e-06, "loss": 1.0681, "step": 22019 }, { "epoch": 0.42, "learning_rate": 3.292245860377078e-06, "loss": 0.9849, "step": 22020 }, { "epoch": 0.42, "learning_rate": 3.2921009669747474e-06, "loss": 0.899, "step": 22021 }, { "epoch": 0.42, "learning_rate": 3.291956070614737e-06, "loss": 0.9238, "step": 22022 }, { "epoch": 0.42, "learning_rate": 3.291811171297586e-06, "loss": 0.8143, "step": 22023 }, { "epoch": 0.42, "learning_rate": 3.2916662690238365e-06, "loss": 1.0786, "step": 22024 }, { "epoch": 0.42, "learning_rate": 3.2915213637940297e-06, "loss": 0.9772, "step": 22025 }, { "epoch": 0.42, "learning_rate": 3.2913764556087056e-06, "loss": 0.9039, "step": 22026 }, { "epoch": 0.42, "learning_rate": 3.2912315444684063e-06, "loss": 0.7224, "step": 22027 }, { "epoch": 0.42, "learning_rate": 3.2910866303736734e-06, "loss": 0.8177, "step": 22028 }, { "epoch": 0.42, "learning_rate": 3.290941713325047e-06, "loss": 0.7693, "step": 22029 }, { "epoch": 0.42, "learning_rate": 3.2907967933230686e-06, "loss": 1.2017, "step": 22030 }, { "epoch": 0.42, "learning_rate": 3.2906518703682787e-06, "loss": 1.0643, "step": 22031 }, { "epoch": 0.42, "learning_rate": 3.290506944461219e-06, "loss": 0.973, "step": 22032 }, { "epoch": 0.42, "learning_rate": 3.2903620156024313e-06, "loss": 0.8788, "step": 22033 }, { "epoch": 0.42, "learning_rate": 3.2902170837924553e-06, "loss": 0.9969, "step": 22034 }, { "epoch": 0.42, "learning_rate": 3.2900721490318333e-06, "loss": 0.8694, "step": 22035 }, { "epoch": 0.42, "learning_rate": 3.289927211321106e-06, "loss": 0.9485, "step": 22036 }, { "epoch": 0.42, "learning_rate": 3.289782270660815e-06, "loss": 1.3674, "step": 22037 }, { "epoch": 0.42, "learning_rate": 3.2896373270515015e-06, "loss": 0.9124, "step": 22038 }, { "epoch": 0.42, "learning_rate": 3.2894923804937058e-06, "loss": 0.703, "step": 22039 }, { "epoch": 0.42, "learning_rate": 3.28934743098797e-06, "loss": 0.9737, "step": 22040 }, { "epoch": 0.42, "learning_rate": 3.289202478534834e-06, "loss": 0.9875, "step": 22041 }, { "epoch": 0.42, "learning_rate": 3.2890575231348415e-06, "loss": 0.7506, "step": 22042 }, { "epoch": 0.42, "learning_rate": 3.2889125647885324e-06, "loss": 1.0673, "step": 22043 }, { "epoch": 0.42, "learning_rate": 3.2887676034964478e-06, "loss": 0.8962, "step": 22044 }, { "epoch": 0.42, "learning_rate": 3.2886226392591288e-06, "loss": 0.9739, "step": 22045 }, { "epoch": 0.42, "learning_rate": 3.288477672077118e-06, "loss": 0.9893, "step": 22046 }, { "epoch": 0.42, "learning_rate": 3.2883327019509536e-06, "loss": 0.8903, "step": 22047 }, { "epoch": 0.42, "learning_rate": 3.2881877288811803e-06, "loss": 0.9321, "step": 22048 }, { "epoch": 0.42, "learning_rate": 3.288042752868339e-06, "loss": 0.9465, "step": 22049 }, { "epoch": 0.42, "learning_rate": 3.2878977739129696e-06, "loss": 1.0193, "step": 22050 }, { "epoch": 0.42, "learning_rate": 3.2877527920156137e-06, "loss": 1.0599, "step": 22051 }, { "epoch": 0.42, "learning_rate": 3.2876078071768136e-06, "loss": 0.9732, "step": 22052 }, { "epoch": 0.42, "learning_rate": 3.2874628193971104e-06, "loss": 1.0364, "step": 22053 }, { "epoch": 0.42, "learning_rate": 3.287317828677044e-06, "loss": 0.8751, "step": 22054 }, { "epoch": 0.42, "learning_rate": 3.287172835017158e-06, "loss": 1.0222, "step": 22055 }, { "epoch": 0.42, "learning_rate": 3.287027838417992e-06, "loss": 1.1241, "step": 22056 }, { "epoch": 0.42, "learning_rate": 3.2868828388800884e-06, "loss": 1.0454, "step": 22057 }, { "epoch": 0.42, "learning_rate": 3.286737836403989e-06, "loss": 0.8281, "step": 22058 }, { "epoch": 0.42, "learning_rate": 3.286592830990234e-06, "loss": 0.8276, "step": 22059 }, { "epoch": 0.42, "learning_rate": 3.2864478226393655e-06, "loss": 0.9067, "step": 22060 }, { "epoch": 0.42, "learning_rate": 3.2863028113519247e-06, "loss": 0.7714, "step": 22061 }, { "epoch": 0.42, "learning_rate": 3.2861577971284543e-06, "loss": 0.9248, "step": 22062 }, { "epoch": 0.42, "learning_rate": 3.2860127799694934e-06, "loss": 0.8919, "step": 22063 }, { "epoch": 0.42, "learning_rate": 3.2858677598755862e-06, "loss": 0.9022, "step": 22064 }, { "epoch": 0.42, "learning_rate": 3.2857227368472723e-06, "loss": 0.697, "step": 22065 }, { "epoch": 0.42, "learning_rate": 3.285577710885094e-06, "loss": 1.0264, "step": 22066 }, { "epoch": 0.42, "learning_rate": 3.2854326819895926e-06, "loss": 0.8575, "step": 22067 }, { "epoch": 0.42, "learning_rate": 3.285287650161309e-06, "loss": 1.2513, "step": 22068 }, { "epoch": 0.42, "learning_rate": 3.285142615400786e-06, "loss": 0.9457, "step": 22069 }, { "epoch": 0.42, "learning_rate": 3.2849975777085645e-06, "loss": 0.8525, "step": 22070 }, { "epoch": 0.42, "learning_rate": 3.2848525370851863e-06, "loss": 0.9704, "step": 22071 }, { "epoch": 0.42, "learning_rate": 3.284707493531192e-06, "loss": 0.6554, "step": 22072 }, { "epoch": 0.42, "learning_rate": 3.2845624470471256e-06, "loss": 0.8911, "step": 22073 }, { "epoch": 0.42, "learning_rate": 3.2844173976335258e-06, "loss": 0.9152, "step": 22074 }, { "epoch": 0.42, "learning_rate": 3.2842723452909355e-06, "loss": 0.9242, "step": 22075 }, { "epoch": 0.42, "learning_rate": 3.284127290019896e-06, "loss": 0.9365, "step": 22076 }, { "epoch": 0.42, "learning_rate": 3.28398223182095e-06, "loss": 0.8353, "step": 22077 }, { "epoch": 0.42, "learning_rate": 3.2838371706946383e-06, "loss": 0.9923, "step": 22078 }, { "epoch": 0.42, "learning_rate": 3.283692106641503e-06, "loss": 0.8339, "step": 22079 }, { "epoch": 0.42, "learning_rate": 3.2835470396620846e-06, "loss": 0.7335, "step": 22080 }, { "epoch": 0.42, "learning_rate": 3.2834019697569256e-06, "loss": 0.9877, "step": 22081 }, { "epoch": 0.42, "learning_rate": 3.2832568969265675e-06, "loss": 1.0065, "step": 22082 }, { "epoch": 0.42, "learning_rate": 3.283111821171553e-06, "loss": 1.077, "step": 22083 }, { "epoch": 0.42, "learning_rate": 3.282966742492422e-06, "loss": 0.6502, "step": 22084 }, { "epoch": 0.42, "learning_rate": 3.2828216608897183e-06, "loss": 0.9711, "step": 22085 }, { "epoch": 0.42, "learning_rate": 3.2826765763639824e-06, "loss": 0.9245, "step": 22086 }, { "epoch": 0.42, "learning_rate": 3.2825314889157555e-06, "loss": 0.9443, "step": 22087 }, { "epoch": 0.42, "learning_rate": 3.282386398545581e-06, "loss": 0.8563, "step": 22088 }, { "epoch": 0.42, "learning_rate": 3.2822413052539976e-06, "loss": 0.7802, "step": 22089 }, { "epoch": 0.42, "learning_rate": 3.2820962090415504e-06, "loss": 1.0886, "step": 22090 }, { "epoch": 0.42, "learning_rate": 3.2819511099087805e-06, "loss": 0.7841, "step": 22091 }, { "epoch": 0.42, "learning_rate": 3.2818060078562287e-06, "loss": 1.0978, "step": 22092 }, { "epoch": 0.42, "learning_rate": 3.281660902884437e-06, "loss": 0.9592, "step": 22093 }, { "epoch": 0.42, "learning_rate": 3.281515794993948e-06, "loss": 1.0295, "step": 22094 }, { "epoch": 0.42, "learning_rate": 3.281370684185302e-06, "loss": 0.9402, "step": 22095 }, { "epoch": 0.42, "learning_rate": 3.281225570459042e-06, "loss": 0.7194, "step": 22096 }, { "epoch": 0.42, "learning_rate": 3.281080453815711e-06, "loss": 1.0167, "step": 22097 }, { "epoch": 0.42, "learning_rate": 3.2809353342558483e-06, "loss": 0.6868, "step": 22098 }, { "epoch": 0.42, "learning_rate": 3.2807902117799977e-06, "loss": 1.0809, "step": 22099 }, { "epoch": 0.42, "learning_rate": 3.2806450863887003e-06, "loss": 1.1432, "step": 22100 }, { "epoch": 0.42, "learning_rate": 3.2804999580824974e-06, "loss": 0.9818, "step": 22101 }, { "epoch": 0.42, "learning_rate": 3.2803548268619316e-06, "loss": 0.7085, "step": 22102 }, { "epoch": 0.42, "learning_rate": 3.280209692727545e-06, "loss": 0.8836, "step": 22103 }, { "epoch": 0.42, "learning_rate": 3.28006455567988e-06, "loss": 0.8227, "step": 22104 }, { "epoch": 0.42, "learning_rate": 3.2799194157194774e-06, "loss": 0.9928, "step": 22105 }, { "epoch": 0.42, "learning_rate": 3.2797742728468794e-06, "loss": 0.9999, "step": 22106 }, { "epoch": 0.42, "learning_rate": 3.2796291270626286e-06, "loss": 1.1708, "step": 22107 }, { "epoch": 0.42, "learning_rate": 3.2794839783672665e-06, "loss": 0.8583, "step": 22108 }, { "epoch": 0.42, "learning_rate": 3.2793388267613345e-06, "loss": 0.8445, "step": 22109 }, { "epoch": 0.42, "learning_rate": 3.2791936722453755e-06, "loss": 0.7992, "step": 22110 }, { "epoch": 0.42, "learning_rate": 3.279048514819932e-06, "loss": 1.0266, "step": 22111 }, { "epoch": 0.42, "learning_rate": 3.278903354485544e-06, "loss": 1.0417, "step": 22112 }, { "epoch": 0.42, "learning_rate": 3.2787581912427557e-06, "loss": 1.115, "step": 22113 }, { "epoch": 0.42, "learning_rate": 3.2786130250921084e-06, "loss": 0.8329, "step": 22114 }, { "epoch": 0.42, "learning_rate": 3.2784678560341434e-06, "loss": 0.9376, "step": 22115 }, { "epoch": 0.42, "learning_rate": 3.278322684069403e-06, "loss": 0.9316, "step": 22116 }, { "epoch": 0.42, "learning_rate": 3.2781775091984296e-06, "loss": 0.8652, "step": 22117 }, { "epoch": 0.42, "learning_rate": 3.2780323314217655e-06, "loss": 1.0866, "step": 22118 }, { "epoch": 0.42, "learning_rate": 3.2778871507399525e-06, "loss": 0.9561, "step": 22119 }, { "epoch": 0.42, "learning_rate": 3.277741967153533e-06, "loss": 0.9046, "step": 22120 }, { "epoch": 0.42, "learning_rate": 3.277596780663049e-06, "loss": 0.9705, "step": 22121 }, { "epoch": 0.42, "learning_rate": 3.277451591269042e-06, "loss": 0.9152, "step": 22122 }, { "epoch": 0.42, "learning_rate": 3.2773063989720542e-06, "loss": 0.786, "step": 22123 }, { "epoch": 0.42, "learning_rate": 3.2771612037726284e-06, "loss": 0.9933, "step": 22124 }, { "epoch": 0.42, "learning_rate": 3.2770160056713067e-06, "loss": 0.941, "step": 22125 }, { "epoch": 0.42, "learning_rate": 3.2768708046686316e-06, "loss": 0.8281, "step": 22126 }, { "epoch": 0.42, "learning_rate": 3.276725600765144e-06, "loss": 1.1631, "step": 22127 }, { "epoch": 0.42, "learning_rate": 3.276580393961387e-06, "loss": 0.978, "step": 22128 }, { "epoch": 0.42, "learning_rate": 3.2764351842579027e-06, "loss": 0.8229, "step": 22129 }, { "epoch": 0.42, "learning_rate": 3.2762899716552325e-06, "loss": 0.9227, "step": 22130 }, { "epoch": 0.42, "learning_rate": 3.27614475615392e-06, "loss": 1.1366, "step": 22131 }, { "epoch": 0.42, "learning_rate": 3.2759995377545073e-06, "loss": 1.0908, "step": 22132 }, { "epoch": 0.42, "learning_rate": 3.2758543164575356e-06, "loss": 1.0585, "step": 22133 }, { "epoch": 0.42, "learning_rate": 3.2757090922635477e-06, "loss": 0.9759, "step": 22134 }, { "epoch": 0.42, "learning_rate": 3.275563865173086e-06, "loss": 0.872, "step": 22135 }, { "epoch": 0.42, "learning_rate": 3.2754186351866924e-06, "loss": 0.7269, "step": 22136 }, { "epoch": 0.42, "learning_rate": 3.2752734023049095e-06, "loss": 1.0559, "step": 22137 }, { "epoch": 0.42, "learning_rate": 3.2751281665282793e-06, "loss": 0.8757, "step": 22138 }, { "epoch": 0.42, "learning_rate": 3.2749829278573443e-06, "loss": 0.9718, "step": 22139 }, { "epoch": 0.42, "learning_rate": 3.2748376862926466e-06, "loss": 0.904, "step": 22140 }, { "epoch": 0.42, "learning_rate": 3.274692441834729e-06, "loss": 0.7866, "step": 22141 }, { "epoch": 0.42, "learning_rate": 3.274547194484134e-06, "loss": 0.8928, "step": 22142 }, { "epoch": 0.42, "learning_rate": 3.2744019442414025e-06, "loss": 0.8459, "step": 22143 }, { "epoch": 0.42, "learning_rate": 3.2742566911070788e-06, "loss": 1.1136, "step": 22144 }, { "epoch": 0.42, "learning_rate": 3.2741114350817037e-06, "loss": 0.9029, "step": 22145 }, { "epoch": 0.42, "learning_rate": 3.2739661761658207e-06, "loss": 1.0911, "step": 22146 }, { "epoch": 0.42, "learning_rate": 3.273820914359972e-06, "loss": 1.0745, "step": 22147 }, { "epoch": 0.42, "learning_rate": 3.273675649664699e-06, "loss": 0.7857, "step": 22148 }, { "epoch": 0.42, "learning_rate": 3.273530382080545e-06, "loss": 1.0687, "step": 22149 }, { "epoch": 0.42, "learning_rate": 3.2733851116080534e-06, "loss": 0.9099, "step": 22150 }, { "epoch": 0.42, "learning_rate": 3.2732398382477636e-06, "loss": 0.7439, "step": 22151 }, { "epoch": 0.42, "learning_rate": 3.2730945620002207e-06, "loss": 0.7699, "step": 22152 }, { "epoch": 0.42, "learning_rate": 3.2729492828659674e-06, "loss": 0.9598, "step": 22153 }, { "epoch": 0.42, "learning_rate": 3.2728040008455442e-06, "loss": 0.8482, "step": 22154 }, { "epoch": 0.42, "learning_rate": 3.272658715939495e-06, "loss": 0.9888, "step": 22155 }, { "epoch": 0.42, "learning_rate": 3.2725134281483616e-06, "loss": 0.8977, "step": 22156 }, { "epoch": 0.42, "learning_rate": 3.272368137472687e-06, "loss": 0.9632, "step": 22157 }, { "epoch": 0.42, "learning_rate": 3.272222843913013e-06, "loss": 0.818, "step": 22158 }, { "epoch": 0.42, "learning_rate": 3.272077547469883e-06, "loss": 1.0266, "step": 22159 }, { "epoch": 0.42, "learning_rate": 3.2719322481438385e-06, "loss": 0.9405, "step": 22160 }, { "epoch": 0.42, "learning_rate": 3.271786945935423e-06, "loss": 0.9928, "step": 22161 }, { "epoch": 0.42, "learning_rate": 3.271641640845179e-06, "loss": 1.0312, "step": 22162 }, { "epoch": 0.42, "learning_rate": 3.2714963328736486e-06, "loss": 1.0535, "step": 22163 }, { "epoch": 0.42, "learning_rate": 3.2713510220213746e-06, "loss": 0.9148, "step": 22164 }, { "epoch": 0.42, "learning_rate": 3.2712057082888993e-06, "loss": 0.8959, "step": 22165 }, { "epoch": 0.42, "learning_rate": 3.2710603916767652e-06, "loss": 0.9669, "step": 22166 }, { "epoch": 0.42, "learning_rate": 3.270915072185516e-06, "loss": 0.989, "step": 22167 }, { "epoch": 0.42, "learning_rate": 3.270769749815693e-06, "loss": 1.1997, "step": 22168 }, { "epoch": 0.42, "learning_rate": 3.2706244245678396e-06, "loss": 0.908, "step": 22169 }, { "epoch": 0.42, "learning_rate": 3.2704790964424987e-06, "loss": 0.8143, "step": 22170 }, { "epoch": 0.42, "learning_rate": 3.270333765440212e-06, "loss": 0.9722, "step": 22171 }, { "epoch": 0.42, "learning_rate": 3.2701884315615224e-06, "loss": 1.0662, "step": 22172 }, { "epoch": 0.42, "learning_rate": 3.270043094806973e-06, "loss": 0.8675, "step": 22173 }, { "epoch": 0.42, "learning_rate": 3.2698977551771068e-06, "loss": 1.1552, "step": 22174 }, { "epoch": 0.42, "learning_rate": 3.2697524126724656e-06, "loss": 1.0782, "step": 22175 }, { "epoch": 0.42, "learning_rate": 3.269607067293592e-06, "loss": 0.8701, "step": 22176 }, { "epoch": 0.42, "learning_rate": 3.2694617190410306e-06, "loss": 0.8725, "step": 22177 }, { "epoch": 0.42, "learning_rate": 3.269316367915321e-06, "loss": 0.8655, "step": 22178 }, { "epoch": 0.42, "learning_rate": 3.2691710139170086e-06, "loss": 0.9163, "step": 22179 }, { "epoch": 0.42, "learning_rate": 3.269025657046635e-06, "loss": 0.9235, "step": 22180 }, { "epoch": 0.42, "learning_rate": 3.2688802973047436e-06, "loss": 1.0241, "step": 22181 }, { "epoch": 0.42, "learning_rate": 3.268734934691876e-06, "loss": 1.1185, "step": 22182 }, { "epoch": 0.42, "learning_rate": 3.268589569208577e-06, "loss": 1.0512, "step": 22183 }, { "epoch": 0.42, "learning_rate": 3.268444200855387e-06, "loss": 1.1852, "step": 22184 }, { "epoch": 0.42, "learning_rate": 3.26829882963285e-06, "loss": 0.9574, "step": 22185 }, { "epoch": 0.42, "learning_rate": 3.2681534555415083e-06, "loss": 0.7118, "step": 22186 }, { "epoch": 0.42, "learning_rate": 3.268008078581906e-06, "loss": 1.0613, "step": 22187 }, { "epoch": 0.42, "learning_rate": 3.267862698754585e-06, "loss": 1.0168, "step": 22188 }, { "epoch": 0.42, "learning_rate": 3.2677173160600883e-06, "loss": 0.8774, "step": 22189 }, { "epoch": 0.42, "learning_rate": 3.267571930498958e-06, "loss": 0.7831, "step": 22190 }, { "epoch": 0.42, "learning_rate": 3.2674265420717375e-06, "loss": 0.8524, "step": 22191 }, { "epoch": 0.42, "learning_rate": 3.2672811507789714e-06, "loss": 0.7881, "step": 22192 }, { "epoch": 0.42, "learning_rate": 3.2671357566211993e-06, "loss": 0.8906, "step": 22193 }, { "epoch": 0.42, "learning_rate": 3.2669903595989667e-06, "loss": 1.0203, "step": 22194 }, { "epoch": 0.42, "learning_rate": 3.2668449597128154e-06, "loss": 0.6671, "step": 22195 }, { "epoch": 0.42, "learning_rate": 3.2666995569632887e-06, "loss": 0.8754, "step": 22196 }, { "epoch": 0.42, "learning_rate": 3.266554151350929e-06, "loss": 0.985, "step": 22197 }, { "epoch": 0.42, "learning_rate": 3.2664087428762805e-06, "loss": 0.896, "step": 22198 }, { "epoch": 0.42, "learning_rate": 3.266263331539884e-06, "loss": 1.0135, "step": 22199 }, { "epoch": 0.42, "learning_rate": 3.266117917342284e-06, "loss": 1.0902, "step": 22200 }, { "epoch": 0.42, "learning_rate": 3.2659725002840236e-06, "loss": 0.8188, "step": 22201 }, { "epoch": 0.42, "learning_rate": 3.2658270803656456e-06, "loss": 0.7034, "step": 22202 }, { "epoch": 0.42, "learning_rate": 3.265681657587692e-06, "loss": 0.7711, "step": 22203 }, { "epoch": 0.42, "learning_rate": 3.2655362319507074e-06, "loss": 0.8473, "step": 22204 }, { "epoch": 0.42, "learning_rate": 3.2653908034552335e-06, "loss": 0.9607, "step": 22205 }, { "epoch": 0.42, "learning_rate": 3.265245372101814e-06, "loss": 0.9797, "step": 22206 }, { "epoch": 0.42, "learning_rate": 3.265099937890991e-06, "loss": 1.0001, "step": 22207 }, { "epoch": 0.42, "learning_rate": 3.264954500823309e-06, "loss": 0.9068, "step": 22208 }, { "epoch": 0.42, "learning_rate": 3.26480906089931e-06, "loss": 1.0771, "step": 22209 }, { "epoch": 0.42, "learning_rate": 3.2646636181195377e-06, "loss": 0.805, "step": 22210 }, { "epoch": 0.42, "learning_rate": 3.2645181724845356e-06, "loss": 0.9804, "step": 22211 }, { "epoch": 0.42, "learning_rate": 3.2643727239948447e-06, "loss": 1.1664, "step": 22212 }, { "epoch": 0.42, "learning_rate": 3.2642272726510103e-06, "loss": 1.0545, "step": 22213 }, { "epoch": 0.42, "learning_rate": 3.2640818184535744e-06, "loss": 1.0029, "step": 22214 }, { "epoch": 0.42, "learning_rate": 3.2639363614030804e-06, "loss": 0.9785, "step": 22215 }, { "epoch": 0.42, "learning_rate": 3.2637909015000716e-06, "loss": 0.8172, "step": 22216 }, { "epoch": 0.42, "learning_rate": 3.263645438745091e-06, "loss": 0.9973, "step": 22217 }, { "epoch": 0.42, "learning_rate": 3.2634999731386826e-06, "loss": 1.2104, "step": 22218 }, { "epoch": 0.42, "learning_rate": 3.2633545046813873e-06, "loss": 1.1187, "step": 22219 }, { "epoch": 0.42, "learning_rate": 3.2632090333737503e-06, "loss": 0.7348, "step": 22220 }, { "epoch": 0.42, "learning_rate": 3.263063559216314e-06, "loss": 1.0175, "step": 22221 }, { "epoch": 0.42, "learning_rate": 3.262918082209622e-06, "loss": 0.7535, "step": 22222 }, { "epoch": 0.42, "learning_rate": 3.2627726023542167e-06, "loss": 0.8559, "step": 22223 }, { "epoch": 0.42, "learning_rate": 3.2626271196506426e-06, "loss": 1.0287, "step": 22224 }, { "epoch": 0.42, "learning_rate": 3.262481634099442e-06, "loss": 1.0566, "step": 22225 }, { "epoch": 0.42, "learning_rate": 3.262336145701158e-06, "loss": 0.8685, "step": 22226 }, { "epoch": 0.42, "learning_rate": 3.262190654456335e-06, "loss": 0.8271, "step": 22227 }, { "epoch": 0.42, "learning_rate": 3.2620451603655144e-06, "loss": 0.9229, "step": 22228 }, { "epoch": 0.42, "learning_rate": 3.261899663429241e-06, "loss": 0.7485, "step": 22229 }, { "epoch": 0.42, "learning_rate": 3.2617541636480582e-06, "loss": 1.0708, "step": 22230 }, { "epoch": 0.42, "learning_rate": 3.2616086610225084e-06, "loss": 1.1358, "step": 22231 }, { "epoch": 0.42, "learning_rate": 3.2614631555531344e-06, "loss": 0.9104, "step": 22232 }, { "epoch": 0.42, "learning_rate": 3.2613176472404817e-06, "loss": 0.8751, "step": 22233 }, { "epoch": 0.42, "learning_rate": 3.261172136085091e-06, "loss": 0.7437, "step": 22234 }, { "epoch": 0.42, "learning_rate": 3.261026622087507e-06, "loss": 0.9991, "step": 22235 }, { "epoch": 0.42, "learning_rate": 3.2608811052482738e-06, "loss": 1.0195, "step": 22236 }, { "epoch": 0.42, "learning_rate": 3.2607355855679332e-06, "loss": 1.1669, "step": 22237 }, { "epoch": 0.42, "learning_rate": 3.2605900630470296e-06, "loss": 0.8783, "step": 22238 }, { "epoch": 0.42, "learning_rate": 3.260444537686106e-06, "loss": 0.9048, "step": 22239 }, { "epoch": 0.42, "learning_rate": 3.2602990094857057e-06, "loss": 0.9417, "step": 22240 }, { "epoch": 0.42, "learning_rate": 3.2601534784463717e-06, "loss": 1.0697, "step": 22241 }, { "epoch": 0.42, "learning_rate": 3.260007944568649e-06, "loss": 0.8014, "step": 22242 }, { "epoch": 0.42, "learning_rate": 3.2598624078530787e-06, "loss": 1.1132, "step": 22243 }, { "epoch": 0.42, "learning_rate": 3.2597168683002064e-06, "loss": 1.0888, "step": 22244 }, { "epoch": 0.42, "learning_rate": 3.2595713259105746e-06, "loss": 0.7348, "step": 22245 }, { "epoch": 0.42, "learning_rate": 3.259425780684726e-06, "loss": 0.8736, "step": 22246 }, { "epoch": 0.42, "learning_rate": 3.2592802326232055e-06, "loss": 0.8401, "step": 22247 }, { "epoch": 0.42, "learning_rate": 3.259134681726556e-06, "loss": 0.7674, "step": 22248 }, { "epoch": 0.42, "learning_rate": 3.25898912799532e-06, "loss": 0.9533, "step": 22249 }, { "epoch": 0.42, "learning_rate": 3.2588435714300427e-06, "loss": 1.1418, "step": 22250 }, { "epoch": 0.42, "learning_rate": 3.2586980120312668e-06, "loss": 0.935, "step": 22251 }, { "epoch": 0.42, "learning_rate": 3.2585524497995354e-06, "loss": 0.6707, "step": 22252 }, { "epoch": 0.42, "learning_rate": 3.2584068847353923e-06, "loss": 0.9528, "step": 22253 }, { "epoch": 0.42, "learning_rate": 3.2582613168393818e-06, "loss": 0.7909, "step": 22254 }, { "epoch": 0.42, "learning_rate": 3.258115746112046e-06, "loss": 0.8351, "step": 22255 }, { "epoch": 0.42, "learning_rate": 3.2579701725539293e-06, "loss": 1.1599, "step": 22256 }, { "epoch": 0.42, "learning_rate": 3.2578245961655757e-06, "loss": 0.7941, "step": 22257 }, { "epoch": 0.42, "learning_rate": 3.257679016947528e-06, "loss": 0.9633, "step": 22258 }, { "epoch": 0.42, "learning_rate": 3.25753343490033e-06, "loss": 0.8806, "step": 22259 }, { "epoch": 0.42, "learning_rate": 3.257387850024526e-06, "loss": 0.7607, "step": 22260 }, { "epoch": 0.42, "learning_rate": 3.2572422623206584e-06, "loss": 0.8456, "step": 22261 }, { "epoch": 0.42, "learning_rate": 3.2570966717892717e-06, "loss": 1.0085, "step": 22262 }, { "epoch": 0.42, "learning_rate": 3.256951078430909e-06, "loss": 0.8475, "step": 22263 }, { "epoch": 0.42, "learning_rate": 3.2568054822461135e-06, "loss": 0.7371, "step": 22264 }, { "epoch": 0.42, "learning_rate": 3.2566598832354306e-06, "loss": 0.8506, "step": 22265 }, { "epoch": 0.42, "learning_rate": 3.2565142813994032e-06, "loss": 0.954, "step": 22266 }, { "epoch": 0.42, "learning_rate": 3.256368676738574e-06, "loss": 0.8325, "step": 22267 }, { "epoch": 0.42, "learning_rate": 3.256223069253487e-06, "loss": 1.0545, "step": 22268 }, { "epoch": 0.42, "learning_rate": 3.2560774589446868e-06, "loss": 0.9985, "step": 22269 }, { "epoch": 0.42, "learning_rate": 3.2559318458127165e-06, "loss": 0.7742, "step": 22270 }, { "epoch": 0.42, "learning_rate": 3.2557862298581195e-06, "loss": 1.0341, "step": 22271 }, { "epoch": 0.42, "learning_rate": 3.2556406110814404e-06, "loss": 0.7616, "step": 22272 }, { "epoch": 0.42, "learning_rate": 3.255494989483222e-06, "loss": 0.8344, "step": 22273 }, { "epoch": 0.42, "learning_rate": 3.255349365064009e-06, "loss": 1.0959, "step": 22274 }, { "epoch": 0.42, "learning_rate": 3.2552037378243444e-06, "loss": 1.2023, "step": 22275 }, { "epoch": 0.42, "learning_rate": 3.2550581077647726e-06, "loss": 0.7457, "step": 22276 }, { "epoch": 0.42, "learning_rate": 3.254912474885835e-06, "loss": 0.8362, "step": 22277 }, { "epoch": 0.42, "learning_rate": 3.2547668391880793e-06, "loss": 1.0901, "step": 22278 }, { "epoch": 0.42, "learning_rate": 3.2546212006720473e-06, "loss": 0.6451, "step": 22279 }, { "epoch": 0.42, "learning_rate": 3.254475559338282e-06, "loss": 1.0924, "step": 22280 }, { "epoch": 0.42, "learning_rate": 3.254329915187329e-06, "loss": 0.8996, "step": 22281 }, { "epoch": 0.42, "learning_rate": 3.254184268219731e-06, "loss": 1.01, "step": 22282 }, { "epoch": 0.42, "learning_rate": 3.2540386184360316e-06, "loss": 0.993, "step": 22283 }, { "epoch": 0.42, "learning_rate": 3.253892965836776e-06, "loss": 0.9724, "step": 22284 }, { "epoch": 0.42, "learning_rate": 3.2537473104225057e-06, "loss": 0.8885, "step": 22285 }, { "epoch": 0.42, "learning_rate": 3.253601652193767e-06, "loss": 1.0293, "step": 22286 }, { "epoch": 0.42, "learning_rate": 3.253455991151103e-06, "loss": 1.0743, "step": 22287 }, { "epoch": 0.42, "learning_rate": 3.2533103272950573e-06, "loss": 1.1072, "step": 22288 }, { "epoch": 0.42, "learning_rate": 3.2531646606261735e-06, "loss": 0.7388, "step": 22289 }, { "epoch": 0.42, "learning_rate": 3.253018991144996e-06, "loss": 0.8734, "step": 22290 }, { "epoch": 0.42, "learning_rate": 3.2528733188520688e-06, "loss": 0.9031, "step": 22291 }, { "epoch": 0.42, "learning_rate": 3.2527276437479362e-06, "loss": 0.7798, "step": 22292 }, { "epoch": 0.42, "learning_rate": 3.2525819658331413e-06, "loss": 0.9615, "step": 22293 }, { "epoch": 0.42, "learning_rate": 3.2524362851082286e-06, "loss": 0.9789, "step": 22294 }, { "epoch": 0.42, "learning_rate": 3.2522906015737414e-06, "loss": 1.0118, "step": 22295 }, { "epoch": 0.42, "learning_rate": 3.2521449152302254e-06, "loss": 0.8657, "step": 22296 }, { "epoch": 0.42, "learning_rate": 3.2519992260782217e-06, "loss": 0.9988, "step": 22297 }, { "epoch": 0.42, "learning_rate": 3.2518535341182767e-06, "loss": 0.7842, "step": 22298 }, { "epoch": 0.42, "learning_rate": 3.2517078393509337e-06, "loss": 0.9578, "step": 22299 }, { "epoch": 0.42, "learning_rate": 3.251562141776737e-06, "loss": 1.2827, "step": 22300 }, { "epoch": 0.42, "learning_rate": 3.2514164413962295e-06, "loss": 1.0543, "step": 22301 }, { "epoch": 0.42, "learning_rate": 3.2512707382099567e-06, "loss": 0.9483, "step": 22302 }, { "epoch": 0.42, "learning_rate": 3.251125032218462e-06, "loss": 0.7562, "step": 22303 }, { "epoch": 0.42, "learning_rate": 3.2509793234222886e-06, "loss": 0.8787, "step": 22304 }, { "epoch": 0.42, "learning_rate": 3.250833611821982e-06, "loss": 0.9948, "step": 22305 }, { "epoch": 0.42, "learning_rate": 3.2506878974180854e-06, "loss": 1.1147, "step": 22306 }, { "epoch": 0.42, "learning_rate": 3.2505421802111435e-06, "loss": 0.9694, "step": 22307 }, { "epoch": 0.42, "learning_rate": 3.250396460201701e-06, "loss": 0.7715, "step": 22308 }, { "epoch": 0.42, "learning_rate": 3.2502507373903005e-06, "loss": 0.8945, "step": 22309 }, { "epoch": 0.42, "learning_rate": 3.250105011777486e-06, "loss": 0.8534, "step": 22310 }, { "epoch": 0.42, "learning_rate": 3.2499592833638028e-06, "loss": 0.7982, "step": 22311 }, { "epoch": 0.42, "learning_rate": 3.2498135521497946e-06, "loss": 0.9774, "step": 22312 }, { "epoch": 0.42, "learning_rate": 3.249667818136006e-06, "loss": 0.9475, "step": 22313 }, { "epoch": 0.42, "learning_rate": 3.249522081322981e-06, "loss": 1.0695, "step": 22314 }, { "epoch": 0.42, "learning_rate": 3.2493763417112627e-06, "loss": 0.8659, "step": 22315 }, { "epoch": 0.42, "learning_rate": 3.2492305993013962e-06, "loss": 0.9672, "step": 22316 }, { "epoch": 0.42, "learning_rate": 3.249084854093926e-06, "loss": 0.7813, "step": 22317 }, { "epoch": 0.42, "learning_rate": 3.248939106089396e-06, "loss": 0.9476, "step": 22318 }, { "epoch": 0.42, "learning_rate": 3.2487933552883493e-06, "loss": 1.2653, "step": 22319 }, { "epoch": 0.42, "learning_rate": 3.2486476016913325e-06, "loss": 0.8789, "step": 22320 }, { "epoch": 0.42, "learning_rate": 3.248501845298888e-06, "loss": 0.9713, "step": 22321 }, { "epoch": 0.42, "learning_rate": 3.2483560861115604e-06, "loss": 0.893, "step": 22322 }, { "epoch": 0.42, "learning_rate": 3.2482103241298945e-06, "loss": 0.8438, "step": 22323 }, { "epoch": 0.42, "learning_rate": 3.248064559354434e-06, "loss": 1.1481, "step": 22324 }, { "epoch": 0.42, "learning_rate": 3.2479187917857234e-06, "loss": 1.0224, "step": 22325 }, { "epoch": 0.42, "learning_rate": 3.247773021424307e-06, "loss": 0.9146, "step": 22326 }, { "epoch": 0.42, "learning_rate": 3.247627248270729e-06, "loss": 0.9515, "step": 22327 }, { "epoch": 0.42, "learning_rate": 3.2474814723255333e-06, "loss": 0.9704, "step": 22328 }, { "epoch": 0.42, "learning_rate": 3.247335693589266e-06, "loss": 0.903, "step": 22329 }, { "epoch": 0.42, "learning_rate": 3.247189912062469e-06, "loss": 1.0435, "step": 22330 }, { "epoch": 0.42, "learning_rate": 3.2470441277456877e-06, "loss": 1.0933, "step": 22331 }, { "epoch": 0.42, "learning_rate": 3.246898340639467e-06, "loss": 1.0218, "step": 22332 }, { "epoch": 0.42, "learning_rate": 3.2467525507443505e-06, "loss": 0.8438, "step": 22333 }, { "epoch": 0.42, "learning_rate": 3.2466067580608836e-06, "loss": 0.8188, "step": 22334 }, { "epoch": 0.42, "learning_rate": 3.2464609625896093e-06, "loss": 1.0745, "step": 22335 }, { "epoch": 0.42, "learning_rate": 3.2463151643310727e-06, "loss": 0.8836, "step": 22336 }, { "epoch": 0.42, "learning_rate": 3.246169363285818e-06, "loss": 0.9067, "step": 22337 }, { "epoch": 0.42, "learning_rate": 3.2460235594543903e-06, "loss": 0.9858, "step": 22338 }, { "epoch": 0.42, "learning_rate": 3.245877752837333e-06, "loss": 0.6064, "step": 22339 }, { "epoch": 0.42, "learning_rate": 3.245731943435191e-06, "loss": 0.9796, "step": 22340 }, { "epoch": 0.42, "learning_rate": 3.2455861312485094e-06, "loss": 0.9754, "step": 22341 }, { "epoch": 0.42, "learning_rate": 3.2454403162778315e-06, "loss": 0.911, "step": 22342 }, { "epoch": 0.42, "learning_rate": 3.245294498523703e-06, "loss": 1.1802, "step": 22343 }, { "epoch": 0.42, "learning_rate": 3.245148677986667e-06, "loss": 0.9325, "step": 22344 }, { "epoch": 0.42, "learning_rate": 3.2450028546672687e-06, "loss": 0.8846, "step": 22345 }, { "epoch": 0.42, "learning_rate": 3.244857028566053e-06, "loss": 0.9486, "step": 22346 }, { "epoch": 0.42, "learning_rate": 3.2447111996835633e-06, "loss": 0.8592, "step": 22347 }, { "epoch": 0.42, "learning_rate": 3.2445653680203453e-06, "loss": 0.8137, "step": 22348 }, { "epoch": 0.42, "learning_rate": 3.2444195335769436e-06, "loss": 1.1419, "step": 22349 }, { "epoch": 0.42, "learning_rate": 3.2442736963539013e-06, "loss": 1.1374, "step": 22350 }, { "epoch": 0.42, "learning_rate": 3.244127856351764e-06, "loss": 0.7207, "step": 22351 }, { "epoch": 0.42, "learning_rate": 3.2439820135710765e-06, "loss": 0.9902, "step": 22352 }, { "epoch": 0.42, "learning_rate": 3.243836168012382e-06, "loss": 0.9154, "step": 22353 }, { "epoch": 0.42, "learning_rate": 3.243690319676227e-06, "loss": 0.7289, "step": 22354 }, { "epoch": 0.42, "learning_rate": 3.2435444685631553e-06, "loss": 0.83, "step": 22355 }, { "epoch": 0.42, "learning_rate": 3.2433986146737105e-06, "loss": 1.0419, "step": 22356 }, { "epoch": 0.42, "learning_rate": 3.243252758008439e-06, "loss": 0.8645, "step": 22357 }, { "epoch": 0.42, "learning_rate": 3.2431068985678845e-06, "loss": 0.761, "step": 22358 }, { "epoch": 0.42, "learning_rate": 3.242961036352591e-06, "loss": 1.0834, "step": 22359 }, { "epoch": 0.42, "learning_rate": 3.2428151713631033e-06, "loss": 0.8877, "step": 22360 }, { "epoch": 0.42, "learning_rate": 3.2426693035999674e-06, "loss": 0.8649, "step": 22361 }, { "epoch": 0.42, "learning_rate": 3.2425234330637266e-06, "loss": 0.8514, "step": 22362 }, { "epoch": 0.42, "learning_rate": 3.2423775597549263e-06, "loss": 1.011, "step": 22363 }, { "epoch": 0.42, "learning_rate": 3.2422316836741115e-06, "loss": 0.905, "step": 22364 }, { "epoch": 0.42, "learning_rate": 3.2420858048218253e-06, "loss": 0.9058, "step": 22365 }, { "epoch": 0.42, "learning_rate": 3.241939923198614e-06, "loss": 0.9285, "step": 22366 }, { "epoch": 0.42, "learning_rate": 3.2417940388050216e-06, "loss": 0.8483, "step": 22367 }, { "epoch": 0.42, "learning_rate": 3.241648151641593e-06, "loss": 0.9106, "step": 22368 }, { "epoch": 0.42, "learning_rate": 3.2415022617088732e-06, "loss": 1.0331, "step": 22369 }, { "epoch": 0.42, "learning_rate": 3.241356369007407e-06, "loss": 0.8767, "step": 22370 }, { "epoch": 0.42, "learning_rate": 3.241210473537738e-06, "loss": 1.1422, "step": 22371 }, { "epoch": 0.42, "learning_rate": 3.241064575300412e-06, "loss": 0.9062, "step": 22372 }, { "epoch": 0.42, "learning_rate": 3.240918674295974e-06, "loss": 0.8327, "step": 22373 }, { "epoch": 0.42, "learning_rate": 3.2407727705249682e-06, "loss": 1.0002, "step": 22374 }, { "epoch": 0.42, "learning_rate": 3.240626863987939e-06, "loss": 1.0103, "step": 22375 }, { "epoch": 0.42, "learning_rate": 3.2404809546854333e-06, "loss": 0.9936, "step": 22376 }, { "epoch": 0.42, "learning_rate": 3.2403350426179935e-06, "loss": 0.8343, "step": 22377 }, { "epoch": 0.42, "learning_rate": 3.240189127786165e-06, "loss": 1.0102, "step": 22378 }, { "epoch": 0.42, "learning_rate": 3.240043210190494e-06, "loss": 0.9711, "step": 22379 }, { "epoch": 0.42, "learning_rate": 3.2398972898315233e-06, "loss": 0.8496, "step": 22380 }, { "epoch": 0.42, "learning_rate": 3.239751366709799e-06, "loss": 1.2479, "step": 22381 }, { "epoch": 0.42, "learning_rate": 3.2396054408258657e-06, "loss": 1.0613, "step": 22382 }, { "epoch": 0.42, "learning_rate": 3.239459512180269e-06, "loss": 0.9893, "step": 22383 }, { "epoch": 0.42, "learning_rate": 3.2393135807735526e-06, "loss": 0.7622, "step": 22384 }, { "epoch": 0.42, "learning_rate": 3.2391676466062626e-06, "loss": 0.7868, "step": 22385 }, { "epoch": 0.42, "learning_rate": 3.2390217096789428e-06, "loss": 1.0594, "step": 22386 }, { "epoch": 0.42, "learning_rate": 3.2388757699921387e-06, "loss": 0.8925, "step": 22387 }, { "epoch": 0.42, "learning_rate": 3.2387298275463946e-06, "loss": 1.0506, "step": 22388 }, { "epoch": 0.42, "learning_rate": 3.2385838823422568e-06, "loss": 0.8535, "step": 22389 }, { "epoch": 0.42, "learning_rate": 3.2384379343802686e-06, "loss": 0.8423, "step": 22390 }, { "epoch": 0.42, "learning_rate": 3.2382919836609765e-06, "loss": 0.6226, "step": 22391 }, { "epoch": 0.42, "learning_rate": 3.2381460301849245e-06, "loss": 0.8595, "step": 22392 }, { "epoch": 0.42, "learning_rate": 3.238000073952658e-06, "loss": 1.1375, "step": 22393 }, { "epoch": 0.42, "learning_rate": 3.237854114964722e-06, "loss": 0.8529, "step": 22394 }, { "epoch": 0.42, "learning_rate": 3.2377081532216602e-06, "loss": 0.8804, "step": 22395 }, { "epoch": 0.42, "learning_rate": 3.23756218872402e-06, "loss": 0.9383, "step": 22396 }, { "epoch": 0.42, "learning_rate": 3.2374162214723454e-06, "loss": 0.9405, "step": 22397 }, { "epoch": 0.42, "learning_rate": 3.2372702514671807e-06, "loss": 0.8161, "step": 22398 }, { "epoch": 0.42, "learning_rate": 3.2371242787090713e-06, "loss": 0.8192, "step": 22399 }, { "epoch": 0.42, "learning_rate": 3.236978303198563e-06, "loss": 1.1422, "step": 22400 }, { "epoch": 0.42, "learning_rate": 3.2368323249362e-06, "loss": 0.8371, "step": 22401 }, { "epoch": 0.42, "learning_rate": 3.2366863439225264e-06, "loss": 0.8649, "step": 22402 }, { "epoch": 0.42, "learning_rate": 3.2365403601580904e-06, "loss": 0.8225, "step": 22403 }, { "epoch": 0.42, "learning_rate": 3.2363943736434345e-06, "loss": 0.8374, "step": 22404 }, { "epoch": 0.42, "learning_rate": 3.2362483843791046e-06, "loss": 1.0225, "step": 22405 }, { "epoch": 0.42, "learning_rate": 3.2361023923656464e-06, "loss": 1.0286, "step": 22406 }, { "epoch": 0.42, "learning_rate": 3.235956397603604e-06, "loss": 1.0319, "step": 22407 }, { "epoch": 0.42, "learning_rate": 3.235810400093523e-06, "loss": 1.0483, "step": 22408 }, { "epoch": 0.42, "learning_rate": 3.235664399835948e-06, "loss": 0.9756, "step": 22409 }, { "epoch": 0.42, "learning_rate": 3.235518396831426e-06, "loss": 0.9842, "step": 22410 }, { "epoch": 0.42, "learning_rate": 3.2353723910804998e-06, "loss": 0.8677, "step": 22411 }, { "epoch": 0.42, "learning_rate": 3.235226382583716e-06, "loss": 0.8822, "step": 22412 }, { "epoch": 0.42, "learning_rate": 3.235080371341619e-06, "loss": 1.0666, "step": 22413 }, { "epoch": 0.42, "learning_rate": 3.234934357354755e-06, "loss": 0.7369, "step": 22414 }, { "epoch": 0.42, "learning_rate": 3.234788340623668e-06, "loss": 1.0693, "step": 22415 }, { "epoch": 0.42, "learning_rate": 3.234642321148904e-06, "loss": 0.7521, "step": 22416 }, { "epoch": 0.42, "learning_rate": 3.2344962989310087e-06, "loss": 1.0714, "step": 22417 }, { "epoch": 0.42, "learning_rate": 3.234350273970527e-06, "loss": 0.9359, "step": 22418 }, { "epoch": 0.42, "learning_rate": 3.2342042462680027e-06, "loss": 1.0239, "step": 22419 }, { "epoch": 0.42, "learning_rate": 3.234058215823983e-06, "loss": 0.9117, "step": 22420 }, { "epoch": 0.42, "learning_rate": 3.233912182639013e-06, "loss": 0.8503, "step": 22421 }, { "epoch": 0.42, "learning_rate": 3.2337661467136368e-06, "loss": 1.0027, "step": 22422 }, { "epoch": 0.42, "learning_rate": 3.2336201080483994e-06, "loss": 0.7072, "step": 22423 }, { "epoch": 0.42, "learning_rate": 3.233474066643848e-06, "loss": 0.8553, "step": 22424 }, { "epoch": 0.42, "learning_rate": 3.233328022500527e-06, "loss": 1.0955, "step": 22425 }, { "epoch": 0.42, "learning_rate": 3.233181975618981e-06, "loss": 0.6811, "step": 22426 }, { "epoch": 0.42, "learning_rate": 3.2330359259997568e-06, "loss": 1.0709, "step": 22427 }, { "epoch": 0.42, "learning_rate": 3.232889873643398e-06, "loss": 0.7787, "step": 22428 }, { "epoch": 0.42, "learning_rate": 3.232743818550452e-06, "loss": 0.976, "step": 22429 }, { "epoch": 0.42, "learning_rate": 3.232597760721462e-06, "loss": 0.9915, "step": 22430 }, { "epoch": 0.42, "learning_rate": 3.2324517001569748e-06, "loss": 0.8868, "step": 22431 }, { "epoch": 0.42, "learning_rate": 3.232305636857536e-06, "loss": 0.9915, "step": 22432 }, { "epoch": 0.42, "learning_rate": 3.23215957082369e-06, "loss": 0.9501, "step": 22433 }, { "epoch": 0.42, "learning_rate": 3.232013502055982e-06, "loss": 0.9559, "step": 22434 }, { "epoch": 0.42, "learning_rate": 3.2318674305549583e-06, "loss": 0.8523, "step": 22435 }, { "epoch": 0.42, "learning_rate": 3.2317213563211643e-06, "loss": 0.9893, "step": 22436 }, { "epoch": 0.42, "learning_rate": 3.2315752793551447e-06, "loss": 1.0221, "step": 22437 }, { "epoch": 0.42, "learning_rate": 3.231429199657446e-06, "loss": 0.8596, "step": 22438 }, { "epoch": 0.42, "learning_rate": 3.2312831172286137e-06, "loss": 0.9351, "step": 22439 }, { "epoch": 0.42, "learning_rate": 3.2311370320691915e-06, "loss": 0.8039, "step": 22440 }, { "epoch": 0.42, "learning_rate": 3.2309909441797267e-06, "loss": 1.0042, "step": 22441 }, { "epoch": 0.42, "learning_rate": 3.2308448535607638e-06, "loss": 0.8138, "step": 22442 }, { "epoch": 0.42, "learning_rate": 3.230698760212849e-06, "loss": 1.0668, "step": 22443 }, { "epoch": 0.42, "learning_rate": 3.2305526641365263e-06, "loss": 0.9563, "step": 22444 }, { "epoch": 0.42, "learning_rate": 3.230406565332344e-06, "loss": 0.8012, "step": 22445 }, { "epoch": 0.42, "learning_rate": 3.230260463800845e-06, "loss": 0.6919, "step": 22446 }, { "epoch": 0.42, "learning_rate": 3.230114359542576e-06, "loss": 0.9169, "step": 22447 }, { "epoch": 0.42, "learning_rate": 3.229968252558083e-06, "loss": 0.6898, "step": 22448 }, { "epoch": 0.42, "learning_rate": 3.2298221428479097e-06, "loss": 0.9461, "step": 22449 }, { "epoch": 0.42, "learning_rate": 3.2296760304126036e-06, "loss": 0.9167, "step": 22450 }, { "epoch": 0.42, "learning_rate": 3.2295299152527093e-06, "loss": 0.8996, "step": 22451 }, { "epoch": 0.42, "learning_rate": 3.229383797368773e-06, "loss": 1.0355, "step": 22452 }, { "epoch": 0.42, "learning_rate": 3.2292376767613397e-06, "loss": 1.0344, "step": 22453 }, { "epoch": 0.42, "learning_rate": 3.229091553430956e-06, "loss": 0.9207, "step": 22454 }, { "epoch": 0.42, "learning_rate": 3.2289454273781657e-06, "loss": 0.8809, "step": 22455 }, { "epoch": 0.42, "learning_rate": 3.2287992986035166e-06, "loss": 0.8992, "step": 22456 }, { "epoch": 0.42, "learning_rate": 3.2286531671075517e-06, "loss": 0.9883, "step": 22457 }, { "epoch": 0.42, "learning_rate": 3.2285070328908197e-06, "loss": 0.9918, "step": 22458 }, { "epoch": 0.42, "learning_rate": 3.228360895953864e-06, "loss": 0.7569, "step": 22459 }, { "epoch": 0.42, "learning_rate": 3.2282147562972315e-06, "loss": 0.9572, "step": 22460 }, { "epoch": 0.42, "learning_rate": 3.2280686139214673e-06, "loss": 0.9004, "step": 22461 }, { "epoch": 0.42, "learning_rate": 3.2279224688271173e-06, "loss": 0.9765, "step": 22462 }, { "epoch": 0.42, "learning_rate": 3.227776321014727e-06, "loss": 0.7719, "step": 22463 }, { "epoch": 0.42, "learning_rate": 3.2276301704848423e-06, "loss": 0.7493, "step": 22464 }, { "epoch": 0.42, "learning_rate": 3.2274840172380086e-06, "loss": 0.7814, "step": 22465 }, { "epoch": 0.42, "learning_rate": 3.227337861274772e-06, "loss": 0.7111, "step": 22466 }, { "epoch": 0.42, "learning_rate": 3.227191702595678e-06, "loss": 0.7226, "step": 22467 }, { "epoch": 0.42, "learning_rate": 3.227045541201273e-06, "loss": 0.8031, "step": 22468 }, { "epoch": 0.42, "learning_rate": 3.226899377092102e-06, "loss": 1.0604, "step": 22469 }, { "epoch": 0.42, "learning_rate": 3.2267532102687107e-06, "loss": 0.8517, "step": 22470 }, { "epoch": 0.42, "learning_rate": 3.2266070407316453e-06, "loss": 0.8742, "step": 22471 }, { "epoch": 0.42, "learning_rate": 3.2264608684814513e-06, "loss": 1.0359, "step": 22472 }, { "epoch": 0.42, "learning_rate": 3.2263146935186753e-06, "loss": 0.8767, "step": 22473 }, { "epoch": 0.42, "learning_rate": 3.226168515843862e-06, "loss": 0.988, "step": 22474 }, { "epoch": 0.42, "learning_rate": 3.2260223354575582e-06, "loss": 1.031, "step": 22475 }, { "epoch": 0.42, "learning_rate": 3.225876152360309e-06, "loss": 0.9684, "step": 22476 }, { "epoch": 0.42, "learning_rate": 3.22572996655266e-06, "loss": 0.8509, "step": 22477 }, { "epoch": 0.42, "learning_rate": 3.2255837780351577e-06, "loss": 0.8507, "step": 22478 }, { "epoch": 0.42, "learning_rate": 3.2254375868083484e-06, "loss": 1.0252, "step": 22479 }, { "epoch": 0.42, "learning_rate": 3.2252913928727776e-06, "loss": 0.8905, "step": 22480 }, { "epoch": 0.42, "learning_rate": 3.22514519622899e-06, "loss": 1.0478, "step": 22481 }, { "epoch": 0.42, "learning_rate": 3.224998996877533e-06, "loss": 0.5295, "step": 22482 }, { "epoch": 0.42, "learning_rate": 3.2248527948189524e-06, "loss": 1.001, "step": 22483 }, { "epoch": 0.42, "learning_rate": 3.224706590053793e-06, "loss": 1.3154, "step": 22484 }, { "epoch": 0.42, "learning_rate": 3.224560382582602e-06, "loss": 0.8433, "step": 22485 }, { "epoch": 0.42, "learning_rate": 3.224414172405924e-06, "loss": 0.8727, "step": 22486 }, { "epoch": 0.42, "learning_rate": 3.224267959524306e-06, "loss": 1.0047, "step": 22487 }, { "epoch": 0.42, "learning_rate": 3.224121743938294e-06, "loss": 0.9307, "step": 22488 }, { "epoch": 0.42, "learning_rate": 3.2239755256484334e-06, "loss": 1.0751, "step": 22489 }, { "epoch": 0.42, "learning_rate": 3.2238293046552706e-06, "loss": 0.8214, "step": 22490 }, { "epoch": 0.42, "learning_rate": 3.223683080959351e-06, "loss": 0.7397, "step": 22491 }, { "epoch": 0.42, "learning_rate": 3.223536854561221e-06, "loss": 0.9479, "step": 22492 }, { "epoch": 0.42, "learning_rate": 3.223390625461426e-06, "loss": 1.2072, "step": 22493 }, { "epoch": 0.42, "learning_rate": 3.2232443936605136e-06, "loss": 1.079, "step": 22494 }, { "epoch": 0.42, "learning_rate": 3.2230981591590286e-06, "loss": 0.7024, "step": 22495 }, { "epoch": 0.42, "learning_rate": 3.2229519219575172e-06, "loss": 0.9918, "step": 22496 }, { "epoch": 0.42, "learning_rate": 3.222805682056525e-06, "loss": 0.9302, "step": 22497 }, { "epoch": 0.42, "learning_rate": 3.2226594394565995e-06, "loss": 0.8856, "step": 22498 }, { "epoch": 0.42, "learning_rate": 3.2225131941582845e-06, "loss": 0.8857, "step": 22499 }, { "epoch": 0.42, "learning_rate": 3.222366946162128e-06, "loss": 1.1308, "step": 22500 }, { "epoch": 0.42, "learning_rate": 3.2222206954686765e-06, "loss": 0.9373, "step": 22501 }, { "epoch": 0.42, "learning_rate": 3.2220744420784732e-06, "loss": 0.9675, "step": 22502 }, { "epoch": 0.42, "learning_rate": 3.221928185992067e-06, "loss": 0.7361, "step": 22503 }, { "epoch": 0.42, "learning_rate": 3.2217819272100036e-06, "loss": 0.6595, "step": 22504 }, { "epoch": 0.42, "learning_rate": 3.2216356657328286e-06, "loss": 0.958, "step": 22505 }, { "epoch": 0.42, "learning_rate": 3.2214894015610877e-06, "loss": 1.044, "step": 22506 }, { "epoch": 0.42, "learning_rate": 3.221343134695327e-06, "loss": 1.0724, "step": 22507 }, { "epoch": 0.42, "learning_rate": 3.2211968651360938e-06, "loss": 1.019, "step": 22508 }, { "epoch": 0.42, "learning_rate": 3.221050592883933e-06, "loss": 0.6968, "step": 22509 }, { "epoch": 0.42, "learning_rate": 3.2209043179393924e-06, "loss": 0.8085, "step": 22510 }, { "epoch": 0.42, "learning_rate": 3.2207580403030163e-06, "loss": 1.0425, "step": 22511 }, { "epoch": 0.42, "learning_rate": 3.220611759975352e-06, "loss": 1.0756, "step": 22512 }, { "epoch": 0.42, "learning_rate": 3.2204654769569453e-06, "loss": 1.0574, "step": 22513 }, { "epoch": 0.42, "learning_rate": 3.2203191912483434e-06, "loss": 0.9242, "step": 22514 }, { "epoch": 0.42, "learning_rate": 3.2201729028500906e-06, "loss": 0.9887, "step": 22515 }, { "epoch": 0.42, "learning_rate": 3.2200266117627355e-06, "loss": 0.8416, "step": 22516 }, { "epoch": 0.42, "learning_rate": 3.219880317986822e-06, "loss": 0.9128, "step": 22517 }, { "epoch": 0.42, "learning_rate": 3.219734021522898e-06, "loss": 1.1161, "step": 22518 }, { "epoch": 0.42, "learning_rate": 3.21958772237151e-06, "loss": 1.2368, "step": 22519 }, { "epoch": 0.42, "learning_rate": 3.2194414205332013e-06, "loss": 0.8364, "step": 22520 }, { "epoch": 0.42, "learning_rate": 3.2192951160085223e-06, "loss": 0.9799, "step": 22521 }, { "epoch": 0.42, "learning_rate": 3.219148808798017e-06, "loss": 0.9158, "step": 22522 }, { "epoch": 0.42, "learning_rate": 3.2190024989022315e-06, "loss": 0.8127, "step": 22523 }, { "epoch": 0.42, "learning_rate": 3.218856186321714e-06, "loss": 1.1082, "step": 22524 }, { "epoch": 0.42, "learning_rate": 3.2187098710570084e-06, "loss": 0.9648, "step": 22525 }, { "epoch": 0.42, "learning_rate": 3.2185635531086623e-06, "loss": 1.1718, "step": 22526 }, { "epoch": 0.43, "learning_rate": 3.2184172324772224e-06, "loss": 0.9236, "step": 22527 }, { "epoch": 0.43, "learning_rate": 3.2182709091632343e-06, "loss": 0.7673, "step": 22528 }, { "epoch": 0.43, "learning_rate": 3.218124583167244e-06, "loss": 0.8427, "step": 22529 }, { "epoch": 0.43, "learning_rate": 3.2179782544898e-06, "loss": 0.9379, "step": 22530 }, { "epoch": 0.43, "learning_rate": 3.2178319231314466e-06, "loss": 1.0597, "step": 22531 }, { "epoch": 0.43, "learning_rate": 3.21768558909273e-06, "loss": 0.9892, "step": 22532 }, { "epoch": 0.43, "learning_rate": 3.2175392523741978e-06, "loss": 0.9996, "step": 22533 }, { "epoch": 0.43, "learning_rate": 3.2173929129763965e-06, "loss": 1.0391, "step": 22534 }, { "epoch": 0.43, "learning_rate": 3.2172465708998713e-06, "loss": 0.8872, "step": 22535 }, { "epoch": 0.43, "learning_rate": 3.21710022614517e-06, "loss": 0.7823, "step": 22536 }, { "epoch": 0.43, "learning_rate": 3.2169538787128384e-06, "loss": 1.0434, "step": 22537 }, { "epoch": 0.43, "learning_rate": 3.2168075286034234e-06, "loss": 0.8316, "step": 22538 }, { "epoch": 0.43, "learning_rate": 3.2166611758174706e-06, "loss": 0.8737, "step": 22539 }, { "epoch": 0.43, "learning_rate": 3.216514820355527e-06, "loss": 0.9001, "step": 22540 }, { "epoch": 0.43, "learning_rate": 3.2163684622181385e-06, "loss": 0.9447, "step": 22541 }, { "epoch": 0.43, "learning_rate": 3.2162221014058527e-06, "loss": 0.9242, "step": 22542 }, { "epoch": 0.43, "learning_rate": 3.2160757379192154e-06, "loss": 1.0972, "step": 22543 }, { "epoch": 0.43, "learning_rate": 3.2159293717587737e-06, "loss": 0.8732, "step": 22544 }, { "epoch": 0.43, "learning_rate": 3.2157830029250724e-06, "loss": 0.8723, "step": 22545 }, { "epoch": 0.43, "learning_rate": 3.215636631418661e-06, "loss": 0.8436, "step": 22546 }, { "epoch": 0.43, "learning_rate": 3.2154902572400835e-06, "loss": 0.8386, "step": 22547 }, { "epoch": 0.43, "learning_rate": 3.2153438803898874e-06, "loss": 0.9525, "step": 22548 }, { "epoch": 0.43, "learning_rate": 3.2151975008686187e-06, "loss": 1.1176, "step": 22549 }, { "epoch": 0.43, "learning_rate": 3.2150511186768245e-06, "loss": 0.9094, "step": 22550 }, { "epoch": 0.43, "learning_rate": 3.214904733815052e-06, "loss": 0.9356, "step": 22551 }, { "epoch": 0.43, "learning_rate": 3.214758346283847e-06, "loss": 0.8416, "step": 22552 }, { "epoch": 0.43, "learning_rate": 3.214611956083756e-06, "loss": 0.8695, "step": 22553 }, { "epoch": 0.43, "learning_rate": 3.214465563215326e-06, "loss": 0.9229, "step": 22554 }, { "epoch": 0.43, "learning_rate": 3.2143191676791036e-06, "loss": 0.8728, "step": 22555 }, { "epoch": 0.43, "learning_rate": 3.214172769475635e-06, "loss": 0.9455, "step": 22556 }, { "epoch": 0.43, "learning_rate": 3.214026368605467e-06, "loss": 0.9296, "step": 22557 }, { "epoch": 0.43, "learning_rate": 3.213879965069148e-06, "loss": 0.7377, "step": 22558 }, { "epoch": 0.43, "learning_rate": 3.2137335588672214e-06, "loss": 0.8532, "step": 22559 }, { "epoch": 0.43, "learning_rate": 3.2135871500002357e-06, "loss": 0.8768, "step": 22560 }, { "epoch": 0.43, "learning_rate": 3.213440738468738e-06, "loss": 0.8386, "step": 22561 }, { "epoch": 0.43, "learning_rate": 3.213294324273274e-06, "loss": 1.1184, "step": 22562 }, { "epoch": 0.43, "learning_rate": 3.213147907414391e-06, "loss": 0.934, "step": 22563 }, { "epoch": 0.43, "learning_rate": 3.2130014878926363e-06, "loss": 0.7095, "step": 22564 }, { "epoch": 0.43, "learning_rate": 3.2128550657085555e-06, "loss": 0.9214, "step": 22565 }, { "epoch": 0.43, "learning_rate": 3.212708640862696e-06, "loss": 0.805, "step": 22566 }, { "epoch": 0.43, "learning_rate": 3.212562213355604e-06, "loss": 0.8166, "step": 22567 }, { "epoch": 0.43, "learning_rate": 3.2124157831878263e-06, "loss": 1.1558, "step": 22568 }, { "epoch": 0.43, "learning_rate": 3.21226935035991e-06, "loss": 1.018, "step": 22569 }, { "epoch": 0.43, "learning_rate": 3.2121229148724016e-06, "loss": 0.9814, "step": 22570 }, { "epoch": 0.43, "learning_rate": 3.211976476725848e-06, "loss": 1.0807, "step": 22571 }, { "epoch": 0.43, "learning_rate": 3.2118300359207965e-06, "loss": 0.9861, "step": 22572 }, { "epoch": 0.43, "learning_rate": 3.2116835924577937e-06, "loss": 1.0689, "step": 22573 }, { "epoch": 0.43, "learning_rate": 3.211537146337386e-06, "loss": 1.0578, "step": 22574 }, { "epoch": 0.43, "learning_rate": 3.2113906975601195e-06, "loss": 1.1671, "step": 22575 }, { "epoch": 0.43, "learning_rate": 3.2112442461265425e-06, "loss": 0.9595, "step": 22576 }, { "epoch": 0.43, "learning_rate": 3.2110977920372018e-06, "loss": 1.009, "step": 22577 }, { "epoch": 0.43, "learning_rate": 3.2109513352926435e-06, "loss": 0.9947, "step": 22578 }, { "epoch": 0.43, "learning_rate": 3.2108048758934146e-06, "loss": 0.841, "step": 22579 }, { "epoch": 0.43, "learning_rate": 3.210658413840062e-06, "loss": 0.7776, "step": 22580 }, { "epoch": 0.43, "learning_rate": 3.2105119491331333e-06, "loss": 1.101, "step": 22581 }, { "epoch": 0.43, "learning_rate": 3.2103654817731745e-06, "loss": 0.9041, "step": 22582 }, { "epoch": 0.43, "learning_rate": 3.210219011760732e-06, "loss": 0.7729, "step": 22583 }, { "epoch": 0.43, "learning_rate": 3.210072539096354e-06, "loss": 1.058, "step": 22584 }, { "epoch": 0.43, "learning_rate": 3.2099260637805868e-06, "loss": 0.8382, "step": 22585 }, { "epoch": 0.43, "learning_rate": 3.2097795858139776e-06, "loss": 0.9425, "step": 22586 }, { "epoch": 0.43, "learning_rate": 3.2096331051970735e-06, "loss": 1.0651, "step": 22587 }, { "epoch": 0.43, "learning_rate": 3.2094866219304212e-06, "loss": 1.1318, "step": 22588 }, { "epoch": 0.43, "learning_rate": 3.2093401360145667e-06, "loss": 1.0009, "step": 22589 }, { "epoch": 0.43, "learning_rate": 3.2091936474500583e-06, "loss": 0.9874, "step": 22590 }, { "epoch": 0.43, "learning_rate": 3.2090471562374425e-06, "loss": 0.8637, "step": 22591 }, { "epoch": 0.43, "learning_rate": 3.2089006623772667e-06, "loss": 1.0129, "step": 22592 }, { "epoch": 0.43, "learning_rate": 3.208754165870078e-06, "loss": 1.0751, "step": 22593 }, { "epoch": 0.43, "learning_rate": 3.208607666716422e-06, "loss": 0.9162, "step": 22594 }, { "epoch": 0.43, "learning_rate": 3.2084611649168467e-06, "loss": 0.9579, "step": 22595 }, { "epoch": 0.43, "learning_rate": 3.2083146604718995e-06, "loss": 0.752, "step": 22596 }, { "epoch": 0.43, "learning_rate": 3.2081681533821267e-06, "loss": 1.0345, "step": 22597 }, { "epoch": 0.43, "learning_rate": 3.208021643648076e-06, "loss": 0.8334, "step": 22598 }, { "epoch": 0.43, "learning_rate": 3.207875131270295e-06, "loss": 0.7938, "step": 22599 }, { "epoch": 0.43, "learning_rate": 3.2077286162493295e-06, "loss": 1.062, "step": 22600 }, { "epoch": 0.43, "learning_rate": 3.2075820985857263e-06, "loss": 0.8132, "step": 22601 }, { "epoch": 0.43, "learning_rate": 3.207435578280034e-06, "loss": 0.9178, "step": 22602 }, { "epoch": 0.43, "learning_rate": 3.2072890553327984e-06, "loss": 0.932, "step": 22603 }, { "epoch": 0.43, "learning_rate": 3.2071425297445667e-06, "loss": 0.927, "step": 22604 }, { "epoch": 0.43, "learning_rate": 3.206996001515888e-06, "loss": 0.8668, "step": 22605 }, { "epoch": 0.43, "learning_rate": 3.206849470647307e-06, "loss": 0.7955, "step": 22606 }, { "epoch": 0.43, "learning_rate": 3.2067029371393713e-06, "loss": 0.7594, "step": 22607 }, { "epoch": 0.43, "learning_rate": 3.2065564009926296e-06, "loss": 0.8142, "step": 22608 }, { "epoch": 0.43, "learning_rate": 3.206409862207627e-06, "loss": 0.799, "step": 22609 }, { "epoch": 0.43, "learning_rate": 3.2062633207849124e-06, "loss": 0.8853, "step": 22610 }, { "epoch": 0.43, "learning_rate": 3.206116776725032e-06, "loss": 0.8252, "step": 22611 }, { "epoch": 0.43, "learning_rate": 3.205970230028533e-06, "loss": 0.8595, "step": 22612 }, { "epoch": 0.43, "learning_rate": 3.2058236806959623e-06, "loss": 1.0587, "step": 22613 }, { "epoch": 0.43, "learning_rate": 3.2056771287278687e-06, "loss": 1.0192, "step": 22614 }, { "epoch": 0.43, "learning_rate": 3.205530574124798e-06, "loss": 0.8001, "step": 22615 }, { "epoch": 0.43, "learning_rate": 3.2053840168872974e-06, "loss": 0.8931, "step": 22616 }, { "epoch": 0.43, "learning_rate": 3.2052374570159145e-06, "loss": 0.7877, "step": 22617 }, { "epoch": 0.43, "learning_rate": 3.205090894511197e-06, "loss": 0.7885, "step": 22618 }, { "epoch": 0.43, "learning_rate": 3.204944329373691e-06, "loss": 1.0295, "step": 22619 }, { "epoch": 0.43, "learning_rate": 3.2047977616039455e-06, "loss": 1.0219, "step": 22620 }, { "epoch": 0.43, "learning_rate": 3.2046511912025058e-06, "loss": 0.9915, "step": 22621 }, { "epoch": 0.43, "learning_rate": 3.2045046181699207e-06, "loss": 0.7409, "step": 22622 }, { "epoch": 0.43, "learning_rate": 3.2043580425067373e-06, "loss": 0.6697, "step": 22623 }, { "epoch": 0.43, "learning_rate": 3.204211464213502e-06, "loss": 1.0278, "step": 22624 }, { "epoch": 0.43, "learning_rate": 3.2040648832907624e-06, "loss": 1.0227, "step": 22625 }, { "epoch": 0.43, "learning_rate": 3.2039182997390667e-06, "loss": 1.1056, "step": 22626 }, { "epoch": 0.43, "learning_rate": 3.203771713558961e-06, "loss": 0.8678, "step": 22627 }, { "epoch": 0.43, "learning_rate": 3.203625124750994e-06, "loss": 0.9541, "step": 22628 }, { "epoch": 0.43, "learning_rate": 3.2034785333157128e-06, "loss": 0.7719, "step": 22629 }, { "epoch": 0.43, "learning_rate": 3.2033319392536633e-06, "loss": 1.041, "step": 22630 }, { "epoch": 0.43, "learning_rate": 3.203185342565394e-06, "loss": 1.1113, "step": 22631 }, { "epoch": 0.43, "learning_rate": 3.2030387432514524e-06, "loss": 1.0258, "step": 22632 }, { "epoch": 0.43, "learning_rate": 3.202892141312386e-06, "loss": 0.9213, "step": 22633 }, { "epoch": 0.43, "learning_rate": 3.2027455367487414e-06, "loss": 0.9111, "step": 22634 }, { "epoch": 0.43, "learning_rate": 3.2025989295610673e-06, "loss": 0.9847, "step": 22635 }, { "epoch": 0.43, "learning_rate": 3.20245231974991e-06, "loss": 0.8631, "step": 22636 }, { "epoch": 0.43, "learning_rate": 3.2023057073158165e-06, "loss": 0.9971, "step": 22637 }, { "epoch": 0.43, "learning_rate": 3.2021590922593355e-06, "loss": 1.0859, "step": 22638 }, { "epoch": 0.43, "learning_rate": 3.202012474581014e-06, "loss": 0.7858, "step": 22639 }, { "epoch": 0.43, "learning_rate": 3.2018658542814e-06, "loss": 0.9598, "step": 22640 }, { "epoch": 0.43, "learning_rate": 3.2017192313610395e-06, "loss": 0.9219, "step": 22641 }, { "epoch": 0.43, "learning_rate": 3.201572605820481e-06, "loss": 0.7779, "step": 22642 }, { "epoch": 0.43, "learning_rate": 3.2014259776602724e-06, "loss": 1.0294, "step": 22643 }, { "epoch": 0.43, "learning_rate": 3.2012793468809613e-06, "loss": 1.0735, "step": 22644 }, { "epoch": 0.43, "learning_rate": 3.201132713483093e-06, "loss": 0.6627, "step": 22645 }, { "epoch": 0.43, "learning_rate": 3.2009860774672176e-06, "loss": 0.9318, "step": 22646 }, { "epoch": 0.43, "learning_rate": 3.2008394388338815e-06, "loss": 0.8461, "step": 22647 }, { "epoch": 0.43, "learning_rate": 3.2006927975836325e-06, "loss": 0.7968, "step": 22648 }, { "epoch": 0.43, "learning_rate": 3.2005461537170178e-06, "loss": 1.2103, "step": 22649 }, { "epoch": 0.43, "learning_rate": 3.200399507234586e-06, "loss": 1.2471, "step": 22650 }, { "epoch": 0.43, "learning_rate": 3.2002528581368835e-06, "loss": 1.0465, "step": 22651 }, { "epoch": 0.43, "learning_rate": 3.2001062064244583e-06, "loss": 0.931, "step": 22652 }, { "epoch": 0.43, "learning_rate": 3.199959552097858e-06, "loss": 0.864, "step": 22653 }, { "epoch": 0.43, "learning_rate": 3.1998128951576296e-06, "loss": 0.7537, "step": 22654 }, { "epoch": 0.43, "learning_rate": 3.1996662356043216e-06, "loss": 1.112, "step": 22655 }, { "epoch": 0.43, "learning_rate": 3.199519573438482e-06, "loss": 1.2816, "step": 22656 }, { "epoch": 0.43, "learning_rate": 3.199372908660657e-06, "loss": 0.9891, "step": 22657 }, { "epoch": 0.43, "learning_rate": 3.1992262412713957e-06, "loss": 0.9138, "step": 22658 }, { "epoch": 0.43, "learning_rate": 3.1990795712712446e-06, "loss": 0.8772, "step": 22659 }, { "epoch": 0.43, "learning_rate": 3.1989328986607514e-06, "loss": 0.9451, "step": 22660 }, { "epoch": 0.43, "learning_rate": 3.198786223440465e-06, "loss": 0.9653, "step": 22661 }, { "epoch": 0.43, "learning_rate": 3.198639545610932e-06, "loss": 1.1375, "step": 22662 }, { "epoch": 0.43, "learning_rate": 3.1984928651727005e-06, "loss": 1.0366, "step": 22663 }, { "epoch": 0.43, "learning_rate": 3.198346182126317e-06, "loss": 0.7406, "step": 22664 }, { "epoch": 0.43, "learning_rate": 3.1981994964723323e-06, "loss": 0.9834, "step": 22665 }, { "epoch": 0.43, "learning_rate": 3.1980528082112905e-06, "loss": 0.8712, "step": 22666 }, { "epoch": 0.43, "learning_rate": 3.1979061173437408e-06, "loss": 0.8928, "step": 22667 }, { "epoch": 0.43, "learning_rate": 3.197759423870232e-06, "loss": 1.1222, "step": 22668 }, { "epoch": 0.43, "learning_rate": 3.1976127277913107e-06, "loss": 1.2775, "step": 22669 }, { "epoch": 0.43, "learning_rate": 3.1974660291075243e-06, "loss": 0.7405, "step": 22670 }, { "epoch": 0.43, "learning_rate": 3.197319327819422e-06, "loss": 0.9227, "step": 22671 }, { "epoch": 0.43, "learning_rate": 3.19717262392755e-06, "loss": 0.9843, "step": 22672 }, { "epoch": 0.43, "learning_rate": 3.197025917432457e-06, "loss": 0.7098, "step": 22673 }, { "epoch": 0.43, "learning_rate": 3.1968792083346905e-06, "loss": 0.8235, "step": 22674 }, { "epoch": 0.43, "learning_rate": 3.1967324966347986e-06, "loss": 1.0716, "step": 22675 }, { "epoch": 0.43, "learning_rate": 3.1965857823333285e-06, "loss": 0.8769, "step": 22676 }, { "epoch": 0.43, "learning_rate": 3.196439065430829e-06, "loss": 0.9076, "step": 22677 }, { "epoch": 0.43, "learning_rate": 3.1962923459278474e-06, "loss": 0.7401, "step": 22678 }, { "epoch": 0.43, "learning_rate": 3.196145623824931e-06, "loss": 0.7275, "step": 22679 }, { "epoch": 0.43, "learning_rate": 3.1959988991226282e-06, "loss": 0.9296, "step": 22680 }, { "epoch": 0.43, "learning_rate": 3.195852171821487e-06, "loss": 0.9483, "step": 22681 }, { "epoch": 0.43, "learning_rate": 3.195705441922056e-06, "loss": 1.1079, "step": 22682 }, { "epoch": 0.43, "learning_rate": 3.1955587094248806e-06, "loss": 0.9997, "step": 22683 }, { "epoch": 0.43, "learning_rate": 3.1954119743305114e-06, "loss": 1.039, "step": 22684 }, { "epoch": 0.43, "learning_rate": 3.1952652366394953e-06, "loss": 0.785, "step": 22685 }, { "epoch": 0.43, "learning_rate": 3.1951184963523796e-06, "loss": 1.0665, "step": 22686 }, { "epoch": 0.43, "learning_rate": 3.1949717534697126e-06, "loss": 0.9794, "step": 22687 }, { "epoch": 0.43, "learning_rate": 3.194825007992043e-06, "loss": 0.9833, "step": 22688 }, { "epoch": 0.43, "learning_rate": 3.1946782599199177e-06, "loss": 0.9795, "step": 22689 }, { "epoch": 0.43, "learning_rate": 3.1945315092538853e-06, "loss": 0.8438, "step": 22690 }, { "epoch": 0.43, "learning_rate": 3.1943847559944935e-06, "loss": 0.8304, "step": 22691 }, { "epoch": 0.43, "learning_rate": 3.19423800014229e-06, "loss": 0.8421, "step": 22692 }, { "epoch": 0.43, "learning_rate": 3.194091241697824e-06, "loss": 1.1942, "step": 22693 }, { "epoch": 0.43, "learning_rate": 3.1939444806616416e-06, "loss": 0.9373, "step": 22694 }, { "epoch": 0.43, "learning_rate": 3.1937977170342916e-06, "loss": 0.7885, "step": 22695 }, { "epoch": 0.43, "learning_rate": 3.1936509508163227e-06, "loss": 0.9698, "step": 22696 }, { "epoch": 0.43, "learning_rate": 3.193504182008283e-06, "loss": 0.9716, "step": 22697 }, { "epoch": 0.43, "learning_rate": 3.193357410610719e-06, "loss": 0.9464, "step": 22698 }, { "epoch": 0.43, "learning_rate": 3.19321063662418e-06, "loss": 0.9099, "step": 22699 }, { "epoch": 0.43, "learning_rate": 3.193063860049214e-06, "loss": 1.1813, "step": 22700 }, { "epoch": 0.43, "learning_rate": 3.1929170808863684e-06, "loss": 1.0997, "step": 22701 }, { "epoch": 0.43, "learning_rate": 3.192770299136192e-06, "loss": 0.9812, "step": 22702 }, { "epoch": 0.43, "learning_rate": 3.1926235147992324e-06, "loss": 0.7984, "step": 22703 }, { "epoch": 0.43, "learning_rate": 3.192476727876038e-06, "loss": 0.7911, "step": 22704 }, { "epoch": 0.43, "learning_rate": 3.1923299383671565e-06, "loss": 0.8321, "step": 22705 }, { "epoch": 0.43, "learning_rate": 3.1921831462731365e-06, "loss": 1.201, "step": 22706 }, { "epoch": 0.43, "learning_rate": 3.1920363515945256e-06, "loss": 0.8748, "step": 22707 }, { "epoch": 0.43, "learning_rate": 3.1918895543318716e-06, "loss": 0.7983, "step": 22708 }, { "epoch": 0.43, "learning_rate": 3.1917427544857244e-06, "loss": 0.8967, "step": 22709 }, { "epoch": 0.43, "learning_rate": 3.1915959520566303e-06, "loss": 0.8397, "step": 22710 }, { "epoch": 0.43, "learning_rate": 3.191449147045138e-06, "loss": 1.0178, "step": 22711 }, { "epoch": 0.43, "learning_rate": 3.1913023394517967e-06, "loss": 1.216, "step": 22712 }, { "epoch": 0.43, "learning_rate": 3.191155529277153e-06, "loss": 0.8544, "step": 22713 }, { "epoch": 0.43, "learning_rate": 3.1910087165217552e-06, "loss": 1.0547, "step": 22714 }, { "epoch": 0.43, "learning_rate": 3.190861901186153e-06, "loss": 0.942, "step": 22715 }, { "epoch": 0.43, "learning_rate": 3.1907150832708925e-06, "loss": 0.837, "step": 22716 }, { "epoch": 0.43, "learning_rate": 3.190568262776524e-06, "loss": 0.8665, "step": 22717 }, { "epoch": 0.43, "learning_rate": 3.190421439703595e-06, "loss": 1.0131, "step": 22718 }, { "epoch": 0.43, "learning_rate": 3.190274614052653e-06, "loss": 1.0198, "step": 22719 }, { "epoch": 0.43, "learning_rate": 3.190127785824246e-06, "loss": 0.9771, "step": 22720 }, { "epoch": 0.43, "learning_rate": 3.1899809550189244e-06, "loss": 0.9249, "step": 22721 }, { "epoch": 0.43, "learning_rate": 3.1898341216372343e-06, "loss": 1.063, "step": 22722 }, { "epoch": 0.43, "learning_rate": 3.189687285679725e-06, "loss": 0.8811, "step": 22723 }, { "epoch": 0.43, "learning_rate": 3.189540447146945e-06, "loss": 0.995, "step": 22724 }, { "epoch": 0.43, "learning_rate": 3.1893936060394415e-06, "loss": 1.0489, "step": 22725 }, { "epoch": 0.43, "learning_rate": 3.1892467623577633e-06, "loss": 1.0618, "step": 22726 }, { "epoch": 0.43, "learning_rate": 3.1890999161024594e-06, "loss": 0.835, "step": 22727 }, { "epoch": 0.43, "learning_rate": 3.188953067274077e-06, "loss": 0.8661, "step": 22728 }, { "epoch": 0.43, "learning_rate": 3.188806215873165e-06, "loss": 0.9352, "step": 22729 }, { "epoch": 0.43, "learning_rate": 3.1886593619002714e-06, "loss": 1.1448, "step": 22730 }, { "epoch": 0.43, "learning_rate": 3.1885125053559457e-06, "loss": 0.9165, "step": 22731 }, { "epoch": 0.43, "learning_rate": 3.1883656462407347e-06, "loss": 0.7809, "step": 22732 }, { "epoch": 0.43, "learning_rate": 3.1882187845551884e-06, "loss": 0.915, "step": 22733 }, { "epoch": 0.43, "learning_rate": 3.1880719202998533e-06, "loss": 0.8285, "step": 22734 }, { "epoch": 0.43, "learning_rate": 3.1879250534752792e-06, "loss": 0.8217, "step": 22735 }, { "epoch": 0.43, "learning_rate": 3.187778184082014e-06, "loss": 0.9981, "step": 22736 }, { "epoch": 0.43, "learning_rate": 3.187631312120606e-06, "loss": 1.154, "step": 22737 }, { "epoch": 0.43, "learning_rate": 3.1874844375916036e-06, "loss": 1.1476, "step": 22738 }, { "epoch": 0.43, "learning_rate": 3.187337560495556e-06, "loss": 0.7249, "step": 22739 }, { "epoch": 0.43, "learning_rate": 3.1871906808330106e-06, "loss": 0.8861, "step": 22740 }, { "epoch": 0.43, "learning_rate": 3.187043798604516e-06, "loss": 0.7624, "step": 22741 }, { "epoch": 0.43, "learning_rate": 3.1868969138106208e-06, "loss": 1.0444, "step": 22742 }, { "epoch": 0.43, "learning_rate": 3.186750026451874e-06, "loss": 0.8894, "step": 22743 }, { "epoch": 0.43, "learning_rate": 3.1866031365288243e-06, "loss": 1.0923, "step": 22744 }, { "epoch": 0.43, "learning_rate": 3.1864562440420188e-06, "loss": 0.8497, "step": 22745 }, { "epoch": 0.43, "learning_rate": 3.186309348992007e-06, "loss": 0.8844, "step": 22746 }, { "epoch": 0.43, "learning_rate": 3.1861624513793364e-06, "loss": 0.7525, "step": 22747 }, { "epoch": 0.43, "learning_rate": 3.1860155512045574e-06, "loss": 0.9645, "step": 22748 }, { "epoch": 0.43, "learning_rate": 3.185868648468217e-06, "loss": 0.8455, "step": 22749 }, { "epoch": 0.43, "learning_rate": 3.185721743170863e-06, "loss": 1.0624, "step": 22750 }, { "epoch": 0.43, "learning_rate": 3.1855748353130468e-06, "loss": 0.8783, "step": 22751 }, { "epoch": 0.43, "learning_rate": 3.185427924895314e-06, "loss": 0.7795, "step": 22752 }, { "epoch": 0.43, "learning_rate": 3.1852810119182143e-06, "loss": 0.8557, "step": 22753 }, { "epoch": 0.43, "learning_rate": 3.1851340963822975e-06, "loss": 0.7767, "step": 22754 }, { "epoch": 0.43, "learning_rate": 3.1849871782881105e-06, "loss": 1.1152, "step": 22755 }, { "epoch": 0.43, "learning_rate": 3.1848402576362016e-06, "loss": 1.0345, "step": 22756 }, { "epoch": 0.43, "learning_rate": 3.18469333442712e-06, "loss": 0.8923, "step": 22757 }, { "epoch": 0.43, "learning_rate": 3.1845464086614154e-06, "loss": 0.9195, "step": 22758 }, { "epoch": 0.43, "learning_rate": 3.184399480339635e-06, "loss": 0.7123, "step": 22759 }, { "epoch": 0.43, "learning_rate": 3.1842525494623287e-06, "loss": 0.7124, "step": 22760 }, { "epoch": 0.43, "learning_rate": 3.1841056160300436e-06, "loss": 1.0695, "step": 22761 }, { "epoch": 0.43, "learning_rate": 3.183958680043329e-06, "loss": 0.8117, "step": 22762 }, { "epoch": 0.43, "learning_rate": 3.183811741502734e-06, "loss": 0.9088, "step": 22763 }, { "epoch": 0.43, "learning_rate": 3.183664800408807e-06, "loss": 0.8952, "step": 22764 }, { "epoch": 0.43, "learning_rate": 3.183517856762096e-06, "loss": 0.8737, "step": 22765 }, { "epoch": 0.43, "learning_rate": 3.1833709105631516e-06, "loss": 0.8, "step": 22766 }, { "epoch": 0.43, "learning_rate": 3.18322396181252e-06, "loss": 1.0818, "step": 22767 }, { "epoch": 0.43, "learning_rate": 3.183077010510751e-06, "loss": 1.0649, "step": 22768 }, { "epoch": 0.43, "learning_rate": 3.1829300566583943e-06, "loss": 0.9822, "step": 22769 }, { "epoch": 0.43, "learning_rate": 3.1827831002559974e-06, "loss": 0.9322, "step": 22770 }, { "epoch": 0.43, "learning_rate": 3.1826361413041085e-06, "loss": 0.9258, "step": 22771 }, { "epoch": 0.43, "learning_rate": 3.182489179803278e-06, "loss": 0.8034, "step": 22772 }, { "epoch": 0.43, "learning_rate": 3.182342215754054e-06, "loss": 0.7679, "step": 22773 }, { "epoch": 0.43, "learning_rate": 3.1821952491569842e-06, "loss": 0.9718, "step": 22774 }, { "epoch": 0.43, "learning_rate": 3.1820482800126195e-06, "loss": 1.1086, "step": 22775 }, { "epoch": 0.43, "learning_rate": 3.1819013083215067e-06, "loss": 0.9268, "step": 22776 }, { "epoch": 0.43, "learning_rate": 3.181754334084195e-06, "loss": 0.9252, "step": 22777 }, { "epoch": 0.43, "learning_rate": 3.181607357301234e-06, "loss": 0.7251, "step": 22778 }, { "epoch": 0.43, "learning_rate": 3.181460377973171e-06, "loss": 0.8312, "step": 22779 }, { "epoch": 0.43, "learning_rate": 3.181313396100557e-06, "loss": 0.9717, "step": 22780 }, { "epoch": 0.43, "learning_rate": 3.18116641168394e-06, "loss": 1.222, "step": 22781 }, { "epoch": 0.43, "learning_rate": 3.181019424723868e-06, "loss": 1.2285, "step": 22782 }, { "epoch": 0.43, "learning_rate": 3.1808724352208896e-06, "loss": 0.8553, "step": 22783 }, { "epoch": 0.43, "learning_rate": 3.180725443175555e-06, "loss": 0.8746, "step": 22784 }, { "epoch": 0.43, "learning_rate": 3.180578448588413e-06, "loss": 0.8983, "step": 22785 }, { "epoch": 0.43, "learning_rate": 3.180431451460011e-06, "loss": 1.0051, "step": 22786 }, { "epoch": 0.43, "learning_rate": 3.1802844517909e-06, "loss": 0.9231, "step": 22787 }, { "epoch": 0.43, "learning_rate": 3.1801374495816267e-06, "loss": 0.9408, "step": 22788 }, { "epoch": 0.43, "learning_rate": 3.179990444832741e-06, "loss": 0.7786, "step": 22789 }, { "epoch": 0.43, "learning_rate": 3.179843437544793e-06, "loss": 0.8828, "step": 22790 }, { "epoch": 0.43, "learning_rate": 3.1796964277183293e-06, "loss": 0.8852, "step": 22791 }, { "epoch": 0.43, "learning_rate": 3.1795494153538997e-06, "loss": 0.9441, "step": 22792 }, { "epoch": 0.43, "learning_rate": 3.179402400452054e-06, "loss": 0.9019, "step": 22793 }, { "epoch": 0.43, "learning_rate": 3.179255383013341e-06, "loss": 0.9488, "step": 22794 }, { "epoch": 0.43, "learning_rate": 3.1791083630383085e-06, "loss": 1.0482, "step": 22795 }, { "epoch": 0.43, "learning_rate": 3.1789613405275066e-06, "loss": 1.0181, "step": 22796 }, { "epoch": 0.43, "learning_rate": 3.178814315481484e-06, "loss": 0.8854, "step": 22797 }, { "epoch": 0.43, "learning_rate": 3.1786672879007892e-06, "loss": 0.8269, "step": 22798 }, { "epoch": 0.43, "learning_rate": 3.1785202577859714e-06, "loss": 1.1535, "step": 22799 }, { "epoch": 0.43, "learning_rate": 3.17837322513758e-06, "loss": 1.0899, "step": 22800 }, { "epoch": 0.43, "learning_rate": 3.1782261899561638e-06, "loss": 0.8434, "step": 22801 }, { "epoch": 0.43, "learning_rate": 3.178079152242272e-06, "loss": 0.9161, "step": 22802 }, { "epoch": 0.43, "learning_rate": 3.1779321119964536e-06, "loss": 0.9637, "step": 22803 }, { "epoch": 0.43, "learning_rate": 3.177785069219257e-06, "loss": 0.9521, "step": 22804 }, { "epoch": 0.43, "learning_rate": 3.1776380239112315e-06, "loss": 1.0566, "step": 22805 }, { "epoch": 0.43, "learning_rate": 3.1774909760729265e-06, "loss": 1.248, "step": 22806 }, { "epoch": 0.43, "learning_rate": 3.1773439257048915e-06, "loss": 0.864, "step": 22807 }, { "epoch": 0.43, "learning_rate": 3.1771968728076746e-06, "loss": 0.7257, "step": 22808 }, { "epoch": 0.43, "learning_rate": 3.1770498173818255e-06, "loss": 0.9608, "step": 22809 }, { "epoch": 0.43, "learning_rate": 3.1769027594278935e-06, "loss": 0.9796, "step": 22810 }, { "epoch": 0.43, "learning_rate": 3.176755698946427e-06, "loss": 1.085, "step": 22811 }, { "epoch": 0.43, "learning_rate": 3.1766086359379754e-06, "loss": 1.0356, "step": 22812 }, { "epoch": 0.43, "learning_rate": 3.176461570403088e-06, "loss": 0.9863, "step": 22813 }, { "epoch": 0.43, "learning_rate": 3.176314502342314e-06, "loss": 0.8134, "step": 22814 }, { "epoch": 0.43, "learning_rate": 3.176167431756202e-06, "loss": 0.8163, "step": 22815 }, { "epoch": 0.43, "learning_rate": 3.176020358645302e-06, "loss": 0.8905, "step": 22816 }, { "epoch": 0.43, "learning_rate": 3.1758732830101624e-06, "loss": 0.8856, "step": 22817 }, { "epoch": 0.43, "learning_rate": 3.1757262048513326e-06, "loss": 1.0081, "step": 22818 }, { "epoch": 0.43, "learning_rate": 3.175579124169362e-06, "loss": 0.9495, "step": 22819 }, { "epoch": 0.43, "learning_rate": 3.175432040964799e-06, "loss": 0.9896, "step": 22820 }, { "epoch": 0.43, "learning_rate": 3.175284955238194e-06, "loss": 0.8479, "step": 22821 }, { "epoch": 0.43, "learning_rate": 3.1751378669900966e-06, "loss": 0.9607, "step": 22822 }, { "epoch": 0.43, "learning_rate": 3.174990776221054e-06, "loss": 0.9521, "step": 22823 }, { "epoch": 0.43, "learning_rate": 3.1748436829316163e-06, "loss": 1.0361, "step": 22824 }, { "epoch": 0.43, "learning_rate": 3.1746965871223347e-06, "loss": 0.9549, "step": 22825 }, { "epoch": 0.43, "learning_rate": 3.1745494887937544e-06, "loss": 0.962, "step": 22826 }, { "epoch": 0.43, "learning_rate": 3.174402387946428e-06, "loss": 0.7578, "step": 22827 }, { "epoch": 0.43, "learning_rate": 3.1742552845809048e-06, "loss": 0.9587, "step": 22828 }, { "epoch": 0.43, "learning_rate": 3.174108178697732e-06, "loss": 0.7363, "step": 22829 }, { "epoch": 0.43, "learning_rate": 3.17396107029746e-06, "loss": 0.8748, "step": 22830 }, { "epoch": 0.43, "learning_rate": 3.1738139593806383e-06, "loss": 1.0612, "step": 22831 }, { "epoch": 0.43, "learning_rate": 3.173666845947816e-06, "loss": 1.0864, "step": 22832 }, { "epoch": 0.43, "learning_rate": 3.1735197299995417e-06, "loss": 0.9174, "step": 22833 }, { "epoch": 0.43, "learning_rate": 3.1733726115363657e-06, "loss": 0.8366, "step": 22834 }, { "epoch": 0.43, "learning_rate": 3.1732254905588366e-06, "loss": 0.7581, "step": 22835 }, { "epoch": 0.43, "learning_rate": 3.173078367067505e-06, "loss": 0.9564, "step": 22836 }, { "epoch": 0.43, "learning_rate": 3.172931241062919e-06, "loss": 0.9716, "step": 22837 }, { "epoch": 0.43, "learning_rate": 3.172784112545629e-06, "loss": 0.9883, "step": 22838 }, { "epoch": 0.43, "learning_rate": 3.172636981516183e-06, "loss": 1.0443, "step": 22839 }, { "epoch": 0.43, "learning_rate": 3.172489847975131e-06, "loss": 1.0521, "step": 22840 }, { "epoch": 0.43, "learning_rate": 3.1723427119230225e-06, "loss": 0.9039, "step": 22841 }, { "epoch": 0.43, "learning_rate": 3.1721955733604072e-06, "loss": 0.8514, "step": 22842 }, { "epoch": 0.43, "learning_rate": 3.1720484322878347e-06, "loss": 0.9188, "step": 22843 }, { "epoch": 0.43, "learning_rate": 3.171901288705854e-06, "loss": 0.9005, "step": 22844 }, { "epoch": 0.43, "learning_rate": 3.1717541426150134e-06, "loss": 0.6352, "step": 22845 }, { "epoch": 0.43, "learning_rate": 3.1716069940158645e-06, "loss": 0.7073, "step": 22846 }, { "epoch": 0.43, "learning_rate": 3.1714598429089547e-06, "loss": 0.8619, "step": 22847 }, { "epoch": 0.43, "learning_rate": 3.1713126892948354e-06, "loss": 0.8768, "step": 22848 }, { "epoch": 0.43, "learning_rate": 3.1711655331740547e-06, "loss": 0.9263, "step": 22849 }, { "epoch": 0.43, "learning_rate": 3.1710183745471623e-06, "loss": 1.17, "step": 22850 }, { "epoch": 0.43, "learning_rate": 3.170871213414708e-06, "loss": 0.8403, "step": 22851 }, { "epoch": 0.43, "learning_rate": 3.170724049777242e-06, "loss": 0.8026, "step": 22852 }, { "epoch": 0.43, "learning_rate": 3.170576883635312e-06, "loss": 1.0465, "step": 22853 }, { "epoch": 0.43, "learning_rate": 3.1704297149894685e-06, "loss": 0.7768, "step": 22854 }, { "epoch": 0.43, "learning_rate": 3.1702825438402608e-06, "loss": 0.9693, "step": 22855 }, { "epoch": 0.43, "learning_rate": 3.170135370188239e-06, "loss": 1.1793, "step": 22856 }, { "epoch": 0.43, "learning_rate": 3.1699881940339523e-06, "loss": 1.0065, "step": 22857 }, { "epoch": 0.43, "learning_rate": 3.1698410153779503e-06, "loss": 0.7846, "step": 22858 }, { "epoch": 0.43, "learning_rate": 3.1696938342207823e-06, "loss": 0.9312, "step": 22859 }, { "epoch": 0.43, "learning_rate": 3.1695466505629977e-06, "loss": 0.8637, "step": 22860 }, { "epoch": 0.43, "learning_rate": 3.169399464405147e-06, "loss": 0.8261, "step": 22861 }, { "epoch": 0.43, "learning_rate": 3.1692522757477794e-06, "loss": 1.3002, "step": 22862 }, { "epoch": 0.43, "learning_rate": 3.169105084591444e-06, "loss": 0.9478, "step": 22863 }, { "epoch": 0.43, "learning_rate": 3.168957890936691e-06, "loss": 1.0866, "step": 22864 }, { "epoch": 0.43, "learning_rate": 3.1688106947840693e-06, "loss": 0.8735, "step": 22865 }, { "epoch": 0.43, "learning_rate": 3.168663496134129e-06, "loss": 0.8771, "step": 22866 }, { "epoch": 0.43, "learning_rate": 3.1685162949874205e-06, "loss": 0.7792, "step": 22867 }, { "epoch": 0.43, "learning_rate": 3.168369091344491e-06, "loss": 1.0659, "step": 22868 }, { "epoch": 0.43, "learning_rate": 3.1682218852058926e-06, "loss": 1.0932, "step": 22869 }, { "epoch": 0.43, "learning_rate": 3.168074676572175e-06, "loss": 0.8104, "step": 22870 }, { "epoch": 0.43, "learning_rate": 3.167927465443886e-06, "loss": 0.8287, "step": 22871 }, { "epoch": 0.43, "learning_rate": 3.167780251821577e-06, "loss": 1.0189, "step": 22872 }, { "epoch": 0.43, "learning_rate": 3.167633035705797e-06, "loss": 1.0024, "step": 22873 }, { "epoch": 0.43, "learning_rate": 3.1674858170970957e-06, "loss": 0.8725, "step": 22874 }, { "epoch": 0.43, "learning_rate": 3.1673385959960223e-06, "loss": 0.9222, "step": 22875 }, { "epoch": 0.43, "learning_rate": 3.167191372403127e-06, "loss": 0.8883, "step": 22876 }, { "epoch": 0.43, "learning_rate": 3.1670441463189598e-06, "loss": 0.9757, "step": 22877 }, { "epoch": 0.43, "learning_rate": 3.1668969177440704e-06, "loss": 1.1509, "step": 22878 }, { "epoch": 0.43, "learning_rate": 3.166749686679009e-06, "loss": 0.8991, "step": 22879 }, { "epoch": 0.43, "learning_rate": 3.1666024531243235e-06, "loss": 0.8906, "step": 22880 }, { "epoch": 0.43, "learning_rate": 3.1664552170805653e-06, "loss": 1.0369, "step": 22881 }, { "epoch": 0.43, "learning_rate": 3.166307978548284e-06, "loss": 1.0103, "step": 22882 }, { "epoch": 0.43, "learning_rate": 3.166160737528029e-06, "loss": 0.9307, "step": 22883 }, { "epoch": 0.43, "learning_rate": 3.16601349402035e-06, "loss": 1.0441, "step": 22884 }, { "epoch": 0.43, "learning_rate": 3.1658662480257972e-06, "loss": 0.8501, "step": 22885 }, { "epoch": 0.43, "learning_rate": 3.1657189995449205e-06, "loss": 0.7048, "step": 22886 }, { "epoch": 0.43, "learning_rate": 3.165571748578269e-06, "loss": 1.1841, "step": 22887 }, { "epoch": 0.43, "learning_rate": 3.1654244951263937e-06, "loss": 0.8672, "step": 22888 }, { "epoch": 0.43, "learning_rate": 3.1652772391898427e-06, "loss": 0.9073, "step": 22889 }, { "epoch": 0.43, "learning_rate": 3.1651299807691672e-06, "loss": 0.9077, "step": 22890 }, { "epoch": 0.43, "learning_rate": 3.1649827198649175e-06, "loss": 0.9547, "step": 22891 }, { "epoch": 0.43, "learning_rate": 3.1648354564776423e-06, "loss": 1.0512, "step": 22892 }, { "epoch": 0.43, "learning_rate": 3.164688190607892e-06, "loss": 1.0084, "step": 22893 }, { "epoch": 0.43, "learning_rate": 3.1645409222562164e-06, "loss": 1.0348, "step": 22894 }, { "epoch": 0.43, "learning_rate": 3.164393651423165e-06, "loss": 0.9621, "step": 22895 }, { "epoch": 0.43, "learning_rate": 3.164246378109288e-06, "loss": 1.033, "step": 22896 }, { "epoch": 0.43, "learning_rate": 3.164099102315136e-06, "loss": 0.8478, "step": 22897 }, { "epoch": 0.43, "learning_rate": 3.1639518240412576e-06, "loss": 0.8695, "step": 22898 }, { "epoch": 0.43, "learning_rate": 3.1638045432882036e-06, "loss": 0.8451, "step": 22899 }, { "epoch": 0.43, "learning_rate": 3.163657260056524e-06, "loss": 1.1266, "step": 22900 }, { "epoch": 0.43, "learning_rate": 3.163509974346769e-06, "loss": 0.9575, "step": 22901 }, { "epoch": 0.43, "learning_rate": 3.163362686159487e-06, "loss": 0.9517, "step": 22902 }, { "epoch": 0.43, "learning_rate": 3.1632153954952298e-06, "loss": 0.8204, "step": 22903 }, { "epoch": 0.43, "learning_rate": 3.1630681023545464e-06, "loss": 0.7593, "step": 22904 }, { "epoch": 0.43, "learning_rate": 3.162920806737987e-06, "loss": 1.048, "step": 22905 }, { "epoch": 0.43, "learning_rate": 3.162773508646102e-06, "loss": 0.9343, "step": 22906 }, { "epoch": 0.43, "learning_rate": 3.1626262080794413e-06, "loss": 0.8592, "step": 22907 }, { "epoch": 0.43, "learning_rate": 3.1624789050385542e-06, "loss": 0.8159, "step": 22908 }, { "epoch": 0.43, "learning_rate": 3.1623315995239913e-06, "loss": 1.1245, "step": 22909 }, { "epoch": 0.43, "learning_rate": 3.1621842915363017e-06, "loss": 0.7031, "step": 22910 }, { "epoch": 0.43, "learning_rate": 3.1620369810760366e-06, "loss": 0.8653, "step": 22911 }, { "epoch": 0.43, "learning_rate": 3.1618896681437465e-06, "loss": 1.1918, "step": 22912 }, { "epoch": 0.43, "learning_rate": 3.1617423527399803e-06, "loss": 1.1362, "step": 22913 }, { "epoch": 0.43, "learning_rate": 3.161595034865288e-06, "loss": 1.0533, "step": 22914 }, { "epoch": 0.43, "learning_rate": 3.161447714520221e-06, "loss": 1.0154, "step": 22915 }, { "epoch": 0.43, "learning_rate": 3.161300391705328e-06, "loss": 1.0765, "step": 22916 }, { "epoch": 0.43, "learning_rate": 3.1611530664211597e-06, "loss": 0.9127, "step": 22917 }, { "epoch": 0.43, "learning_rate": 3.161005738668266e-06, "loss": 1.0101, "step": 22918 }, { "epoch": 0.43, "learning_rate": 3.160858408447197e-06, "loss": 0.9808, "step": 22919 }, { "epoch": 0.43, "learning_rate": 3.1607110757585037e-06, "loss": 0.889, "step": 22920 }, { "epoch": 0.43, "learning_rate": 3.1605637406027347e-06, "loss": 0.8528, "step": 22921 }, { "epoch": 0.43, "learning_rate": 3.160416402980441e-06, "loss": 0.9269, "step": 22922 }, { "epoch": 0.43, "learning_rate": 3.160269062892173e-06, "loss": 0.8534, "step": 22923 }, { "epoch": 0.43, "learning_rate": 3.1601217203384803e-06, "loss": 1.0798, "step": 22924 }, { "epoch": 0.43, "learning_rate": 3.159974375319913e-06, "loss": 1.1385, "step": 22925 }, { "epoch": 0.43, "learning_rate": 3.159827027837023e-06, "loss": 0.8463, "step": 22926 }, { "epoch": 0.43, "learning_rate": 3.159679677890358e-06, "loss": 0.8744, "step": 22927 }, { "epoch": 0.43, "learning_rate": 3.1595323254804695e-06, "loss": 0.8232, "step": 22928 }, { "epoch": 0.43, "learning_rate": 3.1593849706079076e-06, "loss": 0.9186, "step": 22929 }, { "epoch": 0.43, "learning_rate": 3.159237613273223e-06, "loss": 0.9788, "step": 22930 }, { "epoch": 0.43, "learning_rate": 3.1590902534769635e-06, "loss": 1.0424, "step": 22931 }, { "epoch": 0.43, "learning_rate": 3.158942891219683e-06, "loss": 0.7312, "step": 22932 }, { "epoch": 0.43, "learning_rate": 3.1587955265019295e-06, "loss": 0.8498, "step": 22933 }, { "epoch": 0.43, "learning_rate": 3.1586481593242536e-06, "loss": 0.7384, "step": 22934 }, { "epoch": 0.43, "learning_rate": 3.158500789687206e-06, "loss": 0.8512, "step": 22935 }, { "epoch": 0.43, "learning_rate": 3.158353417591336e-06, "loss": 0.8308, "step": 22936 }, { "epoch": 0.43, "learning_rate": 3.1582060430371946e-06, "loss": 1.1526, "step": 22937 }, { "epoch": 0.43, "learning_rate": 3.158058666025332e-06, "loss": 1.0325, "step": 22938 }, { "epoch": 0.43, "learning_rate": 3.157911286556299e-06, "loss": 1.0031, "step": 22939 }, { "epoch": 0.43, "learning_rate": 3.1577639046306453e-06, "loss": 0.8275, "step": 22940 }, { "epoch": 0.43, "learning_rate": 3.1576165202489217e-06, "loss": 0.779, "step": 22941 }, { "epoch": 0.43, "learning_rate": 3.1574691334116775e-06, "loss": 0.9513, "step": 22942 }, { "epoch": 0.43, "learning_rate": 3.1573217441194638e-06, "loss": 1.4335, "step": 22943 }, { "epoch": 0.43, "learning_rate": 3.157174352372831e-06, "loss": 1.1101, "step": 22944 }, { "epoch": 0.43, "learning_rate": 3.157026958172329e-06, "loss": 0.9764, "step": 22945 }, { "epoch": 0.43, "learning_rate": 3.1568795615185088e-06, "loss": 0.7516, "step": 22946 }, { "epoch": 0.43, "learning_rate": 3.1567321624119208e-06, "loss": 0.9188, "step": 22947 }, { "epoch": 0.43, "learning_rate": 3.156584760853115e-06, "loss": 0.8519, "step": 22948 }, { "epoch": 0.43, "learning_rate": 3.156437356842641e-06, "loss": 1.0268, "step": 22949 }, { "epoch": 0.43, "learning_rate": 3.1562899503810513e-06, "loss": 1.01, "step": 22950 }, { "epoch": 0.43, "learning_rate": 3.156142541468894e-06, "loss": 1.0341, "step": 22951 }, { "epoch": 0.43, "learning_rate": 3.1559951301067205e-06, "loss": 0.9865, "step": 22952 }, { "epoch": 0.43, "learning_rate": 3.155847716295082e-06, "loss": 0.807, "step": 22953 }, { "epoch": 0.43, "learning_rate": 3.1557003000345275e-06, "loss": 0.912, "step": 22954 }, { "epoch": 0.43, "learning_rate": 3.1555528813256088e-06, "loss": 0.9937, "step": 22955 }, { "epoch": 0.43, "learning_rate": 3.155405460168876e-06, "loss": 1.0281, "step": 22956 }, { "epoch": 0.43, "learning_rate": 3.155258036564879e-06, "loss": 0.8742, "step": 22957 }, { "epoch": 0.43, "learning_rate": 3.1551106105141683e-06, "loss": 0.9491, "step": 22958 }, { "epoch": 0.43, "learning_rate": 3.1549631820172942e-06, "loss": 0.9258, "step": 22959 }, { "epoch": 0.43, "learning_rate": 3.1548157510748086e-06, "loss": 0.8257, "step": 22960 }, { "epoch": 0.43, "learning_rate": 3.1546683176872607e-06, "loss": 0.766, "step": 22961 }, { "epoch": 0.43, "learning_rate": 3.1545208818552016e-06, "loss": 1.0168, "step": 22962 }, { "epoch": 0.43, "learning_rate": 3.1543734435791814e-06, "loss": 1.1038, "step": 22963 }, { "epoch": 0.43, "learning_rate": 3.1542260028597506e-06, "loss": 0.8458, "step": 22964 }, { "epoch": 0.43, "learning_rate": 3.15407855969746e-06, "loss": 1.011, "step": 22965 }, { "epoch": 0.43, "learning_rate": 3.1539311140928602e-06, "loss": 0.9996, "step": 22966 }, { "epoch": 0.43, "learning_rate": 3.1537836660465017e-06, "loss": 0.9547, "step": 22967 }, { "epoch": 0.43, "learning_rate": 3.153636215558936e-06, "loss": 1.0798, "step": 22968 }, { "epoch": 0.43, "learning_rate": 3.153488762630711e-06, "loss": 1.0221, "step": 22969 }, { "epoch": 0.43, "learning_rate": 3.15334130726238e-06, "loss": 0.8027, "step": 22970 }, { "epoch": 0.43, "learning_rate": 3.1531938494544926e-06, "loss": 0.7979, "step": 22971 }, { "epoch": 0.43, "learning_rate": 3.153046389207599e-06, "loss": 0.9336, "step": 22972 }, { "epoch": 0.43, "learning_rate": 3.1528989265222496e-06, "loss": 0.7717, "step": 22973 }, { "epoch": 0.43, "learning_rate": 3.1527514613989975e-06, "loss": 0.7049, "step": 22974 }, { "epoch": 0.43, "learning_rate": 3.15260399383839e-06, "loss": 1.2835, "step": 22975 }, { "epoch": 0.43, "learning_rate": 3.1524565238409795e-06, "loss": 1.0865, "step": 22976 }, { "epoch": 0.43, "learning_rate": 3.1523090514073167e-06, "loss": 0.9971, "step": 22977 }, { "epoch": 0.43, "learning_rate": 3.1521615765379515e-06, "loss": 1.0082, "step": 22978 }, { "epoch": 0.43, "learning_rate": 3.152014099233435e-06, "loss": 1.0101, "step": 22979 }, { "epoch": 0.43, "learning_rate": 3.1518666194943182e-06, "loss": 0.6905, "step": 22980 }, { "epoch": 0.43, "learning_rate": 3.151719137321151e-06, "loss": 0.7866, "step": 22981 }, { "epoch": 0.43, "learning_rate": 3.1515716527144847e-06, "loss": 0.9859, "step": 22982 }, { "epoch": 0.43, "learning_rate": 3.15142416567487e-06, "loss": 0.9507, "step": 22983 }, { "epoch": 0.43, "learning_rate": 3.1512766762028567e-06, "loss": 1.0938, "step": 22984 }, { "epoch": 0.43, "learning_rate": 3.1511291842989973e-06, "loss": 0.7372, "step": 22985 }, { "epoch": 0.43, "learning_rate": 3.150981689963841e-06, "loss": 0.8888, "step": 22986 }, { "epoch": 0.43, "learning_rate": 3.1508341931979387e-06, "loss": 0.888, "step": 22987 }, { "epoch": 0.43, "learning_rate": 3.1506866940018414e-06, "loss": 0.9014, "step": 22988 }, { "epoch": 0.43, "learning_rate": 3.150539192376101e-06, "loss": 0.8277, "step": 22989 }, { "epoch": 0.43, "learning_rate": 3.1503916883212663e-06, "loss": 0.9014, "step": 22990 }, { "epoch": 0.43, "learning_rate": 3.1502441818378892e-06, "loss": 0.8152, "step": 22991 }, { "epoch": 0.43, "learning_rate": 3.150096672926521e-06, "loss": 0.9791, "step": 22992 }, { "epoch": 0.43, "learning_rate": 3.149949161587711e-06, "loss": 1.1264, "step": 22993 }, { "epoch": 0.43, "learning_rate": 3.14980164782201e-06, "loss": 1.0468, "step": 22994 }, { "epoch": 0.43, "learning_rate": 3.1496541316299713e-06, "loss": 0.9492, "step": 22995 }, { "epoch": 0.43, "learning_rate": 3.1495066130121425e-06, "loss": 0.8596, "step": 22996 }, { "epoch": 0.43, "learning_rate": 3.1493590919690762e-06, "loss": 1.0767, "step": 22997 }, { "epoch": 0.43, "learning_rate": 3.1492115685013235e-06, "loss": 0.7619, "step": 22998 }, { "epoch": 0.43, "learning_rate": 3.149064042609435e-06, "loss": 0.9007, "step": 22999 }, { "epoch": 0.43, "learning_rate": 3.1489165142939603e-06, "loss": 1.1401, "step": 23000 }, { "epoch": 0.43, "learning_rate": 3.1487689835554512e-06, "loss": 1.1392, "step": 23001 }, { "epoch": 0.43, "learning_rate": 3.148621450394459e-06, "loss": 0.8497, "step": 23002 }, { "epoch": 0.43, "learning_rate": 3.1484739148115347e-06, "loss": 0.8586, "step": 23003 }, { "epoch": 0.43, "learning_rate": 3.1483263768072283e-06, "loss": 0.774, "step": 23004 }, { "epoch": 0.43, "learning_rate": 3.1481788363820907e-06, "loss": 0.8703, "step": 23005 }, { "epoch": 0.43, "learning_rate": 3.1480312935366734e-06, "loss": 0.9728, "step": 23006 }, { "epoch": 0.43, "learning_rate": 3.1478837482715273e-06, "loss": 0.9263, "step": 23007 }, { "epoch": 0.43, "learning_rate": 3.147736200587203e-06, "loss": 0.7794, "step": 23008 }, { "epoch": 0.43, "learning_rate": 3.147588650484252e-06, "loss": 0.7713, "step": 23009 }, { "epoch": 0.43, "learning_rate": 3.1474410979632247e-06, "loss": 1.0174, "step": 23010 }, { "epoch": 0.43, "learning_rate": 3.147293543024672e-06, "loss": 0.8329, "step": 23011 }, { "epoch": 0.43, "learning_rate": 3.147145985669145e-06, "loss": 1.012, "step": 23012 }, { "epoch": 0.43, "learning_rate": 3.1469984258971953e-06, "loss": 1.0702, "step": 23013 }, { "epoch": 0.43, "learning_rate": 3.146850863709372e-06, "loss": 0.8981, "step": 23014 }, { "epoch": 0.43, "learning_rate": 3.1467032991062278e-06, "loss": 0.9561, "step": 23015 }, { "epoch": 0.43, "learning_rate": 3.1465557320883146e-06, "loss": 0.9652, "step": 23016 }, { "epoch": 0.43, "learning_rate": 3.146408162656181e-06, "loss": 0.7525, "step": 23017 }, { "epoch": 0.43, "learning_rate": 3.1462605908103795e-06, "loss": 1.0574, "step": 23018 }, { "epoch": 0.43, "learning_rate": 3.146113016551461e-06, "loss": 0.817, "step": 23019 }, { "epoch": 0.43, "learning_rate": 3.1459654398799755e-06, "loss": 1.0354, "step": 23020 }, { "epoch": 0.43, "learning_rate": 3.1458178607964753e-06, "loss": 0.9207, "step": 23021 }, { "epoch": 0.43, "learning_rate": 3.1456702793015108e-06, "loss": 0.9559, "step": 23022 }, { "epoch": 0.43, "learning_rate": 3.1455226953956335e-06, "loss": 0.8485, "step": 23023 }, { "epoch": 0.43, "learning_rate": 3.1453751090793943e-06, "loss": 0.9947, "step": 23024 }, { "epoch": 0.43, "learning_rate": 3.1452275203533443e-06, "loss": 1.0357, "step": 23025 }, { "epoch": 0.43, "learning_rate": 3.1450799292180344e-06, "loss": 0.7536, "step": 23026 }, { "epoch": 0.43, "learning_rate": 3.1449323356740157e-06, "loss": 0.8983, "step": 23027 }, { "epoch": 0.43, "learning_rate": 3.1447847397218395e-06, "loss": 0.9271, "step": 23028 }, { "epoch": 0.43, "learning_rate": 3.144637141362057e-06, "loss": 0.8451, "step": 23029 }, { "epoch": 0.43, "learning_rate": 3.1444895405952193e-06, "loss": 0.963, "step": 23030 }, { "epoch": 0.43, "learning_rate": 3.144341937421877e-06, "loss": 0.9297, "step": 23031 }, { "epoch": 0.43, "learning_rate": 3.1441943318425816e-06, "loss": 1.0057, "step": 23032 }, { "epoch": 0.43, "learning_rate": 3.144046723857885e-06, "loss": 0.8583, "step": 23033 }, { "epoch": 0.43, "learning_rate": 3.1438991134683374e-06, "loss": 0.839, "step": 23034 }, { "epoch": 0.43, "learning_rate": 3.1437515006744895e-06, "loss": 0.9996, "step": 23035 }, { "epoch": 0.43, "learning_rate": 3.1436038854768947e-06, "loss": 0.8189, "step": 23036 }, { "epoch": 0.43, "learning_rate": 3.1434562678761018e-06, "loss": 0.9225, "step": 23037 }, { "epoch": 0.43, "learning_rate": 3.1433086478726626e-06, "loss": 0.8129, "step": 23038 }, { "epoch": 0.43, "learning_rate": 3.1431610254671296e-06, "loss": 0.8759, "step": 23039 }, { "epoch": 0.43, "learning_rate": 3.1430134006600523e-06, "loss": 0.7477, "step": 23040 }, { "epoch": 0.43, "learning_rate": 3.1428657734519825e-06, "loss": 0.9213, "step": 23041 }, { "epoch": 0.43, "learning_rate": 3.142718143843472e-06, "loss": 0.8351, "step": 23042 }, { "epoch": 0.43, "learning_rate": 3.142570511835071e-06, "loss": 1.134, "step": 23043 }, { "epoch": 0.43, "learning_rate": 3.1424228774273324e-06, "loss": 0.7986, "step": 23044 }, { "epoch": 0.43, "learning_rate": 3.142275240620807e-06, "loss": 0.8552, "step": 23045 }, { "epoch": 0.43, "learning_rate": 3.142127601416044e-06, "loss": 0.8629, "step": 23046 }, { "epoch": 0.43, "learning_rate": 3.1419799598135967e-06, "loss": 0.9711, "step": 23047 }, { "epoch": 0.43, "learning_rate": 3.141832315814016e-06, "loss": 0.9061, "step": 23048 }, { "epoch": 0.43, "learning_rate": 3.1416846694178533e-06, "loss": 0.8886, "step": 23049 }, { "epoch": 0.43, "learning_rate": 3.1415370206256596e-06, "loss": 1.0729, "step": 23050 }, { "epoch": 0.43, "learning_rate": 3.1413893694379867e-06, "loss": 0.9468, "step": 23051 }, { "epoch": 0.43, "learning_rate": 3.141241715855385e-06, "loss": 0.941, "step": 23052 }, { "epoch": 0.43, "learning_rate": 3.1410940598784067e-06, "loss": 0.9407, "step": 23053 }, { "epoch": 0.43, "learning_rate": 3.140946401507603e-06, "loss": 1.0115, "step": 23054 }, { "epoch": 0.43, "learning_rate": 3.140798740743525e-06, "loss": 0.8041, "step": 23055 }, { "epoch": 0.43, "learning_rate": 3.1406510775867225e-06, "loss": 1.1742, "step": 23056 }, { "epoch": 0.44, "learning_rate": 3.140503412037751e-06, "loss": 0.9857, "step": 23057 }, { "epoch": 0.44, "learning_rate": 3.140355744097158e-06, "loss": 0.9517, "step": 23058 }, { "epoch": 0.44, "learning_rate": 3.140208073765497e-06, "loss": 0.8453, "step": 23059 }, { "epoch": 0.44, "learning_rate": 3.140060401043319e-06, "loss": 0.9034, "step": 23060 }, { "epoch": 0.44, "learning_rate": 3.139912725931174e-06, "loss": 0.876, "step": 23061 }, { "epoch": 0.44, "learning_rate": 3.139765048429615e-06, "loss": 1.1293, "step": 23062 }, { "epoch": 0.44, "learning_rate": 3.1396173685391927e-06, "loss": 0.9296, "step": 23063 }, { "epoch": 0.44, "learning_rate": 3.139469686260459e-06, "loss": 1.1137, "step": 23064 }, { "epoch": 0.44, "learning_rate": 3.1393220015939647e-06, "loss": 0.8145, "step": 23065 }, { "epoch": 0.44, "learning_rate": 3.1391743145402628e-06, "loss": 0.9575, "step": 23066 }, { "epoch": 0.44, "learning_rate": 3.1390266250999023e-06, "loss": 0.8977, "step": 23067 }, { "epoch": 0.44, "learning_rate": 3.1388789332734365e-06, "loss": 1.1229, "step": 23068 }, { "epoch": 0.44, "learning_rate": 3.1387312390614163e-06, "loss": 0.939, "step": 23069 }, { "epoch": 0.44, "learning_rate": 3.1385835424643927e-06, "loss": 1.0712, "step": 23070 }, { "epoch": 0.44, "learning_rate": 3.138435843482918e-06, "loss": 0.6751, "step": 23071 }, { "epoch": 0.44, "learning_rate": 3.138288142117545e-06, "loss": 0.8578, "step": 23072 }, { "epoch": 0.44, "learning_rate": 3.138140438368822e-06, "loss": 0.9894, "step": 23073 }, { "epoch": 0.44, "learning_rate": 3.137992732237302e-06, "loss": 0.9525, "step": 23074 }, { "epoch": 0.44, "learning_rate": 3.137845023723538e-06, "loss": 1.207, "step": 23075 }, { "epoch": 0.44, "learning_rate": 3.137697312828079e-06, "loss": 1.028, "step": 23076 }, { "epoch": 0.44, "learning_rate": 3.1375495995514782e-06, "loss": 0.8258, "step": 23077 }, { "epoch": 0.44, "learning_rate": 3.137401883894287e-06, "loss": 0.9712, "step": 23078 }, { "epoch": 0.44, "learning_rate": 3.1372541658570564e-06, "loss": 0.8384, "step": 23079 }, { "epoch": 0.44, "learning_rate": 3.137106445440338e-06, "loss": 0.7914, "step": 23080 }, { "epoch": 0.44, "learning_rate": 3.1369587226446846e-06, "loss": 1.2366, "step": 23081 }, { "epoch": 0.44, "learning_rate": 3.1368109974706464e-06, "loss": 0.817, "step": 23082 }, { "epoch": 0.44, "learning_rate": 3.136663269918775e-06, "loss": 0.7962, "step": 23083 }, { "epoch": 0.44, "learning_rate": 3.136515539989623e-06, "loss": 0.8566, "step": 23084 }, { "epoch": 0.44, "learning_rate": 3.136367807683741e-06, "loss": 0.9553, "step": 23085 }, { "epoch": 0.44, "learning_rate": 3.136220073001682e-06, "loss": 1.0984, "step": 23086 }, { "epoch": 0.44, "learning_rate": 3.136072335943996e-06, "loss": 1.0592, "step": 23087 }, { "epoch": 0.44, "learning_rate": 3.1359245965112354e-06, "loss": 1.1009, "step": 23088 }, { "epoch": 0.44, "learning_rate": 3.1357768547039524e-06, "loss": 0.7465, "step": 23089 }, { "epoch": 0.44, "learning_rate": 3.1356291105226977e-06, "loss": 1.1203, "step": 23090 }, { "epoch": 0.44, "learning_rate": 3.1354813639680233e-06, "loss": 0.7444, "step": 23091 }, { "epoch": 0.44, "learning_rate": 3.1353336150404813e-06, "loss": 0.7836, "step": 23092 }, { "epoch": 0.44, "learning_rate": 3.135185863740623e-06, "loss": 0.736, "step": 23093 }, { "epoch": 0.44, "learning_rate": 3.1350381100689997e-06, "loss": 1.1271, "step": 23094 }, { "epoch": 0.44, "learning_rate": 3.134890354026164e-06, "loss": 0.843, "step": 23095 }, { "epoch": 0.44, "learning_rate": 3.1347425956126677e-06, "loss": 0.7873, "step": 23096 }, { "epoch": 0.44, "learning_rate": 3.134594834829061e-06, "loss": 0.9891, "step": 23097 }, { "epoch": 0.44, "learning_rate": 3.134447071675897e-06, "loss": 0.8345, "step": 23098 }, { "epoch": 0.44, "learning_rate": 3.1342993061537276e-06, "loss": 1.0358, "step": 23099 }, { "epoch": 0.44, "learning_rate": 3.1341515382631034e-06, "loss": 1.2243, "step": 23100 }, { "epoch": 0.44, "learning_rate": 3.1340037680045766e-06, "loss": 0.9623, "step": 23101 }, { "epoch": 0.44, "learning_rate": 3.1338559953787003e-06, "loss": 1.098, "step": 23102 }, { "epoch": 0.44, "learning_rate": 3.133708220386024e-06, "loss": 0.9146, "step": 23103 }, { "epoch": 0.44, "learning_rate": 3.133560443027101e-06, "loss": 0.9142, "step": 23104 }, { "epoch": 0.44, "learning_rate": 3.133412663302483e-06, "loss": 1.1, "step": 23105 }, { "epoch": 0.44, "learning_rate": 3.133264881212721e-06, "loss": 1.0804, "step": 23106 }, { "epoch": 0.44, "learning_rate": 3.1331170967583675e-06, "loss": 0.8166, "step": 23107 }, { "epoch": 0.44, "learning_rate": 3.1329693099399748e-06, "loss": 0.7682, "step": 23108 }, { "epoch": 0.44, "learning_rate": 3.1328215207580937e-06, "loss": 0.8738, "step": 23109 }, { "epoch": 0.44, "learning_rate": 3.1326737292132757e-06, "loss": 0.8541, "step": 23110 }, { "epoch": 0.44, "learning_rate": 3.1325259353060743e-06, "loss": 0.9088, "step": 23111 }, { "epoch": 0.44, "learning_rate": 3.13237813903704e-06, "loss": 1.0249, "step": 23112 }, { "epoch": 0.44, "learning_rate": 3.1322303404067255e-06, "loss": 1.1251, "step": 23113 }, { "epoch": 0.44, "learning_rate": 3.132082539415683e-06, "loss": 0.9772, "step": 23114 }, { "epoch": 0.44, "learning_rate": 3.1319347360644624e-06, "loss": 0.6751, "step": 23115 }, { "epoch": 0.44, "learning_rate": 3.131786930353617e-06, "loss": 0.7437, "step": 23116 }, { "epoch": 0.44, "learning_rate": 3.1316391222836993e-06, "loss": 0.8456, "step": 23117 }, { "epoch": 0.44, "learning_rate": 3.1314913118552605e-06, "loss": 0.9027, "step": 23118 }, { "epoch": 0.44, "learning_rate": 3.1313434990688506e-06, "loss": 1.3024, "step": 23119 }, { "epoch": 0.44, "learning_rate": 3.1311956839250255e-06, "loss": 1.1176, "step": 23120 }, { "epoch": 0.44, "learning_rate": 3.1310478664243342e-06, "loss": 0.8357, "step": 23121 }, { "epoch": 0.44, "learning_rate": 3.13090004656733e-06, "loss": 0.8111, "step": 23122 }, { "epoch": 0.44, "learning_rate": 3.1307522243545647e-06, "loss": 0.8981, "step": 23123 }, { "epoch": 0.44, "learning_rate": 3.1306043997865892e-06, "loss": 1.1042, "step": 23124 }, { "epoch": 0.44, "learning_rate": 3.130456572863956e-06, "loss": 1.1827, "step": 23125 }, { "epoch": 0.44, "learning_rate": 3.1303087435872174e-06, "loss": 0.7503, "step": 23126 }, { "epoch": 0.44, "learning_rate": 3.130160911956926e-06, "loss": 0.727, "step": 23127 }, { "epoch": 0.44, "learning_rate": 3.1300130779736326e-06, "loss": 0.7194, "step": 23128 }, { "epoch": 0.44, "learning_rate": 3.12986524163789e-06, "loss": 0.9384, "step": 23129 }, { "epoch": 0.44, "learning_rate": 3.129717402950249e-06, "loss": 0.8694, "step": 23130 }, { "epoch": 0.44, "learning_rate": 3.129569561911263e-06, "loss": 1.0756, "step": 23131 }, { "epoch": 0.44, "learning_rate": 3.1294217185214837e-06, "loss": 0.9237, "step": 23132 }, { "epoch": 0.44, "learning_rate": 3.129273872781463e-06, "loss": 0.7921, "step": 23133 }, { "epoch": 0.44, "learning_rate": 3.1291260246917534e-06, "loss": 0.9641, "step": 23134 }, { "epoch": 0.44, "learning_rate": 3.1289781742529057e-06, "loss": 0.812, "step": 23135 }, { "epoch": 0.44, "learning_rate": 3.1288303214654736e-06, "loss": 0.9952, "step": 23136 }, { "epoch": 0.44, "learning_rate": 3.1286824663300074e-06, "loss": 0.909, "step": 23137 }, { "epoch": 0.44, "learning_rate": 3.1285346088470613e-06, "loss": 1.0593, "step": 23138 }, { "epoch": 0.44, "learning_rate": 3.1283867490171855e-06, "loss": 0.8963, "step": 23139 }, { "epoch": 0.44, "learning_rate": 3.128238886840932e-06, "loss": 0.6759, "step": 23140 }, { "epoch": 0.44, "learning_rate": 3.1280910223188554e-06, "loss": 0.7841, "step": 23141 }, { "epoch": 0.44, "learning_rate": 3.1279431554515055e-06, "loss": 0.7805, "step": 23142 }, { "epoch": 0.44, "learning_rate": 3.1277952862394346e-06, "loss": 1.1304, "step": 23143 }, { "epoch": 0.44, "learning_rate": 3.1276474146831966e-06, "loss": 1.0684, "step": 23144 }, { "epoch": 0.44, "learning_rate": 3.1274995407833413e-06, "loss": 0.8557, "step": 23145 }, { "epoch": 0.44, "learning_rate": 3.127351664540422e-06, "loss": 1.0397, "step": 23146 }, { "epoch": 0.44, "learning_rate": 3.1272037859549915e-06, "loss": 0.9847, "step": 23147 }, { "epoch": 0.44, "learning_rate": 3.1270559050276007e-06, "loss": 0.695, "step": 23148 }, { "epoch": 0.44, "learning_rate": 3.126908021758803e-06, "loss": 1.03, "step": 23149 }, { "epoch": 0.44, "learning_rate": 3.1267601361491495e-06, "loss": 0.9811, "step": 23150 }, { "epoch": 0.44, "learning_rate": 3.1266122481991923e-06, "loss": 0.8616, "step": 23151 }, { "epoch": 0.44, "learning_rate": 3.1264643579094854e-06, "loss": 0.8486, "step": 23152 }, { "epoch": 0.44, "learning_rate": 3.1263164652805788e-06, "loss": 0.9069, "step": 23153 }, { "epoch": 0.44, "learning_rate": 3.1261685703130256e-06, "loss": 0.8425, "step": 23154 }, { "epoch": 0.44, "learning_rate": 3.1260206730073795e-06, "loss": 0.7668, "step": 23155 }, { "epoch": 0.44, "learning_rate": 3.12587277336419e-06, "loss": 1.076, "step": 23156 }, { "epoch": 0.44, "learning_rate": 3.1257248713840114e-06, "loss": 0.9221, "step": 23157 }, { "epoch": 0.44, "learning_rate": 3.1255769670673956e-06, "loss": 0.8985, "step": 23158 }, { "epoch": 0.44, "learning_rate": 3.125429060414894e-06, "loss": 0.8799, "step": 23159 }, { "epoch": 0.44, "learning_rate": 3.12528115142706e-06, "loss": 0.8014, "step": 23160 }, { "epoch": 0.44, "learning_rate": 3.125133240104445e-06, "loss": 1.2228, "step": 23161 }, { "epoch": 0.44, "learning_rate": 3.1249853264476015e-06, "loss": 1.2683, "step": 23162 }, { "epoch": 0.44, "learning_rate": 3.1248374104570824e-06, "loss": 0.753, "step": 23163 }, { "epoch": 0.44, "learning_rate": 3.1246894921334394e-06, "loss": 0.8804, "step": 23164 }, { "epoch": 0.44, "learning_rate": 3.1245415714772247e-06, "loss": 0.9839, "step": 23165 }, { "epoch": 0.44, "learning_rate": 3.1243936484889908e-06, "loss": 0.9452, "step": 23166 }, { "epoch": 0.44, "learning_rate": 3.1242457231692906e-06, "loss": 0.9509, "step": 23167 }, { "epoch": 0.44, "learning_rate": 3.1240977955186756e-06, "loss": 1.1093, "step": 23168 }, { "epoch": 0.44, "learning_rate": 3.123949865537699e-06, "loss": 1.0397, "step": 23169 }, { "epoch": 0.44, "learning_rate": 3.123801933226913e-06, "loss": 0.9669, "step": 23170 }, { "epoch": 0.44, "learning_rate": 3.123653998586869e-06, "loss": 0.9038, "step": 23171 }, { "epoch": 0.44, "learning_rate": 3.1235060616181203e-06, "loss": 0.9978, "step": 23172 }, { "epoch": 0.44, "learning_rate": 3.1233581223212194e-06, "loss": 0.8379, "step": 23173 }, { "epoch": 0.44, "learning_rate": 3.1232101806967173e-06, "loss": 1.0676, "step": 23174 }, { "epoch": 0.44, "learning_rate": 3.1230622367451684e-06, "loss": 0.954, "step": 23175 }, { "epoch": 0.44, "learning_rate": 3.122914290467125e-06, "loss": 0.8604, "step": 23176 }, { "epoch": 0.44, "learning_rate": 3.1227663418631378e-06, "loss": 0.7954, "step": 23177 }, { "epoch": 0.44, "learning_rate": 3.1226183909337598e-06, "loss": 0.8698, "step": 23178 }, { "epoch": 0.44, "learning_rate": 3.122470437679545e-06, "loss": 0.9581, "step": 23179 }, { "epoch": 0.44, "learning_rate": 3.122322482101044e-06, "loss": 1.0107, "step": 23180 }, { "epoch": 0.44, "learning_rate": 3.1221745241988095e-06, "loss": 1.0355, "step": 23181 }, { "epoch": 0.44, "learning_rate": 3.122026563973395e-06, "loss": 1.0626, "step": 23182 }, { "epoch": 0.44, "learning_rate": 3.1218786014253523e-06, "loss": 0.9495, "step": 23183 }, { "epoch": 0.44, "learning_rate": 3.1217306365552338e-06, "loss": 0.8956, "step": 23184 }, { "epoch": 0.44, "learning_rate": 3.121582669363592e-06, "loss": 0.9972, "step": 23185 }, { "epoch": 0.44, "learning_rate": 3.1214346998509798e-06, "loss": 0.9369, "step": 23186 }, { "epoch": 0.44, "learning_rate": 3.1212867280179493e-06, "loss": 1.0941, "step": 23187 }, { "epoch": 0.44, "learning_rate": 3.1211387538650535e-06, "loss": 1.1045, "step": 23188 }, { "epoch": 0.44, "learning_rate": 3.1209907773928443e-06, "loss": 0.6793, "step": 23189 }, { "epoch": 0.44, "learning_rate": 3.120842798601875e-06, "loss": 0.9686, "step": 23190 }, { "epoch": 0.44, "learning_rate": 3.1206948174926977e-06, "loss": 0.8585, "step": 23191 }, { "epoch": 0.44, "learning_rate": 3.1205468340658647e-06, "loss": 1.0228, "step": 23192 }, { "epoch": 0.44, "learning_rate": 3.1203988483219287e-06, "loss": 1.0804, "step": 23193 }, { "epoch": 0.44, "learning_rate": 3.1202508602614427e-06, "loss": 0.9477, "step": 23194 }, { "epoch": 0.44, "learning_rate": 3.120102869884959e-06, "loss": 0.9796, "step": 23195 }, { "epoch": 0.44, "learning_rate": 3.11995487719303e-06, "loss": 0.8579, "step": 23196 }, { "epoch": 0.44, "learning_rate": 3.1198068821862087e-06, "loss": 0.8533, "step": 23197 }, { "epoch": 0.44, "learning_rate": 3.119658884865048e-06, "loss": 0.8197, "step": 23198 }, { "epoch": 0.44, "learning_rate": 3.1195108852300986e-06, "loss": 1.0101, "step": 23199 }, { "epoch": 0.44, "learning_rate": 3.119362883281916e-06, "loss": 0.8934, "step": 23200 }, { "epoch": 0.44, "learning_rate": 3.119214879021051e-06, "loss": 1.031, "step": 23201 }, { "epoch": 0.44, "learning_rate": 3.119066872448056e-06, "loss": 1.023, "step": 23202 }, { "epoch": 0.44, "learning_rate": 3.1189188635634847e-06, "loss": 1.0115, "step": 23203 }, { "epoch": 0.44, "learning_rate": 3.1187708523678895e-06, "loss": 0.7877, "step": 23204 }, { "epoch": 0.44, "learning_rate": 3.1186228388618227e-06, "loss": 0.7586, "step": 23205 }, { "epoch": 0.44, "learning_rate": 3.1184748230458377e-06, "loss": 1.0029, "step": 23206 }, { "epoch": 0.44, "learning_rate": 3.118326804920486e-06, "loss": 0.7067, "step": 23207 }, { "epoch": 0.44, "learning_rate": 3.1181787844863208e-06, "loss": 0.9584, "step": 23208 }, { "epoch": 0.44, "learning_rate": 3.1180307617438954e-06, "loss": 1.1389, "step": 23209 }, { "epoch": 0.44, "learning_rate": 3.117882736693762e-06, "loss": 0.6588, "step": 23210 }, { "epoch": 0.44, "learning_rate": 3.1177347093364735e-06, "loss": 1.0801, "step": 23211 }, { "epoch": 0.44, "learning_rate": 3.1175866796725828e-06, "loss": 1.2393, "step": 23212 }, { "epoch": 0.44, "learning_rate": 3.117438647702642e-06, "loss": 1.0763, "step": 23213 }, { "epoch": 0.44, "learning_rate": 3.117290613427204e-06, "loss": 0.9684, "step": 23214 }, { "epoch": 0.44, "learning_rate": 3.117142576846823e-06, "loss": 1.1257, "step": 23215 }, { "epoch": 0.44, "learning_rate": 3.1169945379620485e-06, "loss": 0.8461, "step": 23216 }, { "epoch": 0.44, "learning_rate": 3.116846496773437e-06, "loss": 0.9282, "step": 23217 }, { "epoch": 0.44, "learning_rate": 3.1166984532815393e-06, "loss": 1.2094, "step": 23218 }, { "epoch": 0.44, "learning_rate": 3.116550407486908e-06, "loss": 0.9832, "step": 23219 }, { "epoch": 0.44, "learning_rate": 3.1164023593900965e-06, "loss": 1.0428, "step": 23220 }, { "epoch": 0.44, "learning_rate": 3.116254308991658e-06, "loss": 0.8261, "step": 23221 }, { "epoch": 0.44, "learning_rate": 3.116106256292144e-06, "loss": 0.7817, "step": 23222 }, { "epoch": 0.44, "learning_rate": 3.1159582012921084e-06, "loss": 0.8295, "step": 23223 }, { "epoch": 0.44, "learning_rate": 3.1158101439921042e-06, "loss": 0.944, "step": 23224 }, { "epoch": 0.44, "learning_rate": 3.1156620843926834e-06, "loss": 0.9642, "step": 23225 }, { "epoch": 0.44, "learning_rate": 3.115514022494399e-06, "loss": 1.0085, "step": 23226 }, { "epoch": 0.44, "learning_rate": 3.1153659582978047e-06, "loss": 1.0813, "step": 23227 }, { "epoch": 0.44, "learning_rate": 3.1152178918034527e-06, "loss": 0.8136, "step": 23228 }, { "epoch": 0.44, "learning_rate": 3.1150698230118957e-06, "loss": 0.848, "step": 23229 }, { "epoch": 0.44, "learning_rate": 3.1149217519236867e-06, "loss": 0.9254, "step": 23230 }, { "epoch": 0.44, "learning_rate": 3.114773678539379e-06, "loss": 1.0495, "step": 23231 }, { "epoch": 0.44, "learning_rate": 3.114625602859525e-06, "loss": 1.1415, "step": 23232 }, { "epoch": 0.44, "learning_rate": 3.1144775248846783e-06, "loss": 0.8061, "step": 23233 }, { "epoch": 0.44, "learning_rate": 3.114329444615391e-06, "loss": 0.8732, "step": 23234 }, { "epoch": 0.44, "learning_rate": 3.1141813620522167e-06, "loss": 0.7705, "step": 23235 }, { "epoch": 0.44, "learning_rate": 3.1140332771957083e-06, "loss": 1.0783, "step": 23236 }, { "epoch": 0.44, "learning_rate": 3.113885190046417e-06, "loss": 0.973, "step": 23237 }, { "epoch": 0.44, "learning_rate": 3.1137371006048983e-06, "loss": 1.0212, "step": 23238 }, { "epoch": 0.44, "learning_rate": 3.113589008871704e-06, "loss": 0.9694, "step": 23239 }, { "epoch": 0.44, "learning_rate": 3.113440914847387e-06, "loss": 0.8937, "step": 23240 }, { "epoch": 0.44, "learning_rate": 3.1132928185325007e-06, "loss": 0.7814, "step": 23241 }, { "epoch": 0.44, "learning_rate": 3.113144719927598e-06, "loss": 0.6968, "step": 23242 }, { "epoch": 0.44, "learning_rate": 3.112996619033232e-06, "loss": 0.9495, "step": 23243 }, { "epoch": 0.44, "learning_rate": 3.1128485158499544e-06, "loss": 0.9626, "step": 23244 }, { "epoch": 0.44, "learning_rate": 3.112700410378319e-06, "loss": 1.0869, "step": 23245 }, { "epoch": 0.44, "learning_rate": 3.1125523026188796e-06, "loss": 0.8493, "step": 23246 }, { "epoch": 0.44, "learning_rate": 3.1124041925721894e-06, "loss": 0.966, "step": 23247 }, { "epoch": 0.44, "learning_rate": 3.1122560802388004e-06, "loss": 0.9442, "step": 23248 }, { "epoch": 0.44, "learning_rate": 3.1121079656192656e-06, "loss": 0.9191, "step": 23249 }, { "epoch": 0.44, "learning_rate": 3.1119598487141378e-06, "loss": 0.968, "step": 23250 }, { "epoch": 0.44, "learning_rate": 3.1118117295239713e-06, "loss": 0.895, "step": 23251 }, { "epoch": 0.44, "learning_rate": 3.111663608049319e-06, "loss": 1.2506, "step": 23252 }, { "epoch": 0.44, "learning_rate": 3.111515484290733e-06, "loss": 0.9701, "step": 23253 }, { "epoch": 0.44, "learning_rate": 3.1113673582487676e-06, "loss": 0.9968, "step": 23254 }, { "epoch": 0.44, "learning_rate": 3.1112192299239746e-06, "loss": 1.0092, "step": 23255 }, { "epoch": 0.44, "learning_rate": 3.111071099316908e-06, "loss": 1.2629, "step": 23256 }, { "epoch": 0.44, "learning_rate": 3.1109229664281203e-06, "loss": 0.927, "step": 23257 }, { "epoch": 0.44, "learning_rate": 3.110774831258165e-06, "loss": 0.9489, "step": 23258 }, { "epoch": 0.44, "learning_rate": 3.110626693807595e-06, "loss": 0.8698, "step": 23259 }, { "epoch": 0.44, "learning_rate": 3.110478554076965e-06, "loss": 0.9352, "step": 23260 }, { "epoch": 0.44, "learning_rate": 3.1103304120668253e-06, "loss": 0.727, "step": 23261 }, { "epoch": 0.44, "learning_rate": 3.1101822677777317e-06, "loss": 0.9714, "step": 23262 }, { "epoch": 0.44, "learning_rate": 3.110034121210236e-06, "loss": 0.7841, "step": 23263 }, { "epoch": 0.44, "learning_rate": 3.1098859723648912e-06, "loss": 0.9887, "step": 23264 }, { "epoch": 0.44, "learning_rate": 3.10973782124225e-06, "loss": 0.9472, "step": 23265 }, { "epoch": 0.44, "learning_rate": 3.109589667842868e-06, "loss": 0.8334, "step": 23266 }, { "epoch": 0.44, "learning_rate": 3.1094415121672963e-06, "loss": 0.8214, "step": 23267 }, { "epoch": 0.44, "learning_rate": 3.1092933542160885e-06, "loss": 0.8804, "step": 23268 }, { "epoch": 0.44, "learning_rate": 3.109145193989798e-06, "loss": 1.0976, "step": 23269 }, { "epoch": 0.44, "learning_rate": 3.1089970314889783e-06, "loss": 1.0368, "step": 23270 }, { "epoch": 0.44, "learning_rate": 3.108848866714182e-06, "loss": 0.934, "step": 23271 }, { "epoch": 0.44, "learning_rate": 3.108700699665963e-06, "loss": 0.9493, "step": 23272 }, { "epoch": 0.44, "learning_rate": 3.108552530344874e-06, "loss": 0.7206, "step": 23273 }, { "epoch": 0.44, "learning_rate": 3.108404358751469e-06, "loss": 0.8828, "step": 23274 }, { "epoch": 0.44, "learning_rate": 3.1082561848863004e-06, "loss": 1.1512, "step": 23275 }, { "epoch": 0.44, "learning_rate": 3.1081080087499217e-06, "loss": 1.0635, "step": 23276 }, { "epoch": 0.44, "learning_rate": 3.107959830342887e-06, "loss": 0.7531, "step": 23277 }, { "epoch": 0.44, "learning_rate": 3.1078116496657483e-06, "loss": 0.8735, "step": 23278 }, { "epoch": 0.44, "learning_rate": 3.107663466719059e-06, "loss": 1.0101, "step": 23279 }, { "epoch": 0.44, "learning_rate": 3.1075152815033745e-06, "loss": 0.8858, "step": 23280 }, { "epoch": 0.44, "learning_rate": 3.1073670940192454e-06, "loss": 0.9863, "step": 23281 }, { "epoch": 0.44, "learning_rate": 3.1072189042672262e-06, "loss": 0.8173, "step": 23282 }, { "epoch": 0.44, "learning_rate": 3.107070712247871e-06, "loss": 0.9098, "step": 23283 }, { "epoch": 0.44, "learning_rate": 3.106922517961732e-06, "loss": 0.904, "step": 23284 }, { "epoch": 0.44, "learning_rate": 3.1067743214093625e-06, "loss": 1.062, "step": 23285 }, { "epoch": 0.44, "learning_rate": 3.106626122591317e-06, "loss": 0.9493, "step": 23286 }, { "epoch": 0.44, "learning_rate": 3.1064779215081474e-06, "loss": 1.2412, "step": 23287 }, { "epoch": 0.44, "learning_rate": 3.106329718160408e-06, "loss": 1.0962, "step": 23288 }, { "epoch": 0.44, "learning_rate": 3.1061815125486527e-06, "loss": 1.1369, "step": 23289 }, { "epoch": 0.44, "learning_rate": 3.1060333046734336e-06, "loss": 0.7786, "step": 23290 }, { "epoch": 0.44, "learning_rate": 3.1058850945353055e-06, "loss": 0.8432, "step": 23291 }, { "epoch": 0.44, "learning_rate": 3.10573688213482e-06, "loss": 0.7731, "step": 23292 }, { "epoch": 0.44, "learning_rate": 3.1055886674725318e-06, "loss": 1.0093, "step": 23293 }, { "epoch": 0.44, "learning_rate": 3.105440450548994e-06, "loss": 1.1505, "step": 23294 }, { "epoch": 0.44, "learning_rate": 3.105292231364761e-06, "loss": 0.9632, "step": 23295 }, { "epoch": 0.44, "learning_rate": 3.1051440099203843e-06, "loss": 1.0505, "step": 23296 }, { "epoch": 0.44, "learning_rate": 3.104995786216419e-06, "loss": 0.9551, "step": 23297 }, { "epoch": 0.44, "learning_rate": 3.1048475602534183e-06, "loss": 0.8326, "step": 23298 }, { "epoch": 0.44, "learning_rate": 3.104699332031935e-06, "loss": 1.2307, "step": 23299 }, { "epoch": 0.44, "learning_rate": 3.104551101552522e-06, "loss": 1.083, "step": 23300 }, { "epoch": 0.44, "learning_rate": 3.104402868815735e-06, "loss": 0.9142, "step": 23301 }, { "epoch": 0.44, "learning_rate": 3.1042546338221257e-06, "loss": 0.9102, "step": 23302 }, { "epoch": 0.44, "learning_rate": 3.1041063965722482e-06, "loss": 0.8779, "step": 23303 }, { "epoch": 0.44, "learning_rate": 3.1039581570666564e-06, "loss": 0.8712, "step": 23304 }, { "epoch": 0.44, "learning_rate": 3.1038099153059033e-06, "loss": 1.0312, "step": 23305 }, { "epoch": 0.44, "learning_rate": 3.1036616712905416e-06, "loss": 1.1883, "step": 23306 }, { "epoch": 0.44, "learning_rate": 3.103513425021126e-06, "loss": 0.9382, "step": 23307 }, { "epoch": 0.44, "learning_rate": 3.1033651764982096e-06, "loss": 0.7641, "step": 23308 }, { "epoch": 0.44, "learning_rate": 3.1032169257223464e-06, "loss": 1.0533, "step": 23309 }, { "epoch": 0.44, "learning_rate": 3.103068672694091e-06, "loss": 0.8851, "step": 23310 }, { "epoch": 0.44, "learning_rate": 3.1029204174139944e-06, "loss": 0.8741, "step": 23311 }, { "epoch": 0.44, "learning_rate": 3.102772159882611e-06, "loss": 1.1553, "step": 23312 }, { "epoch": 0.44, "learning_rate": 3.1026239001004954e-06, "loss": 0.9622, "step": 23313 }, { "epoch": 0.44, "learning_rate": 3.102475638068201e-06, "loss": 0.8488, "step": 23314 }, { "epoch": 0.44, "learning_rate": 3.1023273737862804e-06, "loss": 0.9057, "step": 23315 }, { "epoch": 0.44, "learning_rate": 3.102179107255288e-06, "loss": 0.7444, "step": 23316 }, { "epoch": 0.44, "learning_rate": 3.1020308384757775e-06, "loss": 0.7408, "step": 23317 }, { "epoch": 0.44, "learning_rate": 3.1018825674483022e-06, "loss": 0.9854, "step": 23318 }, { "epoch": 0.44, "learning_rate": 3.1017342941734164e-06, "loss": 1.0232, "step": 23319 }, { "epoch": 0.44, "learning_rate": 3.1015860186516716e-06, "loss": 1.0171, "step": 23320 }, { "epoch": 0.44, "learning_rate": 3.1014377408836245e-06, "loss": 0.8807, "step": 23321 }, { "epoch": 0.44, "learning_rate": 3.1012894608698268e-06, "loss": 0.8611, "step": 23322 }, { "epoch": 0.44, "learning_rate": 3.101141178610833e-06, "loss": 0.7827, "step": 23323 }, { "epoch": 0.44, "learning_rate": 3.100992894107196e-06, "loss": 0.9886, "step": 23324 }, { "epoch": 0.44, "learning_rate": 3.1008446073594708e-06, "loss": 1.1307, "step": 23325 }, { "epoch": 0.44, "learning_rate": 3.1006963183682092e-06, "loss": 0.9877, "step": 23326 }, { "epoch": 0.44, "learning_rate": 3.1005480271339668e-06, "loss": 0.725, "step": 23327 }, { "epoch": 0.44, "learning_rate": 3.100399733657296e-06, "loss": 1.0229, "step": 23328 }, { "epoch": 0.44, "learning_rate": 3.100251437938751e-06, "loss": 0.7941, "step": 23329 }, { "epoch": 0.44, "learning_rate": 3.1001031399788857e-06, "loss": 1.0916, "step": 23330 }, { "epoch": 0.44, "learning_rate": 3.0999548397782536e-06, "loss": 1.1096, "step": 23331 }, { "epoch": 0.44, "learning_rate": 3.0998065373374086e-06, "loss": 1.0641, "step": 23332 }, { "epoch": 0.44, "learning_rate": 3.099658232656904e-06, "loss": 0.9018, "step": 23333 }, { "epoch": 0.44, "learning_rate": 3.0995099257372948e-06, "loss": 1.1937, "step": 23334 }, { "epoch": 0.44, "learning_rate": 3.099361616579133e-06, "loss": 0.961, "step": 23335 }, { "epoch": 0.44, "learning_rate": 3.0992133051829737e-06, "loss": 1.1307, "step": 23336 }, { "epoch": 0.44, "learning_rate": 3.099064991549371e-06, "loss": 1.2451, "step": 23337 }, { "epoch": 0.44, "learning_rate": 3.0989166756788767e-06, "loss": 1.0241, "step": 23338 }, { "epoch": 0.44, "learning_rate": 3.098768357572046e-06, "loss": 0.8883, "step": 23339 }, { "epoch": 0.44, "learning_rate": 3.098620037229434e-06, "loss": 0.9136, "step": 23340 }, { "epoch": 0.44, "learning_rate": 3.098471714651592e-06, "loss": 0.9846, "step": 23341 }, { "epoch": 0.44, "learning_rate": 3.0983233898390747e-06, "loss": 0.9613, "step": 23342 }, { "epoch": 0.44, "learning_rate": 3.0981750627924372e-06, "loss": 0.9471, "step": 23343 }, { "epoch": 0.44, "learning_rate": 3.0980267335122314e-06, "loss": 0.9967, "step": 23344 }, { "epoch": 0.44, "learning_rate": 3.0978784019990126e-06, "loss": 0.9874, "step": 23345 }, { "epoch": 0.44, "learning_rate": 3.0977300682533347e-06, "loss": 0.8811, "step": 23346 }, { "epoch": 0.44, "learning_rate": 3.0975817322757507e-06, "loss": 1.0841, "step": 23347 }, { "epoch": 0.44, "learning_rate": 3.0974333940668144e-06, "loss": 0.9398, "step": 23348 }, { "epoch": 0.44, "learning_rate": 3.0972850536270804e-06, "loss": 0.9135, "step": 23349 }, { "epoch": 0.44, "learning_rate": 3.0971367109571023e-06, "loss": 0.8767, "step": 23350 }, { "epoch": 0.44, "learning_rate": 3.0969883660574336e-06, "loss": 1.0069, "step": 23351 }, { "epoch": 0.44, "learning_rate": 3.0968400189286296e-06, "loss": 1.0202, "step": 23352 }, { "epoch": 0.44, "learning_rate": 3.0966916695712425e-06, "loss": 1.0901, "step": 23353 }, { "epoch": 0.44, "learning_rate": 3.096543317985827e-06, "loss": 0.8303, "step": 23354 }, { "epoch": 0.44, "learning_rate": 3.0963949641729375e-06, "loss": 0.99, "step": 23355 }, { "epoch": 0.44, "learning_rate": 3.096246608133127e-06, "loss": 0.9843, "step": 23356 }, { "epoch": 0.44, "learning_rate": 3.09609824986695e-06, "loss": 0.765, "step": 23357 }, { "epoch": 0.44, "learning_rate": 3.095949889374961e-06, "loss": 0.8729, "step": 23358 }, { "epoch": 0.44, "learning_rate": 3.095801526657713e-06, "loss": 1.0366, "step": 23359 }, { "epoch": 0.44, "learning_rate": 3.0956531617157603e-06, "loss": 0.98, "step": 23360 }, { "epoch": 0.44, "learning_rate": 3.0955047945496575e-06, "loss": 0.8185, "step": 23361 }, { "epoch": 0.44, "learning_rate": 3.0953564251599565e-06, "loss": 1.143, "step": 23362 }, { "epoch": 0.44, "learning_rate": 3.095208053547214e-06, "loss": 0.8385, "step": 23363 }, { "epoch": 0.44, "learning_rate": 3.0950596797119835e-06, "loss": 0.8203, "step": 23364 }, { "epoch": 0.44, "learning_rate": 3.0949113036548173e-06, "loss": 1.1154, "step": 23365 }, { "epoch": 0.44, "learning_rate": 3.094762925376271e-06, "loss": 0.9254, "step": 23366 }, { "epoch": 0.44, "learning_rate": 3.0946145448768987e-06, "loss": 0.7991, "step": 23367 }, { "epoch": 0.44, "learning_rate": 3.094466162157253e-06, "loss": 0.9683, "step": 23368 }, { "epoch": 0.44, "learning_rate": 3.0943177772178897e-06, "loss": 1.1266, "step": 23369 }, { "epoch": 0.44, "learning_rate": 3.094169390059361e-06, "loss": 0.9297, "step": 23370 }, { "epoch": 0.44, "learning_rate": 3.0940210006822222e-06, "loss": 1.0107, "step": 23371 }, { "epoch": 0.44, "learning_rate": 3.093872609087028e-06, "loss": 0.9062, "step": 23372 }, { "epoch": 0.44, "learning_rate": 3.093724215274332e-06, "loss": 0.9077, "step": 23373 }, { "epoch": 0.44, "learning_rate": 3.093575819244687e-06, "loss": 0.9103, "step": 23374 }, { "epoch": 0.44, "learning_rate": 3.0934274209986483e-06, "loss": 1.0232, "step": 23375 }, { "epoch": 0.44, "learning_rate": 3.0932790205367697e-06, "loss": 1.0182, "step": 23376 }, { "epoch": 0.44, "learning_rate": 3.0931306178596055e-06, "loss": 0.8195, "step": 23377 }, { "epoch": 0.44, "learning_rate": 3.0929822129677094e-06, "loss": 0.7343, "step": 23378 }, { "epoch": 0.44, "learning_rate": 3.092833805861637e-06, "loss": 0.8906, "step": 23379 }, { "epoch": 0.44, "learning_rate": 3.09268539654194e-06, "loss": 0.8526, "step": 23380 }, { "epoch": 0.44, "learning_rate": 3.0925369850091745e-06, "loss": 1.1703, "step": 23381 }, { "epoch": 0.44, "learning_rate": 3.092388571263895e-06, "loss": 0.9232, "step": 23382 }, { "epoch": 0.44, "learning_rate": 3.0922401553066533e-06, "loss": 1.0607, "step": 23383 }, { "epoch": 0.44, "learning_rate": 3.0920917371380062e-06, "loss": 0.8188, "step": 23384 }, { "epoch": 0.44, "learning_rate": 3.0919433167585057e-06, "loss": 0.7585, "step": 23385 }, { "epoch": 0.44, "learning_rate": 3.091794894168707e-06, "loss": 0.9176, "step": 23386 }, { "epoch": 0.44, "learning_rate": 3.0916464693691654e-06, "loss": 1.2246, "step": 23387 }, { "epoch": 0.44, "learning_rate": 3.0914980423604335e-06, "loss": 1.008, "step": 23388 }, { "epoch": 0.44, "learning_rate": 3.0913496131430654e-06, "loss": 1.0029, "step": 23389 }, { "epoch": 0.44, "learning_rate": 3.091201181717617e-06, "loss": 0.8302, "step": 23390 }, { "epoch": 0.44, "learning_rate": 3.0910527480846402e-06, "loss": 0.6837, "step": 23391 }, { "epoch": 0.44, "learning_rate": 3.090904312244691e-06, "loss": 0.9048, "step": 23392 }, { "epoch": 0.44, "learning_rate": 3.0907558741983246e-06, "loss": 0.9658, "step": 23393 }, { "epoch": 0.44, "learning_rate": 3.0906074339460925e-06, "loss": 1.2086, "step": 23394 }, { "epoch": 0.44, "learning_rate": 3.0904589914885507e-06, "loss": 0.965, "step": 23395 }, { "epoch": 0.44, "learning_rate": 3.090310546826253e-06, "loss": 0.9406, "step": 23396 }, { "epoch": 0.44, "learning_rate": 3.090162099959754e-06, "loss": 0.8732, "step": 23397 }, { "epoch": 0.44, "learning_rate": 3.090013650889607e-06, "loss": 0.7184, "step": 23398 }, { "epoch": 0.44, "learning_rate": 3.089865199616369e-06, "loss": 0.9017, "step": 23399 }, { "epoch": 0.44, "learning_rate": 3.0897167461405908e-06, "loss": 1.1221, "step": 23400 }, { "epoch": 0.44, "learning_rate": 3.089568290462829e-06, "loss": 0.9331, "step": 23401 }, { "epoch": 0.44, "learning_rate": 3.089419832583638e-06, "loss": 0.6041, "step": 23402 }, { "epoch": 0.44, "learning_rate": 3.08927137250357e-06, "loss": 0.9272, "step": 23403 }, { "epoch": 0.44, "learning_rate": 3.0891229102231806e-06, "loss": 0.9059, "step": 23404 }, { "epoch": 0.44, "learning_rate": 3.0889744457430253e-06, "loss": 1.1778, "step": 23405 }, { "epoch": 0.44, "learning_rate": 3.088825979063657e-06, "loss": 0.9264, "step": 23406 }, { "epoch": 0.44, "learning_rate": 3.0886775101856308e-06, "loss": 0.9612, "step": 23407 }, { "epoch": 0.44, "learning_rate": 3.088529039109501e-06, "loss": 0.8381, "step": 23408 }, { "epoch": 0.44, "learning_rate": 3.0883805658358217e-06, "loss": 1.0081, "step": 23409 }, { "epoch": 0.44, "learning_rate": 3.0882320903651475e-06, "loss": 0.7869, "step": 23410 }, { "epoch": 0.44, "learning_rate": 3.088083612698032e-06, "loss": 0.9747, "step": 23411 }, { "epoch": 0.44, "learning_rate": 3.087935132835031e-06, "loss": 1.1693, "step": 23412 }, { "epoch": 0.44, "learning_rate": 3.087786650776698e-06, "loss": 0.9942, "step": 23413 }, { "epoch": 0.44, "learning_rate": 3.0876381665235875e-06, "loss": 0.9368, "step": 23414 }, { "epoch": 0.44, "learning_rate": 3.087489680076255e-06, "loss": 0.777, "step": 23415 }, { "epoch": 0.44, "learning_rate": 3.087341191435253e-06, "loss": 0.916, "step": 23416 }, { "epoch": 0.44, "learning_rate": 3.0871927006011372e-06, "loss": 0.899, "step": 23417 }, { "epoch": 0.44, "learning_rate": 3.087044207574462e-06, "loss": 1.1307, "step": 23418 }, { "epoch": 0.44, "learning_rate": 3.086895712355782e-06, "loss": 0.9774, "step": 23419 }, { "epoch": 0.44, "learning_rate": 3.0867472149456513e-06, "loss": 0.9896, "step": 23420 }, { "epoch": 0.44, "learning_rate": 3.086598715344624e-06, "loss": 0.8328, "step": 23421 }, { "epoch": 0.44, "learning_rate": 3.086450213553256e-06, "loss": 0.8211, "step": 23422 }, { "epoch": 0.44, "learning_rate": 3.0863017095721006e-06, "loss": 0.7672, "step": 23423 }, { "epoch": 0.44, "learning_rate": 3.086153203401712e-06, "loss": 1.0691, "step": 23424 }, { "epoch": 0.44, "learning_rate": 3.0860046950426447e-06, "loss": 1.046, "step": 23425 }, { "epoch": 0.44, "learning_rate": 3.0858561844954552e-06, "loss": 0.8493, "step": 23426 }, { "epoch": 0.44, "learning_rate": 3.0857076717606965e-06, "loss": 0.8904, "step": 23427 }, { "epoch": 0.44, "learning_rate": 3.0855591568389233e-06, "loss": 0.891, "step": 23428 }, { "epoch": 0.44, "learning_rate": 3.08541063973069e-06, "loss": 0.9186, "step": 23429 }, { "epoch": 0.44, "learning_rate": 3.085262120436551e-06, "loss": 0.9739, "step": 23430 }, { "epoch": 0.44, "learning_rate": 3.085113598957061e-06, "loss": 1.04, "step": 23431 }, { "epoch": 0.44, "learning_rate": 3.084965075292776e-06, "loss": 0.9593, "step": 23432 }, { "epoch": 0.44, "learning_rate": 3.084816549444248e-06, "loss": 0.7676, "step": 23433 }, { "epoch": 0.44, "learning_rate": 3.0846680214120335e-06, "loss": 0.857, "step": 23434 }, { "epoch": 0.44, "learning_rate": 3.084519491196687e-06, "loss": 1.0431, "step": 23435 }, { "epoch": 0.44, "learning_rate": 3.0843709587987618e-06, "loss": 0.9351, "step": 23436 }, { "epoch": 0.44, "learning_rate": 3.0842224242188133e-06, "loss": 1.1015, "step": 23437 }, { "epoch": 0.44, "learning_rate": 3.0840738874573966e-06, "loss": 0.7998, "step": 23438 }, { "epoch": 0.44, "learning_rate": 3.083925348515066e-06, "loss": 0.8365, "step": 23439 }, { "epoch": 0.44, "learning_rate": 3.0837768073923756e-06, "loss": 0.8537, "step": 23440 }, { "epoch": 0.44, "learning_rate": 3.0836282640898812e-06, "loss": 0.726, "step": 23441 }, { "epoch": 0.44, "learning_rate": 3.0834797186081367e-06, "loss": 1.0528, "step": 23442 }, { "epoch": 0.44, "learning_rate": 3.0833311709476964e-06, "loss": 1.0759, "step": 23443 }, { "epoch": 0.44, "learning_rate": 3.083182621109116e-06, "loss": 0.9593, "step": 23444 }, { "epoch": 0.44, "learning_rate": 3.083034069092949e-06, "loss": 0.9905, "step": 23445 }, { "epoch": 0.44, "learning_rate": 3.08288551489975e-06, "loss": 0.94, "step": 23446 }, { "epoch": 0.44, "learning_rate": 3.0827369585300755e-06, "loss": 0.8886, "step": 23447 }, { "epoch": 0.44, "learning_rate": 3.0825883999844787e-06, "loss": 0.9158, "step": 23448 }, { "epoch": 0.44, "learning_rate": 3.082439839263514e-06, "loss": 1.0828, "step": 23449 }, { "epoch": 0.44, "learning_rate": 3.0822912763677383e-06, "loss": 1.0872, "step": 23450 }, { "epoch": 0.44, "learning_rate": 3.082142711297704e-06, "loss": 0.9213, "step": 23451 }, { "epoch": 0.44, "learning_rate": 3.0819941440539664e-06, "loss": 0.7715, "step": 23452 }, { "epoch": 0.44, "learning_rate": 3.081845574637081e-06, "loss": 0.8457, "step": 23453 }, { "epoch": 0.44, "learning_rate": 3.081697003047601e-06, "loss": 0.9218, "step": 23454 }, { "epoch": 0.44, "learning_rate": 3.081548429286083e-06, "loss": 0.9278, "step": 23455 }, { "epoch": 0.44, "learning_rate": 3.0813998533530815e-06, "loss": 0.9465, "step": 23456 }, { "epoch": 0.44, "learning_rate": 3.08125127524915e-06, "loss": 0.9206, "step": 23457 }, { "epoch": 0.44, "learning_rate": 3.0811026949748446e-06, "loss": 0.7857, "step": 23458 }, { "epoch": 0.44, "learning_rate": 3.080954112530719e-06, "loss": 0.9008, "step": 23459 }, { "epoch": 0.44, "learning_rate": 3.0808055279173287e-06, "loss": 0.8972, "step": 23460 }, { "epoch": 0.44, "learning_rate": 3.0806569411352288e-06, "loss": 0.8335, "step": 23461 }, { "epoch": 0.44, "learning_rate": 3.080508352184974e-06, "loss": 0.8686, "step": 23462 }, { "epoch": 0.44, "learning_rate": 3.080359761067118e-06, "loss": 0.9083, "step": 23463 }, { "epoch": 0.44, "learning_rate": 3.0802111677822164e-06, "loss": 0.9131, "step": 23464 }, { "epoch": 0.44, "learning_rate": 3.0800625723308245e-06, "loss": 0.8073, "step": 23465 }, { "epoch": 0.44, "learning_rate": 3.079913974713497e-06, "loss": 0.9105, "step": 23466 }, { "epoch": 0.44, "learning_rate": 3.0797653749307877e-06, "loss": 1.0767, "step": 23467 }, { "epoch": 0.44, "learning_rate": 3.0796167729832528e-06, "loss": 0.976, "step": 23468 }, { "epoch": 0.44, "learning_rate": 3.0794681688714466e-06, "loss": 1.0564, "step": 23469 }, { "epoch": 0.44, "learning_rate": 3.0793195625959236e-06, "loss": 1.0228, "step": 23470 }, { "epoch": 0.44, "learning_rate": 3.07917095415724e-06, "loss": 0.8043, "step": 23471 }, { "epoch": 0.44, "learning_rate": 3.079022343555949e-06, "loss": 0.926, "step": 23472 }, { "epoch": 0.44, "learning_rate": 3.0788737307926065e-06, "loss": 0.8441, "step": 23473 }, { "epoch": 0.44, "learning_rate": 3.078725115867767e-06, "loss": 0.9687, "step": 23474 }, { "epoch": 0.44, "learning_rate": 3.0785764987819865e-06, "loss": 1.1723, "step": 23475 }, { "epoch": 0.44, "learning_rate": 3.078427879535818e-06, "loss": 0.8954, "step": 23476 }, { "epoch": 0.44, "learning_rate": 3.0782792581298186e-06, "loss": 0.8251, "step": 23477 }, { "epoch": 0.44, "learning_rate": 3.0781306345645417e-06, "loss": 1.0853, "step": 23478 }, { "epoch": 0.44, "learning_rate": 3.0779820088405425e-06, "loss": 0.6817, "step": 23479 }, { "epoch": 0.44, "learning_rate": 3.0778333809583767e-06, "loss": 0.9436, "step": 23480 }, { "epoch": 0.44, "learning_rate": 3.077684750918598e-06, "loss": 1.2136, "step": 23481 }, { "epoch": 0.44, "learning_rate": 3.077536118721763e-06, "loss": 1.0576, "step": 23482 }, { "epoch": 0.44, "learning_rate": 3.0773874843684258e-06, "loss": 0.7744, "step": 23483 }, { "epoch": 0.44, "learning_rate": 3.077238847859141e-06, "loss": 0.8614, "step": 23484 }, { "epoch": 0.44, "learning_rate": 3.0770902091944645e-06, "loss": 0.7684, "step": 23485 }, { "epoch": 0.44, "learning_rate": 3.0769415683749503e-06, "loss": 0.8154, "step": 23486 }, { "epoch": 0.44, "learning_rate": 3.0767929254011544e-06, "loss": 1.0515, "step": 23487 }, { "epoch": 0.44, "learning_rate": 3.0766442802736306e-06, "loss": 0.8924, "step": 23488 }, { "epoch": 0.44, "learning_rate": 3.0764956329929356e-06, "loss": 1.056, "step": 23489 }, { "epoch": 0.44, "learning_rate": 3.076346983559623e-06, "loss": 0.7639, "step": 23490 }, { "epoch": 0.44, "learning_rate": 3.0761983319742487e-06, "loss": 0.9047, "step": 23491 }, { "epoch": 0.44, "learning_rate": 3.076049678237368e-06, "loss": 0.8754, "step": 23492 }, { "epoch": 0.44, "learning_rate": 3.0759010223495355e-06, "loss": 0.807, "step": 23493 }, { "epoch": 0.44, "learning_rate": 3.075752364311305e-06, "loss": 1.0887, "step": 23494 }, { "epoch": 0.44, "learning_rate": 3.075603704123234e-06, "loss": 1.0192, "step": 23495 }, { "epoch": 0.44, "learning_rate": 3.0754550417858758e-06, "loss": 0.9212, "step": 23496 }, { "epoch": 0.44, "learning_rate": 3.075306377299786e-06, "loss": 0.9297, "step": 23497 }, { "epoch": 0.44, "learning_rate": 3.0751577106655205e-06, "loss": 0.9417, "step": 23498 }, { "epoch": 0.44, "learning_rate": 3.0750090418836335e-06, "loss": 0.9651, "step": 23499 }, { "epoch": 0.44, "learning_rate": 3.074860370954681e-06, "loss": 1.2463, "step": 23500 }, { "epoch": 0.44, "learning_rate": 3.074711697879216e-06, "loss": 1.0186, "step": 23501 }, { "epoch": 0.44, "learning_rate": 3.074563022657796e-06, "loss": 0.9235, "step": 23502 }, { "epoch": 0.44, "learning_rate": 3.0744143452909753e-06, "loss": 0.9406, "step": 23503 }, { "epoch": 0.44, "learning_rate": 3.074265665779309e-06, "loss": 0.965, "step": 23504 }, { "epoch": 0.44, "learning_rate": 3.074116984123352e-06, "loss": 0.9443, "step": 23505 }, { "epoch": 0.44, "learning_rate": 3.0739683003236605e-06, "loss": 1.0663, "step": 23506 }, { "epoch": 0.44, "learning_rate": 3.0738196143807886e-06, "loss": 0.9488, "step": 23507 }, { "epoch": 0.44, "learning_rate": 3.0736709262952915e-06, "loss": 0.7858, "step": 23508 }, { "epoch": 0.44, "learning_rate": 3.0735222360677246e-06, "loss": 0.963, "step": 23509 }, { "epoch": 0.44, "learning_rate": 3.073373543698644e-06, "loss": 0.759, "step": 23510 }, { "epoch": 0.44, "learning_rate": 3.0732248491886036e-06, "loss": 1.0912, "step": 23511 }, { "epoch": 0.44, "learning_rate": 3.0730761525381596e-06, "loss": 1.0762, "step": 23512 }, { "epoch": 0.44, "learning_rate": 3.072927453747867e-06, "loss": 0.9216, "step": 23513 }, { "epoch": 0.44, "learning_rate": 3.07277875281828e-06, "loss": 0.8547, "step": 23514 }, { "epoch": 0.44, "learning_rate": 3.072630049749955e-06, "loss": 0.8728, "step": 23515 }, { "epoch": 0.44, "learning_rate": 3.072481344543447e-06, "loss": 0.6945, "step": 23516 }, { "epoch": 0.44, "learning_rate": 3.072332637199312e-06, "loss": 0.9804, "step": 23517 }, { "epoch": 0.44, "learning_rate": 3.0721839277181038e-06, "loss": 1.0965, "step": 23518 }, { "epoch": 0.44, "learning_rate": 3.072035216100378e-06, "loss": 1.0451, "step": 23519 }, { "epoch": 0.44, "learning_rate": 3.071886502346691e-06, "loss": 1.0754, "step": 23520 }, { "epoch": 0.44, "learning_rate": 3.071737786457597e-06, "loss": 0.7579, "step": 23521 }, { "epoch": 0.44, "learning_rate": 3.0715890684336513e-06, "loss": 0.8875, "step": 23522 }, { "epoch": 0.44, "learning_rate": 3.0714403482754096e-06, "loss": 0.8495, "step": 23523 }, { "epoch": 0.44, "learning_rate": 3.071291625983428e-06, "loss": 1.0323, "step": 23524 }, { "epoch": 0.44, "learning_rate": 3.07114290155826e-06, "loss": 1.0482, "step": 23525 }, { "epoch": 0.44, "learning_rate": 3.0709941750004625e-06, "loss": 1.0667, "step": 23526 }, { "epoch": 0.44, "learning_rate": 3.0708454463105902e-06, "loss": 0.8685, "step": 23527 }, { "epoch": 0.44, "learning_rate": 3.070696715489198e-06, "loss": 0.9874, "step": 23528 }, { "epoch": 0.44, "learning_rate": 3.070547982536842e-06, "loss": 0.8547, "step": 23529 }, { "epoch": 0.44, "learning_rate": 3.0703992474540776e-06, "loss": 0.8574, "step": 23530 }, { "epoch": 0.44, "learning_rate": 3.0702505102414598e-06, "loss": 1.2029, "step": 23531 }, { "epoch": 0.44, "learning_rate": 3.070101770899544e-06, "loss": 0.9305, "step": 23532 }, { "epoch": 0.44, "learning_rate": 3.069953029428886e-06, "loss": 0.8597, "step": 23533 }, { "epoch": 0.44, "learning_rate": 3.06980428583004e-06, "loss": 0.9437, "step": 23534 }, { "epoch": 0.44, "learning_rate": 3.0696555401035634e-06, "loss": 0.9083, "step": 23535 }, { "epoch": 0.44, "learning_rate": 3.06950679225001e-06, "loss": 0.9337, "step": 23536 }, { "epoch": 0.44, "learning_rate": 3.0693580422699353e-06, "loss": 0.8744, "step": 23537 }, { "epoch": 0.44, "learning_rate": 3.069209290163895e-06, "loss": 0.8723, "step": 23538 }, { "epoch": 0.44, "learning_rate": 3.0690605359324453e-06, "loss": 0.9848, "step": 23539 }, { "epoch": 0.44, "learning_rate": 3.0689117795761412e-06, "loss": 0.895, "step": 23540 }, { "epoch": 0.44, "learning_rate": 3.068763021095538e-06, "loss": 1.0297, "step": 23541 }, { "epoch": 0.44, "learning_rate": 3.068614260491191e-06, "loss": 0.6804, "step": 23542 }, { "epoch": 0.44, "learning_rate": 3.068465497763654e-06, "loss": 1.1169, "step": 23543 }, { "epoch": 0.44, "learning_rate": 3.068316732913486e-06, "loss": 1.2061, "step": 23544 }, { "epoch": 0.44, "learning_rate": 3.068167965941241e-06, "loss": 0.8333, "step": 23545 }, { "epoch": 0.44, "learning_rate": 3.0680191968474737e-06, "loss": 0.9012, "step": 23546 }, { "epoch": 0.44, "learning_rate": 3.0678704256327396e-06, "loss": 0.8476, "step": 23547 }, { "epoch": 0.44, "learning_rate": 3.067721652297596e-06, "loss": 0.9767, "step": 23548 }, { "epoch": 0.44, "learning_rate": 3.067572876842596e-06, "loss": 0.7939, "step": 23549 }, { "epoch": 0.44, "learning_rate": 3.0674240992682968e-06, "loss": 0.9948, "step": 23550 }, { "epoch": 0.44, "learning_rate": 3.0672753195752537e-06, "loss": 1.0174, "step": 23551 }, { "epoch": 0.44, "learning_rate": 3.0671265377640214e-06, "loss": 0.6987, "step": 23552 }, { "epoch": 0.44, "learning_rate": 3.066977753835156e-06, "loss": 0.8928, "step": 23553 }, { "epoch": 0.44, "learning_rate": 3.066828967789214e-06, "loss": 0.7375, "step": 23554 }, { "epoch": 0.44, "learning_rate": 3.066680179626749e-06, "loss": 1.0809, "step": 23555 }, { "epoch": 0.44, "learning_rate": 3.0665313893483173e-06, "loss": 1.1046, "step": 23556 }, { "epoch": 0.44, "learning_rate": 3.0663825969544752e-06, "loss": 1.1687, "step": 23557 }, { "epoch": 0.44, "learning_rate": 3.0662338024457777e-06, "loss": 1.0986, "step": 23558 }, { "epoch": 0.44, "learning_rate": 3.066085005822781e-06, "loss": 1.0745, "step": 23559 }, { "epoch": 0.44, "learning_rate": 3.0659362070860406e-06, "loss": 1.048, "step": 23560 }, { "epoch": 0.44, "learning_rate": 3.065787406236111e-06, "loss": 0.7408, "step": 23561 }, { "epoch": 0.44, "learning_rate": 3.0656386032735487e-06, "loss": 1.1171, "step": 23562 }, { "epoch": 0.44, "learning_rate": 3.0654897981989098e-06, "loss": 1.2476, "step": 23563 }, { "epoch": 0.44, "learning_rate": 3.065340991012748e-06, "loss": 0.9778, "step": 23564 }, { "epoch": 0.44, "learning_rate": 3.0651921817156207e-06, "loss": 0.913, "step": 23565 }, { "epoch": 0.44, "learning_rate": 3.065043370308084e-06, "loss": 0.8574, "step": 23566 }, { "epoch": 0.44, "learning_rate": 3.064894556790692e-06, "loss": 0.9462, "step": 23567 }, { "epoch": 0.44, "learning_rate": 3.0647457411640015e-06, "loss": 1.1085, "step": 23568 }, { "epoch": 0.44, "learning_rate": 3.0645969234285676e-06, "loss": 1.0507, "step": 23569 }, { "epoch": 0.44, "learning_rate": 3.0644481035849456e-06, "loss": 1.0029, "step": 23570 }, { "epoch": 0.44, "learning_rate": 3.064299281633692e-06, "loss": 0.9241, "step": 23571 }, { "epoch": 0.44, "learning_rate": 3.0641504575753624e-06, "loss": 0.8357, "step": 23572 }, { "epoch": 0.44, "learning_rate": 3.0640016314105114e-06, "loss": 0.7232, "step": 23573 }, { "epoch": 0.44, "learning_rate": 3.0638528031396965e-06, "loss": 0.9399, "step": 23574 }, { "epoch": 0.44, "learning_rate": 3.0637039727634727e-06, "loss": 0.8445, "step": 23575 }, { "epoch": 0.44, "learning_rate": 3.063555140282395e-06, "loss": 0.9356, "step": 23576 }, { "epoch": 0.44, "learning_rate": 3.0634063056970197e-06, "loss": 0.9362, "step": 23577 }, { "epoch": 0.44, "learning_rate": 3.0632574690079026e-06, "loss": 0.8383, "step": 23578 }, { "epoch": 0.44, "learning_rate": 3.0631086302155992e-06, "loss": 0.8245, "step": 23579 }, { "epoch": 0.44, "learning_rate": 3.062959789320666e-06, "loss": 0.7973, "step": 23580 }, { "epoch": 0.44, "learning_rate": 3.0628109463236583e-06, "loss": 0.9475, "step": 23581 }, { "epoch": 0.44, "learning_rate": 3.062662101225131e-06, "loss": 0.9619, "step": 23582 }, { "epoch": 0.44, "learning_rate": 3.062513254025641e-06, "loss": 0.9481, "step": 23583 }, { "epoch": 0.44, "learning_rate": 3.0623644047257443e-06, "loss": 0.8902, "step": 23584 }, { "epoch": 0.44, "learning_rate": 3.062215553325995e-06, "loss": 0.9066, "step": 23585 }, { "epoch": 0.44, "learning_rate": 3.0620666998269505e-06, "loss": 1.1801, "step": 23586 }, { "epoch": 0.45, "learning_rate": 3.061917844229167e-06, "loss": 0.7825, "step": 23587 }, { "epoch": 0.45, "learning_rate": 3.061768986533199e-06, "loss": 1.0694, "step": 23588 }, { "epoch": 0.45, "learning_rate": 3.0616201267396025e-06, "loss": 0.8121, "step": 23589 }, { "epoch": 0.45, "learning_rate": 3.0614712648489343e-06, "loss": 1.0077, "step": 23590 }, { "epoch": 0.45, "learning_rate": 3.061322400861749e-06, "loss": 1.0175, "step": 23591 }, { "epoch": 0.45, "learning_rate": 3.061173534778603e-06, "loss": 0.692, "step": 23592 }, { "epoch": 0.45, "learning_rate": 3.0610246666000524e-06, "loss": 1.1292, "step": 23593 }, { "epoch": 0.45, "learning_rate": 3.0608757963266532e-06, "loss": 1.1689, "step": 23594 }, { "epoch": 0.45, "learning_rate": 3.0607269239589604e-06, "loss": 1.0293, "step": 23595 }, { "epoch": 0.45, "learning_rate": 3.0605780494975313e-06, "loss": 0.8164, "step": 23596 }, { "epoch": 0.45, "learning_rate": 3.0604291729429204e-06, "loss": 0.7193, "step": 23597 }, { "epoch": 0.45, "learning_rate": 3.0602802942956844e-06, "loss": 0.9534, "step": 23598 }, { "epoch": 0.45, "learning_rate": 3.0601314135563787e-06, "loss": 1.1088, "step": 23599 }, { "epoch": 0.45, "learning_rate": 3.0599825307255594e-06, "loss": 1.0746, "step": 23600 }, { "epoch": 0.45, "learning_rate": 3.0598336458037825e-06, "loss": 0.8586, "step": 23601 }, { "epoch": 0.45, "learning_rate": 3.0596847587916045e-06, "loss": 0.6747, "step": 23602 }, { "epoch": 0.45, "learning_rate": 3.0595358696895798e-06, "loss": 0.8675, "step": 23603 }, { "epoch": 0.45, "learning_rate": 3.059386978498266e-06, "loss": 0.8664, "step": 23604 }, { "epoch": 0.45, "learning_rate": 3.0592380852182192e-06, "loss": 1.0035, "step": 23605 }, { "epoch": 0.45, "learning_rate": 3.0590891898499926e-06, "loss": 0.7539, "step": 23606 }, { "epoch": 0.45, "learning_rate": 3.058940292394145e-06, "loss": 1.1515, "step": 23607 }, { "epoch": 0.45, "learning_rate": 3.058791392851232e-06, "loss": 0.8733, "step": 23608 }, { "epoch": 0.45, "learning_rate": 3.058642491221808e-06, "loss": 0.8399, "step": 23609 }, { "epoch": 0.45, "learning_rate": 3.058493587506431e-06, "loss": 0.9142, "step": 23610 }, { "epoch": 0.45, "learning_rate": 3.058344681705656e-06, "loss": 0.7384, "step": 23611 }, { "epoch": 0.45, "learning_rate": 3.058195773820039e-06, "loss": 1.1564, "step": 23612 }, { "epoch": 0.45, "learning_rate": 3.058046863850136e-06, "loss": 1.0391, "step": 23613 }, { "epoch": 0.45, "learning_rate": 3.057897951796503e-06, "loss": 0.8713, "step": 23614 }, { "epoch": 0.45, "learning_rate": 3.0577490376596962e-06, "loss": 1.0127, "step": 23615 }, { "epoch": 0.45, "learning_rate": 3.0576001214402713e-06, "loss": 0.8197, "step": 23616 }, { "epoch": 0.45, "learning_rate": 3.0574512031387856e-06, "loss": 0.9351, "step": 23617 }, { "epoch": 0.45, "learning_rate": 3.0573022827557935e-06, "loss": 1.1194, "step": 23618 }, { "epoch": 0.45, "learning_rate": 3.057153360291852e-06, "loss": 1.0194, "step": 23619 }, { "epoch": 0.45, "learning_rate": 3.0570044357475165e-06, "loss": 0.9935, "step": 23620 }, { "epoch": 0.45, "learning_rate": 3.056855509123343e-06, "loss": 0.6666, "step": 23621 }, { "epoch": 0.45, "learning_rate": 3.05670658041989e-06, "loss": 0.878, "step": 23622 }, { "epoch": 0.45, "learning_rate": 3.0565576496377104e-06, "loss": 0.7426, "step": 23623 }, { "epoch": 0.45, "learning_rate": 3.0564087167773615e-06, "loss": 0.963, "step": 23624 }, { "epoch": 0.45, "learning_rate": 3.0562597818394003e-06, "loss": 1.131, "step": 23625 }, { "epoch": 0.45, "learning_rate": 3.056110844824381e-06, "loss": 0.6777, "step": 23626 }, { "epoch": 0.45, "learning_rate": 3.0559619057328616e-06, "loss": 1.0354, "step": 23627 }, { "epoch": 0.45, "learning_rate": 3.055812964565398e-06, "loss": 1.0767, "step": 23628 }, { "epoch": 0.45, "learning_rate": 3.0556640213225447e-06, "loss": 0.881, "step": 23629 }, { "epoch": 0.45, "learning_rate": 3.0555150760048593e-06, "loss": 0.9334, "step": 23630 }, { "epoch": 0.45, "learning_rate": 3.055366128612898e-06, "loss": 0.9655, "step": 23631 }, { "epoch": 0.45, "learning_rate": 3.055217179147217e-06, "loss": 1.0599, "step": 23632 }, { "epoch": 0.45, "learning_rate": 3.055068227608371e-06, "loss": 0.8938, "step": 23633 }, { "epoch": 0.45, "learning_rate": 3.054919273996918e-06, "loss": 1.0891, "step": 23634 }, { "epoch": 0.45, "learning_rate": 3.0547703183134124e-06, "loss": 0.9217, "step": 23635 }, { "epoch": 0.45, "learning_rate": 3.0546213605584123e-06, "loss": 0.759, "step": 23636 }, { "epoch": 0.45, "learning_rate": 3.054472400732474e-06, "loss": 1.1475, "step": 23637 }, { "epoch": 0.45, "learning_rate": 3.0543234388361514e-06, "loss": 0.8976, "step": 23638 }, { "epoch": 0.45, "learning_rate": 3.054174474870002e-06, "loss": 0.9044, "step": 23639 }, { "epoch": 0.45, "learning_rate": 3.0540255088345825e-06, "loss": 1.0368, "step": 23640 }, { "epoch": 0.45, "learning_rate": 3.0538765407304487e-06, "loss": 0.9343, "step": 23641 }, { "epoch": 0.45, "learning_rate": 3.053727570558157e-06, "loss": 0.8535, "step": 23642 }, { "epoch": 0.45, "learning_rate": 3.053578598318264e-06, "loss": 1.1106, "step": 23643 }, { "epoch": 0.45, "learning_rate": 3.053429624011325e-06, "loss": 0.9814, "step": 23644 }, { "epoch": 0.45, "learning_rate": 3.053280647637896e-06, "loss": 0.8609, "step": 23645 }, { "epoch": 0.45, "learning_rate": 3.0531316691985357e-06, "loss": 0.886, "step": 23646 }, { "epoch": 0.45, "learning_rate": 3.0529826886937968e-06, "loss": 0.8961, "step": 23647 }, { "epoch": 0.45, "learning_rate": 3.0528337061242384e-06, "loss": 0.8572, "step": 23648 }, { "epoch": 0.45, "learning_rate": 3.0526847214904164e-06, "loss": 1.0176, "step": 23649 }, { "epoch": 0.45, "learning_rate": 3.052535734792886e-06, "loss": 0.806, "step": 23650 }, { "epoch": 0.45, "learning_rate": 3.0523867460322044e-06, "loss": 1.1356, "step": 23651 }, { "epoch": 0.45, "learning_rate": 3.052237755208928e-06, "loss": 1.0188, "step": 23652 }, { "epoch": 0.45, "learning_rate": 3.0520887623236115e-06, "loss": 0.9664, "step": 23653 }, { "epoch": 0.45, "learning_rate": 3.0519397673768135e-06, "loss": 0.9674, "step": 23654 }, { "epoch": 0.45, "learning_rate": 3.0517907703690886e-06, "loss": 1.0364, "step": 23655 }, { "epoch": 0.45, "learning_rate": 3.0516417713009946e-06, "loss": 1.1268, "step": 23656 }, { "epoch": 0.45, "learning_rate": 3.0514927701730867e-06, "loss": 0.8309, "step": 23657 }, { "epoch": 0.45, "learning_rate": 3.0513437669859227e-06, "loss": 0.9351, "step": 23658 }, { "epoch": 0.45, "learning_rate": 3.0511947617400566e-06, "loss": 1.0224, "step": 23659 }, { "epoch": 0.45, "learning_rate": 3.0510457544360465e-06, "loss": 0.7885, "step": 23660 }, { "epoch": 0.45, "learning_rate": 3.0508967450744485e-06, "loss": 0.7778, "step": 23661 }, { "epoch": 0.45, "learning_rate": 3.0507477336558188e-06, "loss": 1.3109, "step": 23662 }, { "epoch": 0.45, "learning_rate": 3.050598720180714e-06, "loss": 1.0224, "step": 23663 }, { "epoch": 0.45, "learning_rate": 3.0504497046496916e-06, "loss": 0.7327, "step": 23664 }, { "epoch": 0.45, "learning_rate": 3.0503006870633054e-06, "loss": 0.7348, "step": 23665 }, { "epoch": 0.45, "learning_rate": 3.0501516674221144e-06, "loss": 0.9298, "step": 23666 }, { "epoch": 0.45, "learning_rate": 3.0500026457266736e-06, "loss": 1.1093, "step": 23667 }, { "epoch": 0.45, "learning_rate": 3.0498536219775387e-06, "loss": 1.1001, "step": 23668 }, { "epoch": 0.45, "learning_rate": 3.0497045961752684e-06, "loss": 0.9348, "step": 23669 }, { "epoch": 0.45, "learning_rate": 3.049555568320418e-06, "loss": 0.7087, "step": 23670 }, { "epoch": 0.45, "learning_rate": 3.049406538413544e-06, "loss": 0.9155, "step": 23671 }, { "epoch": 0.45, "learning_rate": 3.0492575064552023e-06, "loss": 0.9426, "step": 23672 }, { "epoch": 0.45, "learning_rate": 3.049108472445951e-06, "loss": 0.8163, "step": 23673 }, { "epoch": 0.45, "learning_rate": 3.0489594363863438e-06, "loss": 1.1055, "step": 23674 }, { "epoch": 0.45, "learning_rate": 3.04881039827694e-06, "loss": 1.1064, "step": 23675 }, { "epoch": 0.45, "learning_rate": 3.0486613581182944e-06, "loss": 1.0521, "step": 23676 }, { "epoch": 0.45, "learning_rate": 3.048512315910964e-06, "loss": 0.938, "step": 23677 }, { "epoch": 0.45, "learning_rate": 3.0483632716555063e-06, "loss": 0.9708, "step": 23678 }, { "epoch": 0.45, "learning_rate": 3.0482142253524772e-06, "loss": 0.9044, "step": 23679 }, { "epoch": 0.45, "learning_rate": 3.0480651770024317e-06, "loss": 1.1246, "step": 23680 }, { "epoch": 0.45, "learning_rate": 3.0479161266059283e-06, "loss": 1.2484, "step": 23681 }, { "epoch": 0.45, "learning_rate": 3.0477670741635227e-06, "loss": 1.0808, "step": 23682 }, { "epoch": 0.45, "learning_rate": 3.0476180196757723e-06, "loss": 0.825, "step": 23683 }, { "epoch": 0.45, "learning_rate": 3.047468963143232e-06, "loss": 0.9698, "step": 23684 }, { "epoch": 0.45, "learning_rate": 3.0473199045664603e-06, "loss": 0.8282, "step": 23685 }, { "epoch": 0.45, "learning_rate": 3.047170843946012e-06, "loss": 0.9161, "step": 23686 }, { "epoch": 0.45, "learning_rate": 3.0470217812824448e-06, "loss": 0.8989, "step": 23687 }, { "epoch": 0.45, "learning_rate": 3.046872716576316e-06, "loss": 1.028, "step": 23688 }, { "epoch": 0.45, "learning_rate": 3.04672364982818e-06, "loss": 0.8479, "step": 23689 }, { "epoch": 0.45, "learning_rate": 3.046574581038595e-06, "loss": 0.8275, "step": 23690 }, { "epoch": 0.45, "learning_rate": 3.0464255102081174e-06, "loss": 0.9719, "step": 23691 }, { "epoch": 0.45, "learning_rate": 3.0462764373373037e-06, "loss": 0.9359, "step": 23692 }, { "epoch": 0.45, "learning_rate": 3.0461273624267105e-06, "loss": 0.876, "step": 23693 }, { "epoch": 0.45, "learning_rate": 3.045978285476895e-06, "loss": 1.1983, "step": 23694 }, { "epoch": 0.45, "learning_rate": 3.0458292064884127e-06, "loss": 0.9863, "step": 23695 }, { "epoch": 0.45, "learning_rate": 3.0456801254618207e-06, "loss": 0.9782, "step": 23696 }, { "epoch": 0.45, "learning_rate": 3.0455310423976757e-06, "loss": 0.8852, "step": 23697 }, { "epoch": 0.45, "learning_rate": 3.0453819572965354e-06, "loss": 0.8874, "step": 23698 }, { "epoch": 0.45, "learning_rate": 3.045232870158955e-06, "loss": 1.132, "step": 23699 }, { "epoch": 0.45, "learning_rate": 3.0450837809854922e-06, "loss": 0.9634, "step": 23700 }, { "epoch": 0.45, "learning_rate": 3.0449346897767027e-06, "loss": 0.8688, "step": 23701 }, { "epoch": 0.45, "learning_rate": 3.044785596533144e-06, "loss": 1.004, "step": 23702 }, { "epoch": 0.45, "learning_rate": 3.0446365012553726e-06, "loss": 0.8175, "step": 23703 }, { "epoch": 0.45, "learning_rate": 3.0444874039439453e-06, "loss": 0.7163, "step": 23704 }, { "epoch": 0.45, "learning_rate": 3.0443383045994184e-06, "loss": 1.063, "step": 23705 }, { "epoch": 0.45, "learning_rate": 3.04418920322235e-06, "loss": 1.2884, "step": 23706 }, { "epoch": 0.45, "learning_rate": 3.0440400998132946e-06, "loss": 0.946, "step": 23707 }, { "epoch": 0.45, "learning_rate": 3.0438909943728105e-06, "loss": 0.7688, "step": 23708 }, { "epoch": 0.45, "learning_rate": 3.0437418869014547e-06, "loss": 0.8628, "step": 23709 }, { "epoch": 0.45, "learning_rate": 3.043592777399782e-06, "loss": 0.7588, "step": 23710 }, { "epoch": 0.45, "learning_rate": 3.0434436658683513e-06, "loss": 0.9665, "step": 23711 }, { "epoch": 0.45, "learning_rate": 3.0432945523077193e-06, "loss": 1.0222, "step": 23712 }, { "epoch": 0.45, "learning_rate": 3.0431454367184417e-06, "loss": 1.0721, "step": 23713 }, { "epoch": 0.45, "learning_rate": 3.0429963191010754e-06, "loss": 0.9415, "step": 23714 }, { "epoch": 0.45, "learning_rate": 3.042847199456178e-06, "loss": 1.0356, "step": 23715 }, { "epoch": 0.45, "learning_rate": 3.0426980777843053e-06, "loss": 0.9789, "step": 23716 }, { "epoch": 0.45, "learning_rate": 3.042548954086014e-06, "loss": 1.0305, "step": 23717 }, { "epoch": 0.45, "learning_rate": 3.0423998283618627e-06, "loss": 1.129, "step": 23718 }, { "epoch": 0.45, "learning_rate": 3.0422507006124065e-06, "loss": 0.8929, "step": 23719 }, { "epoch": 0.45, "learning_rate": 3.042101570838203e-06, "loss": 0.8982, "step": 23720 }, { "epoch": 0.45, "learning_rate": 3.041952439039809e-06, "loss": 0.9122, "step": 23721 }, { "epoch": 0.45, "learning_rate": 3.041803305217781e-06, "loss": 0.779, "step": 23722 }, { "epoch": 0.45, "learning_rate": 3.041654169372676e-06, "loss": 0.8525, "step": 23723 }, { "epoch": 0.45, "learning_rate": 3.0415050315050508e-06, "loss": 0.9445, "step": 23724 }, { "epoch": 0.45, "learning_rate": 3.041355891615462e-06, "loss": 0.9191, "step": 23725 }, { "epoch": 0.45, "learning_rate": 3.041206749704468e-06, "loss": 0.975, "step": 23726 }, { "epoch": 0.45, "learning_rate": 3.0410576057726243e-06, "loss": 0.7507, "step": 23727 }, { "epoch": 0.45, "learning_rate": 3.040908459820488e-06, "loss": 0.9056, "step": 23728 }, { "epoch": 0.45, "learning_rate": 3.0407593118486157e-06, "loss": 0.8991, "step": 23729 }, { "epoch": 0.45, "learning_rate": 3.0406101618575654e-06, "loss": 0.9796, "step": 23730 }, { "epoch": 0.45, "learning_rate": 3.0404610098478925e-06, "loss": 1.1735, "step": 23731 }, { "epoch": 0.45, "learning_rate": 3.040311855820155e-06, "loss": 0.9989, "step": 23732 }, { "epoch": 0.45, "learning_rate": 3.0401626997749102e-06, "loss": 0.7693, "step": 23733 }, { "epoch": 0.45, "learning_rate": 3.0400135417127143e-06, "loss": 1.1194, "step": 23734 }, { "epoch": 0.45, "learning_rate": 3.0398643816341246e-06, "loss": 0.7695, "step": 23735 }, { "epoch": 0.45, "learning_rate": 3.0397152195396973e-06, "loss": 1.0389, "step": 23736 }, { "epoch": 0.45, "learning_rate": 3.0395660554299894e-06, "loss": 0.9232, "step": 23737 }, { "epoch": 0.45, "learning_rate": 3.0394168893055593e-06, "loss": 0.9682, "step": 23738 }, { "epoch": 0.45, "learning_rate": 3.0392677211669624e-06, "loss": 0.7453, "step": 23739 }, { "epoch": 0.45, "learning_rate": 3.039118551014757e-06, "loss": 0.8863, "step": 23740 }, { "epoch": 0.45, "learning_rate": 3.0389693788494996e-06, "loss": 0.999, "step": 23741 }, { "epoch": 0.45, "learning_rate": 3.0388202046717463e-06, "loss": 0.766, "step": 23742 }, { "epoch": 0.45, "learning_rate": 3.0386710284820555e-06, "loss": 0.8828, "step": 23743 }, { "epoch": 0.45, "learning_rate": 3.0385218502809825e-06, "loss": 1.1172, "step": 23744 }, { "epoch": 0.45, "learning_rate": 3.0383726700690863e-06, "loss": 1.1618, "step": 23745 }, { "epoch": 0.45, "learning_rate": 3.038223487846923e-06, "loss": 0.8084, "step": 23746 }, { "epoch": 0.45, "learning_rate": 3.03807430361505e-06, "loss": 0.7669, "step": 23747 }, { "epoch": 0.45, "learning_rate": 3.0379251173740236e-06, "loss": 0.9108, "step": 23748 }, { "epoch": 0.45, "learning_rate": 3.0377759291244014e-06, "loss": 1.0359, "step": 23749 }, { "epoch": 0.45, "learning_rate": 3.0376267388667414e-06, "loss": 0.9081, "step": 23750 }, { "epoch": 0.45, "learning_rate": 3.037477546601598e-06, "loss": 0.917, "step": 23751 }, { "epoch": 0.45, "learning_rate": 3.0373283523295298e-06, "loss": 0.8589, "step": 23752 }, { "epoch": 0.45, "learning_rate": 3.0371791560510957e-06, "loss": 1.0035, "step": 23753 }, { "epoch": 0.45, "learning_rate": 3.03702995776685e-06, "loss": 0.7198, "step": 23754 }, { "epoch": 0.45, "learning_rate": 3.0368807574773506e-06, "loss": 1.1234, "step": 23755 }, { "epoch": 0.45, "learning_rate": 3.036731555183156e-06, "loss": 1.0518, "step": 23756 }, { "epoch": 0.45, "learning_rate": 3.036582350884822e-06, "loss": 1.05, "step": 23757 }, { "epoch": 0.45, "learning_rate": 3.0364331445829054e-06, "loss": 0.6366, "step": 23758 }, { "epoch": 0.45, "learning_rate": 3.036283936277964e-06, "loss": 0.9467, "step": 23759 }, { "epoch": 0.45, "learning_rate": 3.0361347259705546e-06, "loss": 0.8835, "step": 23760 }, { "epoch": 0.45, "learning_rate": 3.0359855136612347e-06, "loss": 1.0239, "step": 23761 }, { "epoch": 0.45, "learning_rate": 3.035836299350562e-06, "loss": 1.235, "step": 23762 }, { "epoch": 0.45, "learning_rate": 3.035687083039092e-06, "loss": 0.9523, "step": 23763 }, { "epoch": 0.45, "learning_rate": 3.0355378647273837e-06, "loss": 1.0295, "step": 23764 }, { "epoch": 0.45, "learning_rate": 3.035388644415993e-06, "loss": 0.9799, "step": 23765 }, { "epoch": 0.45, "learning_rate": 3.0352394221054774e-06, "loss": 0.7101, "step": 23766 }, { "epoch": 0.45, "learning_rate": 3.0350901977963942e-06, "loss": 0.8201, "step": 23767 }, { "epoch": 0.45, "learning_rate": 3.0349409714893013e-06, "loss": 1.0756, "step": 23768 }, { "epoch": 0.45, "learning_rate": 3.0347917431847544e-06, "loss": 1.0671, "step": 23769 }, { "epoch": 0.45, "learning_rate": 3.0346425128833124e-06, "loss": 0.9561, "step": 23770 }, { "epoch": 0.45, "learning_rate": 3.034493280585531e-06, "loss": 1.0248, "step": 23771 }, { "epoch": 0.45, "learning_rate": 3.0343440462919682e-06, "loss": 0.8059, "step": 23772 }, { "epoch": 0.45, "learning_rate": 3.0341948100031803e-06, "loss": 0.8246, "step": 23773 }, { "epoch": 0.45, "learning_rate": 3.034045571719727e-06, "loss": 1.1889, "step": 23774 }, { "epoch": 0.45, "learning_rate": 3.033896331442163e-06, "loss": 1.0061, "step": 23775 }, { "epoch": 0.45, "learning_rate": 3.0337470891710463e-06, "loss": 0.9395, "step": 23776 }, { "epoch": 0.45, "learning_rate": 3.0335978449069346e-06, "loss": 0.8353, "step": 23777 }, { "epoch": 0.45, "learning_rate": 3.0334485986503853e-06, "loss": 1.1057, "step": 23778 }, { "epoch": 0.45, "learning_rate": 3.0332993504019546e-06, "loss": 0.7583, "step": 23779 }, { "epoch": 0.45, "learning_rate": 3.0331501001622003e-06, "loss": 1.0729, "step": 23780 }, { "epoch": 0.45, "learning_rate": 3.033000847931681e-06, "loss": 1.1261, "step": 23781 }, { "epoch": 0.45, "learning_rate": 3.0328515937109515e-06, "loss": 0.9074, "step": 23782 }, { "epoch": 0.45, "learning_rate": 3.0327023375005716e-06, "loss": 0.8881, "step": 23783 }, { "epoch": 0.45, "learning_rate": 3.032553079301097e-06, "loss": 1.0291, "step": 23784 }, { "epoch": 0.45, "learning_rate": 3.0324038191130856e-06, "loss": 0.934, "step": 23785 }, { "epoch": 0.45, "learning_rate": 3.0322545569370946e-06, "loss": 1.0574, "step": 23786 }, { "epoch": 0.45, "learning_rate": 3.0321052927736815e-06, "loss": 1.2563, "step": 23787 }, { "epoch": 0.45, "learning_rate": 3.0319560266234034e-06, "loss": 1.1232, "step": 23788 }, { "epoch": 0.45, "learning_rate": 3.0318067584868183e-06, "loss": 0.9659, "step": 23789 }, { "epoch": 0.45, "learning_rate": 3.031657488364483e-06, "loss": 0.9486, "step": 23790 }, { "epoch": 0.45, "learning_rate": 3.031508216256954e-06, "loss": 0.8888, "step": 23791 }, { "epoch": 0.45, "learning_rate": 3.031358942164791e-06, "loss": 0.8283, "step": 23792 }, { "epoch": 0.45, "learning_rate": 3.0312096660885492e-06, "loss": 0.8856, "step": 23793 }, { "epoch": 0.45, "learning_rate": 3.031060388028786e-06, "loss": 0.9225, "step": 23794 }, { "epoch": 0.45, "learning_rate": 3.030911107986061e-06, "loss": 0.8075, "step": 23795 }, { "epoch": 0.45, "learning_rate": 3.0307618259609294e-06, "loss": 0.9444, "step": 23796 }, { "epoch": 0.45, "learning_rate": 3.0306125419539496e-06, "loss": 0.7242, "step": 23797 }, { "epoch": 0.45, "learning_rate": 3.0304632559656792e-06, "loss": 0.7289, "step": 23798 }, { "epoch": 0.45, "learning_rate": 3.030313967996675e-06, "loss": 0.9928, "step": 23799 }, { "epoch": 0.45, "learning_rate": 3.0301646780474946e-06, "loss": 1.0811, "step": 23800 }, { "epoch": 0.45, "learning_rate": 3.0300153861186955e-06, "loss": 1.1793, "step": 23801 }, { "epoch": 0.45, "learning_rate": 3.029866092210835e-06, "loss": 0.9135, "step": 23802 }, { "epoch": 0.45, "learning_rate": 3.029716796324471e-06, "loss": 1.0262, "step": 23803 }, { "epoch": 0.45, "learning_rate": 3.0295674984601615e-06, "loss": 0.9786, "step": 23804 }, { "epoch": 0.45, "learning_rate": 3.0294181986184623e-06, "loss": 0.7956, "step": 23805 }, { "epoch": 0.45, "learning_rate": 3.0292688967999318e-06, "loss": 1.0465, "step": 23806 }, { "epoch": 0.45, "learning_rate": 3.0291195930051277e-06, "loss": 1.0239, "step": 23807 }, { "epoch": 0.45, "learning_rate": 3.028970287234607e-06, "loss": 0.9364, "step": 23808 }, { "epoch": 0.45, "learning_rate": 3.028820979488928e-06, "loss": 0.9562, "step": 23809 }, { "epoch": 0.45, "learning_rate": 3.0286716697686476e-06, "loss": 0.9207, "step": 23810 }, { "epoch": 0.45, "learning_rate": 3.028522358074323e-06, "loss": 0.9322, "step": 23811 }, { "epoch": 0.45, "learning_rate": 3.028373044406512e-06, "loss": 1.0376, "step": 23812 }, { "epoch": 0.45, "learning_rate": 3.028223728765773e-06, "loss": 1.1113, "step": 23813 }, { "epoch": 0.45, "learning_rate": 3.0280744111526623e-06, "loss": 1.0397, "step": 23814 }, { "epoch": 0.45, "learning_rate": 3.0279250915677373e-06, "loss": 0.7312, "step": 23815 }, { "epoch": 0.45, "learning_rate": 3.0277757700115574e-06, "loss": 1.0228, "step": 23816 }, { "epoch": 0.45, "learning_rate": 3.0276264464846782e-06, "loss": 0.9976, "step": 23817 }, { "epoch": 0.45, "learning_rate": 3.027477120987658e-06, "loss": 0.9031, "step": 23818 }, { "epoch": 0.45, "learning_rate": 3.027327793521055e-06, "loss": 1.0547, "step": 23819 }, { "epoch": 0.45, "learning_rate": 3.0271784640854256e-06, "loss": 0.8432, "step": 23820 }, { "epoch": 0.45, "learning_rate": 3.0270291326813285e-06, "loss": 0.9764, "step": 23821 }, { "epoch": 0.45, "learning_rate": 3.02687979930932e-06, "loss": 0.7842, "step": 23822 }, { "epoch": 0.45, "learning_rate": 3.0267304639699593e-06, "loss": 0.7546, "step": 23823 }, { "epoch": 0.45, "learning_rate": 3.0265811266638022e-06, "loss": 0.9562, "step": 23824 }, { "epoch": 0.45, "learning_rate": 3.0264317873914086e-06, "loss": 1.1323, "step": 23825 }, { "epoch": 0.45, "learning_rate": 3.026282446153334e-06, "loss": 1.0872, "step": 23826 }, { "epoch": 0.45, "learning_rate": 3.0261331029501373e-06, "loss": 1.0106, "step": 23827 }, { "epoch": 0.45, "learning_rate": 3.0259837577823753e-06, "loss": 0.8886, "step": 23828 }, { "epoch": 0.45, "learning_rate": 3.025834410650606e-06, "loss": 0.7384, "step": 23829 }, { "epoch": 0.45, "learning_rate": 3.0256850615553872e-06, "loss": 0.8555, "step": 23830 }, { "epoch": 0.45, "learning_rate": 3.0255357104972776e-06, "loss": 1.0366, "step": 23831 }, { "epoch": 0.45, "learning_rate": 3.0253863574768328e-06, "loss": 0.8308, "step": 23832 }, { "epoch": 0.45, "learning_rate": 3.0252370024946114e-06, "loss": 0.7766, "step": 23833 }, { "epoch": 0.45, "learning_rate": 3.025087645551172e-06, "loss": 0.7952, "step": 23834 }, { "epoch": 0.45, "learning_rate": 3.0249382866470707e-06, "loss": 0.8848, "step": 23835 }, { "epoch": 0.45, "learning_rate": 3.024788925782865e-06, "loss": 0.8812, "step": 23836 }, { "epoch": 0.45, "learning_rate": 3.024639562959115e-06, "loss": 1.1125, "step": 23837 }, { "epoch": 0.45, "learning_rate": 3.0244901981763762e-06, "loss": 0.843, "step": 23838 }, { "epoch": 0.45, "learning_rate": 3.024340831435207e-06, "loss": 0.6741, "step": 23839 }, { "epoch": 0.45, "learning_rate": 3.0241914627361664e-06, "loss": 0.9376, "step": 23840 }, { "epoch": 0.45, "learning_rate": 3.0240420920798095e-06, "loss": 0.7583, "step": 23841 }, { "epoch": 0.45, "learning_rate": 3.023892719466696e-06, "loss": 0.8627, "step": 23842 }, { "epoch": 0.45, "learning_rate": 3.0237433448973836e-06, "loss": 1.2051, "step": 23843 }, { "epoch": 0.45, "learning_rate": 3.0235939683724292e-06, "loss": 0.9647, "step": 23844 }, { "epoch": 0.45, "learning_rate": 3.0234445898923907e-06, "loss": 0.9716, "step": 23845 }, { "epoch": 0.45, "learning_rate": 3.023295209457827e-06, "loss": 0.8875, "step": 23846 }, { "epoch": 0.45, "learning_rate": 3.0231458270692943e-06, "loss": 0.9034, "step": 23847 }, { "epoch": 0.45, "learning_rate": 3.022996442727351e-06, "loss": 0.7692, "step": 23848 }, { "epoch": 0.45, "learning_rate": 3.0228470564325557e-06, "loss": 1.1121, "step": 23849 }, { "epoch": 0.45, "learning_rate": 3.0226976681854645e-06, "loss": 1.1244, "step": 23850 }, { "epoch": 0.45, "learning_rate": 3.022548277986638e-06, "loss": 0.9724, "step": 23851 }, { "epoch": 0.45, "learning_rate": 3.022398885836631e-06, "loss": 0.8669, "step": 23852 }, { "epoch": 0.45, "learning_rate": 3.0222494917360023e-06, "loss": 0.8908, "step": 23853 }, { "epoch": 0.45, "learning_rate": 3.022100095685311e-06, "loss": 0.873, "step": 23854 }, { "epoch": 0.45, "learning_rate": 3.021950697685113e-06, "loss": 1.0969, "step": 23855 }, { "epoch": 0.45, "learning_rate": 3.021801297735968e-06, "loss": 1.0512, "step": 23856 }, { "epoch": 0.45, "learning_rate": 3.021651895838432e-06, "loss": 0.8569, "step": 23857 }, { "epoch": 0.45, "learning_rate": 3.021502491993064e-06, "loss": 1.0097, "step": 23858 }, { "epoch": 0.45, "learning_rate": 3.021353086200422e-06, "loss": 0.7427, "step": 23859 }, { "epoch": 0.45, "learning_rate": 3.0212036784610637e-06, "loss": 0.7407, "step": 23860 }, { "epoch": 0.45, "learning_rate": 3.0210542687755466e-06, "loss": 0.8628, "step": 23861 }, { "epoch": 0.45, "learning_rate": 3.0209048571444287e-06, "loss": 0.9855, "step": 23862 }, { "epoch": 0.45, "learning_rate": 3.0207554435682683e-06, "loss": 0.9957, "step": 23863 }, { "epoch": 0.45, "learning_rate": 3.020606028047623e-06, "loss": 0.9852, "step": 23864 }, { "epoch": 0.45, "learning_rate": 3.0204566105830505e-06, "loss": 0.9826, "step": 23865 }, { "epoch": 0.45, "learning_rate": 3.0203071911751097e-06, "loss": 0.7948, "step": 23866 }, { "epoch": 0.45, "learning_rate": 3.0201577698243574e-06, "loss": 0.796, "step": 23867 }, { "epoch": 0.45, "learning_rate": 3.0200083465313517e-06, "loss": 1.0442, "step": 23868 }, { "epoch": 0.45, "learning_rate": 3.0198589212966513e-06, "loss": 1.0484, "step": 23869 }, { "epoch": 0.45, "learning_rate": 3.0197094941208127e-06, "loss": 0.9174, "step": 23870 }, { "epoch": 0.45, "learning_rate": 3.019560065004395e-06, "loss": 0.8662, "step": 23871 }, { "epoch": 0.45, "learning_rate": 3.0194106339479567e-06, "loss": 1.0219, "step": 23872 }, { "epoch": 0.45, "learning_rate": 3.0192612009520543e-06, "loss": 0.8991, "step": 23873 }, { "epoch": 0.45, "learning_rate": 3.019111766017247e-06, "loss": 1.0862, "step": 23874 }, { "epoch": 0.45, "learning_rate": 3.0189623291440924e-06, "loss": 1.2476, "step": 23875 }, { "epoch": 0.45, "learning_rate": 3.018812890333148e-06, "loss": 0.7778, "step": 23876 }, { "epoch": 0.45, "learning_rate": 3.018663449584972e-06, "loss": 1.0276, "step": 23877 }, { "epoch": 0.45, "learning_rate": 3.018514006900123e-06, "loss": 0.8794, "step": 23878 }, { "epoch": 0.45, "learning_rate": 3.018364562279158e-06, "loss": 0.7303, "step": 23879 }, { "epoch": 0.45, "learning_rate": 3.0182151157226356e-06, "loss": 0.8965, "step": 23880 }, { "epoch": 0.45, "learning_rate": 3.0180656672311147e-06, "loss": 0.9702, "step": 23881 }, { "epoch": 0.45, "learning_rate": 3.017916216805152e-06, "loss": 0.8911, "step": 23882 }, { "epoch": 0.45, "learning_rate": 3.0177667644453063e-06, "loss": 0.8154, "step": 23883 }, { "epoch": 0.45, "learning_rate": 3.017617310152135e-06, "loss": 0.985, "step": 23884 }, { "epoch": 0.45, "learning_rate": 3.0174678539261963e-06, "loss": 0.9442, "step": 23885 }, { "epoch": 0.45, "learning_rate": 3.017318395768049e-06, "loss": 0.8799, "step": 23886 }, { "epoch": 0.45, "learning_rate": 3.017168935678251e-06, "loss": 1.236, "step": 23887 }, { "epoch": 0.45, "learning_rate": 3.0170194736573593e-06, "loss": 0.9225, "step": 23888 }, { "epoch": 0.45, "learning_rate": 3.0168700097059327e-06, "loss": 0.8448, "step": 23889 }, { "epoch": 0.45, "learning_rate": 3.0167205438245306e-06, "loss": 0.9439, "step": 23890 }, { "epoch": 0.45, "learning_rate": 3.016571076013708e-06, "loss": 0.6549, "step": 23891 }, { "epoch": 0.45, "learning_rate": 3.016421606274026e-06, "loss": 0.9073, "step": 23892 }, { "epoch": 0.45, "learning_rate": 3.0162721346060412e-06, "loss": 1.0114, "step": 23893 }, { "epoch": 0.45, "learning_rate": 3.0161226610103124e-06, "loss": 1.024, "step": 23894 }, { "epoch": 0.45, "learning_rate": 3.0159731854873968e-06, "loss": 0.8945, "step": 23895 }, { "epoch": 0.45, "learning_rate": 3.0158237080378543e-06, "loss": 1.0322, "step": 23896 }, { "epoch": 0.45, "learning_rate": 3.0156742286622407e-06, "loss": 0.9432, "step": 23897 }, { "epoch": 0.45, "learning_rate": 3.015524747361116e-06, "loss": 0.8814, "step": 23898 }, { "epoch": 0.45, "learning_rate": 3.015375264135037e-06, "loss": 0.858, "step": 23899 }, { "epoch": 0.45, "learning_rate": 3.015225778984563e-06, "loss": 1.0297, "step": 23900 }, { "epoch": 0.45, "learning_rate": 3.0150762919102515e-06, "loss": 0.8266, "step": 23901 }, { "epoch": 0.45, "learning_rate": 3.014926802912662e-06, "loss": 0.8723, "step": 23902 }, { "epoch": 0.45, "learning_rate": 3.0147773119923506e-06, "loss": 0.7208, "step": 23903 }, { "epoch": 0.45, "learning_rate": 3.0146278191498767e-06, "loss": 0.7983, "step": 23904 }, { "epoch": 0.45, "learning_rate": 3.014478324385798e-06, "loss": 0.9715, "step": 23905 }, { "epoch": 0.45, "learning_rate": 3.0143288277006734e-06, "loss": 0.9368, "step": 23906 }, { "epoch": 0.45, "learning_rate": 3.0141793290950606e-06, "loss": 1.126, "step": 23907 }, { "epoch": 0.45, "learning_rate": 3.014029828569518e-06, "loss": 1.0049, "step": 23908 }, { "epoch": 0.45, "learning_rate": 3.0138803261246037e-06, "loss": 0.8932, "step": 23909 }, { "epoch": 0.45, "learning_rate": 3.013730821760876e-06, "loss": 0.8094, "step": 23910 }, { "epoch": 0.45, "learning_rate": 3.013581315478894e-06, "loss": 0.9232, "step": 23911 }, { "epoch": 0.45, "learning_rate": 3.0134318072792135e-06, "loss": 0.9838, "step": 23912 }, { "epoch": 0.45, "learning_rate": 3.013282297162395e-06, "loss": 1.1833, "step": 23913 }, { "epoch": 0.45, "learning_rate": 3.013132785128997e-06, "loss": 0.8849, "step": 23914 }, { "epoch": 0.45, "learning_rate": 3.012983271179576e-06, "loss": 0.9003, "step": 23915 }, { "epoch": 0.45, "learning_rate": 3.0128337553146913e-06, "loss": 0.7519, "step": 23916 }, { "epoch": 0.45, "learning_rate": 3.012684237534902e-06, "loss": 0.7751, "step": 23917 }, { "epoch": 0.45, "learning_rate": 3.0125347178407645e-06, "loss": 0.9413, "step": 23918 }, { "epoch": 0.45, "learning_rate": 3.012385196232838e-06, "loss": 1.0416, "step": 23919 }, { "epoch": 0.45, "learning_rate": 3.0122356727116813e-06, "loss": 0.8145, "step": 23920 }, { "epoch": 0.45, "learning_rate": 3.0120861472778515e-06, "loss": 0.8098, "step": 23921 }, { "epoch": 0.45, "learning_rate": 3.011936619931909e-06, "loss": 0.8774, "step": 23922 }, { "epoch": 0.45, "learning_rate": 3.0117870906744107e-06, "loss": 0.8855, "step": 23923 }, { "epoch": 0.45, "learning_rate": 3.0116375595059142e-06, "loss": 0.8929, "step": 23924 }, { "epoch": 0.45, "learning_rate": 3.011488026426979e-06, "loss": 1.1567, "step": 23925 }, { "epoch": 0.45, "learning_rate": 3.0113384914381636e-06, "loss": 0.9116, "step": 23926 }, { "epoch": 0.45, "learning_rate": 3.011188954540026e-06, "loss": 0.812, "step": 23927 }, { "epoch": 0.45, "learning_rate": 3.011039415733124e-06, "loss": 0.9303, "step": 23928 }, { "epoch": 0.45, "learning_rate": 3.0108898750180173e-06, "loss": 0.8044, "step": 23929 }, { "epoch": 0.45, "learning_rate": 3.010740332395263e-06, "loss": 0.952, "step": 23930 }, { "epoch": 0.45, "learning_rate": 3.0105907878654197e-06, "loss": 1.1988, "step": 23931 }, { "epoch": 0.45, "learning_rate": 3.010441241429046e-06, "loss": 1.087, "step": 23932 }, { "epoch": 0.45, "learning_rate": 3.0102916930867006e-06, "loss": 0.9435, "step": 23933 }, { "epoch": 0.45, "learning_rate": 3.0101421428389416e-06, "loss": 0.8214, "step": 23934 }, { "epoch": 0.45, "learning_rate": 3.0099925906863275e-06, "loss": 1.029, "step": 23935 }, { "epoch": 0.45, "learning_rate": 3.009843036629417e-06, "loss": 0.7273, "step": 23936 }, { "epoch": 0.45, "learning_rate": 3.009693480668768e-06, "loss": 1.1187, "step": 23937 }, { "epoch": 0.45, "learning_rate": 3.0095439228049392e-06, "loss": 1.0825, "step": 23938 }, { "epoch": 0.45, "learning_rate": 3.009394363038489e-06, "loss": 0.8704, "step": 23939 }, { "epoch": 0.45, "learning_rate": 3.0092448013699756e-06, "loss": 0.9681, "step": 23940 }, { "epoch": 0.45, "learning_rate": 3.0090952377999583e-06, "loss": 0.8353, "step": 23941 }, { "epoch": 0.45, "learning_rate": 3.0089456723289946e-06, "loss": 0.8159, "step": 23942 }, { "epoch": 0.45, "learning_rate": 3.008796104957643e-06, "loss": 1.1878, "step": 23943 }, { "epoch": 0.45, "learning_rate": 3.008646535686463e-06, "loss": 1.0352, "step": 23944 }, { "epoch": 0.45, "learning_rate": 3.008496964516012e-06, "loss": 0.8611, "step": 23945 }, { "epoch": 0.45, "learning_rate": 3.008347391446849e-06, "loss": 0.7231, "step": 23946 }, { "epoch": 0.45, "learning_rate": 3.008197816479533e-06, "loss": 0.7634, "step": 23947 }, { "epoch": 0.45, "learning_rate": 3.008048239614621e-06, "loss": 0.9537, "step": 23948 }, { "epoch": 0.45, "learning_rate": 3.0078986608526727e-06, "loss": 0.9806, "step": 23949 }, { "epoch": 0.45, "learning_rate": 3.0077490801942473e-06, "loss": 1.2144, "step": 23950 }, { "epoch": 0.45, "learning_rate": 3.0075994976399016e-06, "loss": 1.02, "step": 23951 }, { "epoch": 0.45, "learning_rate": 3.007449913190195e-06, "loss": 0.7814, "step": 23952 }, { "epoch": 0.45, "learning_rate": 3.007300326845686e-06, "loss": 0.8559, "step": 23953 }, { "epoch": 0.45, "learning_rate": 3.007150738606933e-06, "loss": 0.8645, "step": 23954 }, { "epoch": 0.45, "learning_rate": 3.007001148474495e-06, "loss": 0.8282, "step": 23955 }, { "epoch": 0.45, "learning_rate": 3.0068515564489304e-06, "loss": 0.9792, "step": 23956 }, { "epoch": 0.45, "learning_rate": 3.006701962530797e-06, "loss": 0.9422, "step": 23957 }, { "epoch": 0.45, "learning_rate": 3.0065523667206543e-06, "loss": 0.7414, "step": 23958 }, { "epoch": 0.45, "learning_rate": 3.006402769019061e-06, "loss": 0.8652, "step": 23959 }, { "epoch": 0.45, "learning_rate": 3.006253169426575e-06, "loss": 0.6934, "step": 23960 }, { "epoch": 0.45, "learning_rate": 3.0061035679437546e-06, "loss": 0.8641, "step": 23961 }, { "epoch": 0.45, "learning_rate": 3.00595396457116e-06, "loss": 1.0559, "step": 23962 }, { "epoch": 0.45, "learning_rate": 3.0058043593093478e-06, "loss": 1.0156, "step": 23963 }, { "epoch": 0.45, "learning_rate": 3.005654752158878e-06, "loss": 1.0011, "step": 23964 }, { "epoch": 0.45, "learning_rate": 3.0055051431203096e-06, "loss": 0.8816, "step": 23965 }, { "epoch": 0.45, "learning_rate": 3.0053555321941998e-06, "loss": 0.698, "step": 23966 }, { "epoch": 0.45, "learning_rate": 3.0052059193811077e-06, "loss": 0.952, "step": 23967 }, { "epoch": 0.45, "learning_rate": 3.0050563046815927e-06, "loss": 0.9327, "step": 23968 }, { "epoch": 0.45, "learning_rate": 3.004906688096213e-06, "loss": 1.0038, "step": 23969 }, { "epoch": 0.45, "learning_rate": 3.0047570696255267e-06, "loss": 0.9377, "step": 23970 }, { "epoch": 0.45, "learning_rate": 3.004607449270094e-06, "loss": 0.972, "step": 23971 }, { "epoch": 0.45, "learning_rate": 3.0044578270304714e-06, "loss": 0.8838, "step": 23972 }, { "epoch": 0.45, "learning_rate": 3.0043082029072194e-06, "loss": 0.877, "step": 23973 }, { "epoch": 0.45, "learning_rate": 3.004158576900895e-06, "loss": 0.826, "step": 23974 }, { "epoch": 0.45, "learning_rate": 3.004008949012059e-06, "loss": 1.045, "step": 23975 }, { "epoch": 0.45, "learning_rate": 3.003859319241269e-06, "loss": 0.7401, "step": 23976 }, { "epoch": 0.45, "learning_rate": 3.0037096875890837e-06, "loss": 1.0188, "step": 23977 }, { "epoch": 0.45, "learning_rate": 3.003560054056061e-06, "loss": 0.8122, "step": 23978 }, { "epoch": 0.45, "learning_rate": 3.003410418642762e-06, "loss": 0.8726, "step": 23979 }, { "epoch": 0.45, "learning_rate": 3.003260781349743e-06, "loss": 1.1003, "step": 23980 }, { "epoch": 0.45, "learning_rate": 3.003111142177564e-06, "loss": 1.2, "step": 23981 }, { "epoch": 0.45, "learning_rate": 3.0029615011267825e-06, "loss": 0.9362, "step": 23982 }, { "epoch": 0.45, "learning_rate": 3.002811858197959e-06, "loss": 0.9623, "step": 23983 }, { "epoch": 0.45, "learning_rate": 3.002662213391651e-06, "loss": 0.9519, "step": 23984 }, { "epoch": 0.45, "learning_rate": 3.0025125667084187e-06, "loss": 0.8494, "step": 23985 }, { "epoch": 0.45, "learning_rate": 3.002362918148819e-06, "loss": 0.9828, "step": 23986 }, { "epoch": 0.45, "learning_rate": 3.002213267713412e-06, "loss": 1.0472, "step": 23987 }, { "epoch": 0.45, "learning_rate": 3.0020636154027556e-06, "loss": 1.067, "step": 23988 }, { "epoch": 0.45, "learning_rate": 3.0019139612174094e-06, "loss": 1.0216, "step": 23989 }, { "epoch": 0.45, "learning_rate": 3.0017643051579316e-06, "loss": 0.8412, "step": 23990 }, { "epoch": 0.45, "learning_rate": 3.0016146472248814e-06, "loss": 0.9637, "step": 23991 }, { "epoch": 0.45, "learning_rate": 3.0014649874188173e-06, "loss": 0.7841, "step": 23992 }, { "epoch": 0.45, "learning_rate": 3.0013153257402987e-06, "loss": 1.0198, "step": 23993 }, { "epoch": 0.45, "learning_rate": 3.0011656621898844e-06, "loss": 1.127, "step": 23994 }, { "epoch": 0.45, "learning_rate": 3.001015996768131e-06, "loss": 1.0435, "step": 23995 }, { "epoch": 0.45, "learning_rate": 3.0008663294756006e-06, "loss": 0.7415, "step": 23996 }, { "epoch": 0.45, "learning_rate": 3.0007166603128514e-06, "loss": 0.8992, "step": 23997 }, { "epoch": 0.45, "learning_rate": 3.0005669892804405e-06, "loss": 0.8515, "step": 23998 }, { "epoch": 0.45, "learning_rate": 3.0004173163789285e-06, "loss": 0.98, "step": 23999 }, { "epoch": 0.45, "learning_rate": 3.0002676416088733e-06, "loss": 1.1285, "step": 24000 }, { "epoch": 0.45, "learning_rate": 3.000117964970834e-06, "loss": 0.9164, "step": 24001 }, { "epoch": 0.45, "learning_rate": 2.9999682864653697e-06, "loss": 0.8813, "step": 24002 }, { "epoch": 0.45, "learning_rate": 2.9998186060930385e-06, "loss": 0.9667, "step": 24003 }, { "epoch": 0.45, "learning_rate": 2.9996689238544003e-06, "loss": 0.8612, "step": 24004 }, { "epoch": 0.45, "learning_rate": 2.999519239750014e-06, "loss": 0.9535, "step": 24005 }, { "epoch": 0.45, "learning_rate": 2.999369553780438e-06, "loss": 1.0925, "step": 24006 }, { "epoch": 0.45, "learning_rate": 2.999219865946231e-06, "loss": 1.0007, "step": 24007 }, { "epoch": 0.45, "learning_rate": 2.999070176247953e-06, "loss": 0.8166, "step": 24008 }, { "epoch": 0.45, "learning_rate": 2.9989204846861615e-06, "loss": 0.9994, "step": 24009 }, { "epoch": 0.45, "learning_rate": 2.998770791261417e-06, "loss": 1.0766, "step": 24010 }, { "epoch": 0.45, "learning_rate": 2.9986210959742767e-06, "loss": 1.2888, "step": 24011 }, { "epoch": 0.45, "learning_rate": 2.998471398825302e-06, "loss": 0.9363, "step": 24012 }, { "epoch": 0.45, "learning_rate": 2.9983216998150488e-06, "loss": 0.9683, "step": 24013 }, { "epoch": 0.45, "learning_rate": 2.998171998944078e-06, "loss": 0.8228, "step": 24014 }, { "epoch": 0.45, "learning_rate": 2.9980222962129495e-06, "loss": 0.7457, "step": 24015 }, { "epoch": 0.45, "learning_rate": 2.9978725916222197e-06, "loss": 0.7806, "step": 24016 }, { "epoch": 0.45, "learning_rate": 2.9977228851724487e-06, "loss": 0.9977, "step": 24017 }, { "epoch": 0.45, "learning_rate": 2.997573176864197e-06, "loss": 1.1588, "step": 24018 }, { "epoch": 0.45, "learning_rate": 2.9974234666980213e-06, "loss": 0.9722, "step": 24019 }, { "epoch": 0.45, "learning_rate": 2.9972737546744817e-06, "loss": 0.9271, "step": 24020 }, { "epoch": 0.45, "learning_rate": 2.9971240407941383e-06, "loss": 0.7533, "step": 24021 }, { "epoch": 0.45, "learning_rate": 2.9969743250575476e-06, "loss": 0.9723, "step": 24022 }, { "epoch": 0.45, "learning_rate": 2.996824607465271e-06, "loss": 0.8779, "step": 24023 }, { "epoch": 0.45, "learning_rate": 2.996674888017865e-06, "loss": 0.9475, "step": 24024 }, { "epoch": 0.45, "learning_rate": 2.996525166715891e-06, "loss": 0.9835, "step": 24025 }, { "epoch": 0.45, "learning_rate": 2.996375443559908e-06, "loss": 0.954, "step": 24026 }, { "epoch": 0.45, "learning_rate": 2.996225718550474e-06, "loss": 0.8835, "step": 24027 }, { "epoch": 0.45, "learning_rate": 2.996075991688148e-06, "loss": 1.0474, "step": 24028 }, { "epoch": 0.45, "learning_rate": 2.9959262629734896e-06, "loss": 0.7959, "step": 24029 }, { "epoch": 0.45, "learning_rate": 2.9957765324070575e-06, "loss": 0.9652, "step": 24030 }, { "epoch": 0.45, "learning_rate": 2.9956267999894112e-06, "loss": 1.2054, "step": 24031 }, { "epoch": 0.45, "learning_rate": 2.9954770657211097e-06, "loss": 1.0945, "step": 24032 }, { "epoch": 0.45, "learning_rate": 2.9953273296027125e-06, "loss": 0.8144, "step": 24033 }, { "epoch": 0.45, "learning_rate": 2.9951775916347774e-06, "loss": 0.9117, "step": 24034 }, { "epoch": 0.45, "learning_rate": 2.995027851817865e-06, "loss": 0.884, "step": 24035 }, { "epoch": 0.45, "learning_rate": 2.9948781101525336e-06, "loss": 0.9385, "step": 24036 }, { "epoch": 0.45, "learning_rate": 2.9947283666393422e-06, "loss": 1.0607, "step": 24037 }, { "epoch": 0.45, "learning_rate": 2.9945786212788504e-06, "loss": 1.1733, "step": 24038 }, { "epoch": 0.45, "learning_rate": 2.9944288740716175e-06, "loss": 0.8307, "step": 24039 }, { "epoch": 0.45, "learning_rate": 2.9942791250182017e-06, "loss": 1.032, "step": 24040 }, { "epoch": 0.45, "learning_rate": 2.9941293741191634e-06, "loss": 0.9846, "step": 24041 }, { "epoch": 0.45, "learning_rate": 2.9939796213750617e-06, "loss": 0.8207, "step": 24042 }, { "epoch": 0.45, "learning_rate": 2.993829866786454e-06, "loss": 1.1215, "step": 24043 }, { "epoch": 0.45, "learning_rate": 2.9936801103539017e-06, "loss": 0.8959, "step": 24044 }, { "epoch": 0.45, "learning_rate": 2.993530352077962e-06, "loss": 0.7177, "step": 24045 }, { "epoch": 0.45, "learning_rate": 2.9933805919591954e-06, "loss": 0.8607, "step": 24046 }, { "epoch": 0.45, "learning_rate": 2.993230829998161e-06, "loss": 0.8134, "step": 24047 }, { "epoch": 0.45, "learning_rate": 2.993081066195418e-06, "loss": 0.7175, "step": 24048 }, { "epoch": 0.45, "learning_rate": 2.9929313005515254e-06, "loss": 0.7768, "step": 24049 }, { "epoch": 0.45, "learning_rate": 2.9927815330670424e-06, "loss": 1.1827, "step": 24050 }, { "epoch": 0.45, "learning_rate": 2.992631763742528e-06, "loss": 0.9246, "step": 24051 }, { "epoch": 0.45, "learning_rate": 2.9924819925785413e-06, "loss": 0.795, "step": 24052 }, { "epoch": 0.45, "learning_rate": 2.9923322195756425e-06, "loss": 0.8547, "step": 24053 }, { "epoch": 0.45, "learning_rate": 2.9921824447343905e-06, "loss": 0.8265, "step": 24054 }, { "epoch": 0.45, "learning_rate": 2.9920326680553445e-06, "loss": 0.9831, "step": 24055 }, { "epoch": 0.45, "learning_rate": 2.991882889539063e-06, "loss": 1.1572, "step": 24056 }, { "epoch": 0.45, "learning_rate": 2.991733109186107e-06, "loss": 1.0959, "step": 24057 }, { "epoch": 0.45, "learning_rate": 2.991583326997033e-06, "loss": 0.98, "step": 24058 }, { "epoch": 0.45, "learning_rate": 2.9914335429724025e-06, "loss": 0.9102, "step": 24059 }, { "epoch": 0.45, "learning_rate": 2.9912837571127747e-06, "loss": 0.8135, "step": 24060 }, { "epoch": 0.45, "learning_rate": 2.991133969418708e-06, "loss": 0.9318, "step": 24061 }, { "epoch": 0.45, "learning_rate": 2.990984179890762e-06, "loss": 1.0118, "step": 24062 }, { "epoch": 0.45, "learning_rate": 2.9908343885294964e-06, "loss": 0.9984, "step": 24063 }, { "epoch": 0.45, "learning_rate": 2.99068459533547e-06, "loss": 1.0708, "step": 24064 }, { "epoch": 0.45, "learning_rate": 2.990534800309243e-06, "loss": 0.8619, "step": 24065 }, { "epoch": 0.45, "learning_rate": 2.990385003451373e-06, "loss": 0.7643, "step": 24066 }, { "epoch": 0.45, "learning_rate": 2.990235204762421e-06, "loss": 0.926, "step": 24067 }, { "epoch": 0.45, "learning_rate": 2.990085404242946e-06, "loss": 0.9165, "step": 24068 }, { "epoch": 0.45, "learning_rate": 2.9899356018935078e-06, "loss": 0.9297, "step": 24069 }, { "epoch": 0.45, "learning_rate": 2.989785797714664e-06, "loss": 1.0393, "step": 24070 }, { "epoch": 0.45, "learning_rate": 2.989635991706975e-06, "loss": 0.8961, "step": 24071 }, { "epoch": 0.45, "learning_rate": 2.9894861838710005e-06, "loss": 0.8029, "step": 24072 }, { "epoch": 0.45, "learning_rate": 2.9893363742072994e-06, "loss": 0.8786, "step": 24073 }, { "epoch": 0.45, "learning_rate": 2.9891865627164318e-06, "loss": 1.0944, "step": 24074 }, { "epoch": 0.45, "learning_rate": 2.9890367493989562e-06, "loss": 0.9677, "step": 24075 }, { "epoch": 0.45, "learning_rate": 2.9888869342554327e-06, "loss": 1.0233, "step": 24076 }, { "epoch": 0.45, "learning_rate": 2.98873711728642e-06, "loss": 0.9474, "step": 24077 }, { "epoch": 0.45, "learning_rate": 2.9885872984924784e-06, "loss": 1.142, "step": 24078 }, { "epoch": 0.45, "learning_rate": 2.988437477874166e-06, "loss": 0.9756, "step": 24079 }, { "epoch": 0.45, "learning_rate": 2.988287655432043e-06, "loss": 0.9182, "step": 24080 }, { "epoch": 0.45, "learning_rate": 2.9881378311666698e-06, "loss": 0.9707, "step": 24081 }, { "epoch": 0.45, "learning_rate": 2.9879880050786047e-06, "loss": 1.1392, "step": 24082 }, { "epoch": 0.45, "learning_rate": 2.9878381771684066e-06, "loss": 0.9537, "step": 24083 }, { "epoch": 0.45, "learning_rate": 2.987688347436637e-06, "loss": 0.8472, "step": 24084 }, { "epoch": 0.45, "learning_rate": 2.9875385158838533e-06, "loss": 0.8761, "step": 24085 }, { "epoch": 0.45, "learning_rate": 2.9873886825106154e-06, "loss": 0.9513, "step": 24086 }, { "epoch": 0.45, "learning_rate": 2.9872388473174827e-06, "loss": 1.2978, "step": 24087 }, { "epoch": 0.45, "learning_rate": 2.987089010305016e-06, "loss": 0.985, "step": 24088 }, { "epoch": 0.45, "learning_rate": 2.9869391714737744e-06, "loss": 0.868, "step": 24089 }, { "epoch": 0.45, "learning_rate": 2.9867893308243155e-06, "loss": 1.1924, "step": 24090 }, { "epoch": 0.45, "learning_rate": 2.986639488357201e-06, "loss": 0.8063, "step": 24091 }, { "epoch": 0.45, "learning_rate": 2.986489644072989e-06, "loss": 1.1714, "step": 24092 }, { "epoch": 0.45, "learning_rate": 2.9863397979722405e-06, "loss": 0.996, "step": 24093 }, { "epoch": 0.45, "learning_rate": 2.986189950055513e-06, "loss": 1.0508, "step": 24094 }, { "epoch": 0.45, "learning_rate": 2.986040100323368e-06, "loss": 0.7429, "step": 24095 }, { "epoch": 0.45, "learning_rate": 2.9858902487763636e-06, "loss": 0.8473, "step": 24096 }, { "epoch": 0.45, "learning_rate": 2.9857403954150603e-06, "loss": 1.0025, "step": 24097 }, { "epoch": 0.45, "learning_rate": 2.9855905402400176e-06, "loss": 0.8319, "step": 24098 }, { "epoch": 0.45, "learning_rate": 2.9854406832517942e-06, "loss": 1.0309, "step": 24099 }, { "epoch": 0.45, "learning_rate": 2.985290824450949e-06, "loss": 1.1472, "step": 24100 }, { "epoch": 0.45, "learning_rate": 2.9851409638380447e-06, "loss": 0.9623, "step": 24101 }, { "epoch": 0.45, "learning_rate": 2.984991101413638e-06, "loss": 0.8102, "step": 24102 }, { "epoch": 0.45, "learning_rate": 2.9848412371782896e-06, "loss": 0.7787, "step": 24103 }, { "epoch": 0.45, "learning_rate": 2.984691371132559e-06, "loss": 1.0407, "step": 24104 }, { "epoch": 0.45, "learning_rate": 2.9845415032770055e-06, "loss": 0.9928, "step": 24105 }, { "epoch": 0.45, "learning_rate": 2.9843916336121886e-06, "loss": 1.0621, "step": 24106 }, { "epoch": 0.45, "learning_rate": 2.984241762138669e-06, "loss": 1.0052, "step": 24107 }, { "epoch": 0.45, "learning_rate": 2.984091888857005e-06, "loss": 1.0032, "step": 24108 }, { "epoch": 0.45, "learning_rate": 2.983942013767756e-06, "loss": 0.9867, "step": 24109 }, { "epoch": 0.45, "learning_rate": 2.9837921368714834e-06, "loss": 0.8466, "step": 24110 }, { "epoch": 0.45, "learning_rate": 2.9836422581687458e-06, "loss": 0.7592, "step": 24111 }, { "epoch": 0.45, "learning_rate": 2.983492377660102e-06, "loss": 1.1055, "step": 24112 }, { "epoch": 0.45, "learning_rate": 2.9833424953461133e-06, "loss": 1.0, "step": 24113 }, { "epoch": 0.45, "learning_rate": 2.9831926112273378e-06, "loss": 1.0629, "step": 24114 }, { "epoch": 0.45, "learning_rate": 2.9830427253043363e-06, "loss": 0.7954, "step": 24115 }, { "epoch": 0.45, "learning_rate": 2.982892837577669e-06, "loss": 1.0578, "step": 24116 }, { "epoch": 0.46, "learning_rate": 2.982742948047893e-06, "loss": 0.9757, "step": 24117 }, { "epoch": 0.46, "learning_rate": 2.9825930567155703e-06, "loss": 1.0463, "step": 24118 }, { "epoch": 0.46, "learning_rate": 2.9824431635812607e-06, "loss": 0.9536, "step": 24119 }, { "epoch": 0.46, "learning_rate": 2.9822932686455225e-06, "loss": 0.9078, "step": 24120 }, { "epoch": 0.46, "learning_rate": 2.9821433719089156e-06, "loss": 0.9558, "step": 24121 }, { "epoch": 0.46, "learning_rate": 2.9819934733720003e-06, "loss": 0.8077, "step": 24122 }, { "epoch": 0.46, "learning_rate": 2.981843573035336e-06, "loss": 0.7265, "step": 24123 }, { "epoch": 0.46, "learning_rate": 2.9816936708994832e-06, "loss": 1.0048, "step": 24124 }, { "epoch": 0.46, "learning_rate": 2.981543766965001e-06, "loss": 1.1387, "step": 24125 }, { "epoch": 0.46, "learning_rate": 2.9813938612324487e-06, "loss": 0.835, "step": 24126 }, { "epoch": 0.46, "learning_rate": 2.981243953702387e-06, "loss": 0.6958, "step": 24127 }, { "epoch": 0.46, "learning_rate": 2.9810940443753742e-06, "loss": 0.9375, "step": 24128 }, { "epoch": 0.46, "learning_rate": 2.9809441332519716e-06, "loss": 0.7426, "step": 24129 }, { "epoch": 0.46, "learning_rate": 2.9807942203327384e-06, "loss": 0.9697, "step": 24130 }, { "epoch": 0.46, "learning_rate": 2.9806443056182345e-06, "loss": 0.9551, "step": 24131 }, { "epoch": 0.46, "learning_rate": 2.9804943891090195e-06, "loss": 1.0115, "step": 24132 }, { "epoch": 0.46, "learning_rate": 2.9803444708056527e-06, "loss": 0.9727, "step": 24133 }, { "epoch": 0.46, "learning_rate": 2.9801945507086945e-06, "loss": 1.1524, "step": 24134 }, { "epoch": 0.46, "learning_rate": 2.9800446288187047e-06, "loss": 0.7729, "step": 24135 }, { "epoch": 0.46, "learning_rate": 2.9798947051362425e-06, "loss": 0.9374, "step": 24136 }, { "epoch": 0.46, "learning_rate": 2.979744779661869e-06, "loss": 1.1003, "step": 24137 }, { "epoch": 0.46, "learning_rate": 2.9795948523961427e-06, "loss": 0.8566, "step": 24138 }, { "epoch": 0.46, "learning_rate": 2.979444923339624e-06, "loss": 0.9392, "step": 24139 }, { "epoch": 0.46, "learning_rate": 2.9792949924928733e-06, "loss": 0.8121, "step": 24140 }, { "epoch": 0.46, "learning_rate": 2.9791450598564486e-06, "loss": 0.7953, "step": 24141 }, { "epoch": 0.46, "learning_rate": 2.9789951254309113e-06, "loss": 0.9027, "step": 24142 }, { "epoch": 0.46, "learning_rate": 2.9788451892168215e-06, "loss": 0.9482, "step": 24143 }, { "epoch": 0.46, "learning_rate": 2.9786952512147383e-06, "loss": 1.0293, "step": 24144 }, { "epoch": 0.46, "learning_rate": 2.9785453114252212e-06, "loss": 1.0356, "step": 24145 }, { "epoch": 0.46, "learning_rate": 2.978395369848831e-06, "loss": 0.8329, "step": 24146 }, { "epoch": 0.46, "learning_rate": 2.978245426486127e-06, "loss": 0.7151, "step": 24147 }, { "epoch": 0.46, "learning_rate": 2.9780954813376696e-06, "loss": 0.7664, "step": 24148 }, { "epoch": 0.46, "learning_rate": 2.9779455344040175e-06, "loss": 0.7854, "step": 24149 }, { "epoch": 0.46, "learning_rate": 2.9777955856857317e-06, "loss": 0.996, "step": 24150 }, { "epoch": 0.46, "learning_rate": 2.977645635183372e-06, "loss": 0.7668, "step": 24151 }, { "epoch": 0.46, "learning_rate": 2.977495682897499e-06, "loss": 0.7945, "step": 24152 }, { "epoch": 0.46, "learning_rate": 2.9773457288286707e-06, "loss": 0.9587, "step": 24153 }, { "epoch": 0.46, "learning_rate": 2.977195772977448e-06, "loss": 0.6566, "step": 24154 }, { "epoch": 0.46, "learning_rate": 2.977045815344391e-06, "loss": 0.9979, "step": 24155 }, { "epoch": 0.46, "learning_rate": 2.9768958559300597e-06, "loss": 1.0588, "step": 24156 }, { "epoch": 0.46, "learning_rate": 2.976745894735014e-06, "loss": 0.9638, "step": 24157 }, { "epoch": 0.46, "learning_rate": 2.976595931759814e-06, "loss": 0.7224, "step": 24158 }, { "epoch": 0.46, "learning_rate": 2.9764459670050195e-06, "loss": 1.017, "step": 24159 }, { "epoch": 0.46, "learning_rate": 2.97629600047119e-06, "loss": 0.6954, "step": 24160 }, { "epoch": 0.46, "learning_rate": 2.976146032158886e-06, "loss": 0.7454, "step": 24161 }, { "epoch": 0.46, "learning_rate": 2.975996062068667e-06, "loss": 0.9386, "step": 24162 }, { "epoch": 0.46, "learning_rate": 2.975846090201093e-06, "loss": 0.9944, "step": 24163 }, { "epoch": 0.46, "learning_rate": 2.975696116556725e-06, "loss": 0.9802, "step": 24164 }, { "epoch": 0.46, "learning_rate": 2.975546141136122e-06, "loss": 0.8727, "step": 24165 }, { "epoch": 0.46, "learning_rate": 2.975396163939844e-06, "loss": 0.7893, "step": 24166 }, { "epoch": 0.46, "learning_rate": 2.9752461849684523e-06, "loss": 0.8623, "step": 24167 }, { "epoch": 0.46, "learning_rate": 2.9750962042225053e-06, "loss": 1.1534, "step": 24168 }, { "epoch": 0.46, "learning_rate": 2.9749462217025634e-06, "loss": 1.1692, "step": 24169 }, { "epoch": 0.46, "learning_rate": 2.9747962374091873e-06, "loss": 0.8835, "step": 24170 }, { "epoch": 0.46, "learning_rate": 2.9746462513429357e-06, "loss": 0.8371, "step": 24171 }, { "epoch": 0.46, "learning_rate": 2.97449626350437e-06, "loss": 0.8271, "step": 24172 }, { "epoch": 0.46, "learning_rate": 2.974346273894051e-06, "loss": 0.9094, "step": 24173 }, { "epoch": 0.46, "learning_rate": 2.974196282512536e-06, "loss": 0.9348, "step": 24174 }, { "epoch": 0.46, "learning_rate": 2.974046289360387e-06, "loss": 1.0471, "step": 24175 }, { "epoch": 0.46, "learning_rate": 2.9738962944381637e-06, "loss": 0.8762, "step": 24176 }, { "epoch": 0.46, "learning_rate": 2.9737462977464267e-06, "loss": 0.683, "step": 24177 }, { "epoch": 0.46, "learning_rate": 2.9735962992857347e-06, "loss": 1.037, "step": 24178 }, { "epoch": 0.46, "learning_rate": 2.9734462990566497e-06, "loss": 0.9109, "step": 24179 }, { "epoch": 0.46, "learning_rate": 2.9732962970597302e-06, "loss": 1.1498, "step": 24180 }, { "epoch": 0.46, "learning_rate": 2.9731462932955366e-06, "loss": 1.0297, "step": 24181 }, { "epoch": 0.46, "learning_rate": 2.97299628776463e-06, "loss": 1.1851, "step": 24182 }, { "epoch": 0.46, "learning_rate": 2.972846280467569e-06, "loss": 0.888, "step": 24183 }, { "epoch": 0.46, "learning_rate": 2.972696271404914e-06, "loss": 0.9636, "step": 24184 }, { "epoch": 0.46, "learning_rate": 2.972546260577227e-06, "loss": 0.697, "step": 24185 }, { "epoch": 0.46, "learning_rate": 2.972396247985066e-06, "loss": 0.9199, "step": 24186 }, { "epoch": 0.46, "learning_rate": 2.972246233628992e-06, "loss": 1.0984, "step": 24187 }, { "epoch": 0.46, "learning_rate": 2.9720962175095653e-06, "loss": 0.9479, "step": 24188 }, { "epoch": 0.46, "learning_rate": 2.971946199627345e-06, "loss": 0.7866, "step": 24189 }, { "epoch": 0.46, "learning_rate": 2.971796179982893e-06, "loss": 0.9151, "step": 24190 }, { "epoch": 0.46, "learning_rate": 2.971646158576768e-06, "loss": 0.7422, "step": 24191 }, { "epoch": 0.46, "learning_rate": 2.9714961354095306e-06, "loss": 0.7016, "step": 24192 }, { "epoch": 0.46, "learning_rate": 2.971346110481741e-06, "loss": 1.0972, "step": 24193 }, { "epoch": 0.46, "learning_rate": 2.9711960837939603e-06, "loss": 0.907, "step": 24194 }, { "epoch": 0.46, "learning_rate": 2.9710460553467472e-06, "loss": 0.8818, "step": 24195 }, { "epoch": 0.46, "learning_rate": 2.9708960251406626e-06, "loss": 0.9617, "step": 24196 }, { "epoch": 0.46, "learning_rate": 2.9707459931762668e-06, "loss": 0.9174, "step": 24197 }, { "epoch": 0.46, "learning_rate": 2.97059595945412e-06, "loss": 0.8383, "step": 24198 }, { "epoch": 0.46, "learning_rate": 2.970445923974782e-06, "loss": 0.9002, "step": 24199 }, { "epoch": 0.46, "learning_rate": 2.9702958867388138e-06, "loss": 1.1754, "step": 24200 }, { "epoch": 0.46, "learning_rate": 2.970145847746775e-06, "loss": 0.9357, "step": 24201 }, { "epoch": 0.46, "learning_rate": 2.9699958069992263e-06, "loss": 0.8437, "step": 24202 }, { "epoch": 0.46, "learning_rate": 2.969845764496727e-06, "loss": 0.962, "step": 24203 }, { "epoch": 0.46, "learning_rate": 2.9696957202398385e-06, "loss": 0.7913, "step": 24204 }, { "epoch": 0.46, "learning_rate": 2.9695456742291203e-06, "loss": 0.9997, "step": 24205 }, { "epoch": 0.46, "learning_rate": 2.9693956264651332e-06, "loss": 1.064, "step": 24206 }, { "epoch": 0.46, "learning_rate": 2.969245576948437e-06, "loss": 0.9855, "step": 24207 }, { "epoch": 0.46, "learning_rate": 2.969095525679592e-06, "loss": 0.9062, "step": 24208 }, { "epoch": 0.46, "learning_rate": 2.968945472659159e-06, "loss": 0.904, "step": 24209 }, { "epoch": 0.46, "learning_rate": 2.968795417887698e-06, "loss": 1.0698, "step": 24210 }, { "epoch": 0.46, "learning_rate": 2.9686453613657695e-06, "loss": 1.0405, "step": 24211 }, { "epoch": 0.46, "learning_rate": 2.968495303093933e-06, "loss": 1.1226, "step": 24212 }, { "epoch": 0.46, "learning_rate": 2.96834524307275e-06, "loss": 0.9169, "step": 24213 }, { "epoch": 0.46, "learning_rate": 2.96819518130278e-06, "loss": 0.8336, "step": 24214 }, { "epoch": 0.46, "learning_rate": 2.9680451177845836e-06, "loss": 0.822, "step": 24215 }, { "epoch": 0.46, "learning_rate": 2.9678950525187207e-06, "loss": 0.6337, "step": 24216 }, { "epoch": 0.46, "learning_rate": 2.9677449855057528e-06, "loss": 0.8315, "step": 24217 }, { "epoch": 0.46, "learning_rate": 2.967594916746238e-06, "loss": 1.4579, "step": 24218 }, { "epoch": 0.46, "learning_rate": 2.9674448462407395e-06, "loss": 1.0375, "step": 24219 }, { "epoch": 0.46, "learning_rate": 2.967294773989816e-06, "loss": 0.8736, "step": 24220 }, { "epoch": 0.46, "learning_rate": 2.967144699994028e-06, "loss": 0.8938, "step": 24221 }, { "epoch": 0.46, "learning_rate": 2.966994624253936e-06, "loss": 0.8289, "step": 24222 }, { "epoch": 0.46, "learning_rate": 2.966844546770101e-06, "loss": 1.0211, "step": 24223 }, { "epoch": 0.46, "learning_rate": 2.966694467543082e-06, "loss": 1.0409, "step": 24224 }, { "epoch": 0.46, "learning_rate": 2.96654438657344e-06, "loss": 1.1839, "step": 24225 }, { "epoch": 0.46, "learning_rate": 2.966394303861736e-06, "loss": 0.9857, "step": 24226 }, { "epoch": 0.46, "learning_rate": 2.96624421940853e-06, "loss": 0.6885, "step": 24227 }, { "epoch": 0.46, "learning_rate": 2.9660941332143824e-06, "loss": 1.0671, "step": 24228 }, { "epoch": 0.46, "learning_rate": 2.9659440452798536e-06, "loss": 0.8534, "step": 24229 }, { "epoch": 0.46, "learning_rate": 2.965793955605504e-06, "loss": 0.8306, "step": 24230 }, { "epoch": 0.46, "learning_rate": 2.9656438641918935e-06, "loss": 0.9016, "step": 24231 }, { "epoch": 0.46, "learning_rate": 2.9654937710395837e-06, "loss": 0.9762, "step": 24232 }, { "epoch": 0.46, "learning_rate": 2.965343676149134e-06, "loss": 0.7598, "step": 24233 }, { "epoch": 0.46, "learning_rate": 2.965193579521105e-06, "loss": 0.9464, "step": 24234 }, { "epoch": 0.46, "learning_rate": 2.9650434811560587e-06, "loss": 0.7789, "step": 24235 }, { "epoch": 0.46, "learning_rate": 2.9648933810545534e-06, "loss": 1.1027, "step": 24236 }, { "epoch": 0.46, "learning_rate": 2.9647432792171506e-06, "loss": 0.8616, "step": 24237 }, { "epoch": 0.46, "learning_rate": 2.9645931756444107e-06, "loss": 0.9695, "step": 24238 }, { "epoch": 0.46, "learning_rate": 2.9644430703368943e-06, "loss": 0.8293, "step": 24239 }, { "epoch": 0.46, "learning_rate": 2.964292963295161e-06, "loss": 0.7959, "step": 24240 }, { "epoch": 0.46, "learning_rate": 2.9641428545197732e-06, "loss": 1.0858, "step": 24241 }, { "epoch": 0.46, "learning_rate": 2.963992744011289e-06, "loss": 0.7615, "step": 24242 }, { "epoch": 0.46, "learning_rate": 2.963842631770271e-06, "loss": 0.985, "step": 24243 }, { "epoch": 0.46, "learning_rate": 2.9636925177972786e-06, "loss": 0.8705, "step": 24244 }, { "epoch": 0.46, "learning_rate": 2.963542402092873e-06, "loss": 0.8367, "step": 24245 }, { "epoch": 0.46, "learning_rate": 2.963392284657613e-06, "loss": 0.8377, "step": 24246 }, { "epoch": 0.46, "learning_rate": 2.963242165492061e-06, "loss": 0.8173, "step": 24247 }, { "epoch": 0.46, "learning_rate": 2.9630920445967775e-06, "loss": 0.9459, "step": 24248 }, { "epoch": 0.46, "learning_rate": 2.962941921972322e-06, "loss": 1.0308, "step": 24249 }, { "epoch": 0.46, "learning_rate": 2.962791797619256e-06, "loss": 0.8716, "step": 24250 }, { "epoch": 0.46, "learning_rate": 2.9626416715381394e-06, "loss": 0.9926, "step": 24251 }, { "epoch": 0.46, "learning_rate": 2.9624915437295325e-06, "loss": 0.8028, "step": 24252 }, { "epoch": 0.46, "learning_rate": 2.9623414141939965e-06, "loss": 0.7491, "step": 24253 }, { "epoch": 0.46, "learning_rate": 2.962191282932092e-06, "loss": 0.7885, "step": 24254 }, { "epoch": 0.46, "learning_rate": 2.9620411499443797e-06, "loss": 0.9232, "step": 24255 }, { "epoch": 0.46, "learning_rate": 2.96189101523142e-06, "loss": 1.1579, "step": 24256 }, { "epoch": 0.46, "learning_rate": 2.961740878793773e-06, "loss": 0.8563, "step": 24257 }, { "epoch": 0.46, "learning_rate": 2.961590740632e-06, "loss": 1.0594, "step": 24258 }, { "epoch": 0.46, "learning_rate": 2.9614406007466613e-06, "loss": 0.8588, "step": 24259 }, { "epoch": 0.46, "learning_rate": 2.961290459138317e-06, "loss": 0.8668, "step": 24260 }, { "epoch": 0.46, "learning_rate": 2.9611403158075287e-06, "loss": 0.7537, "step": 24261 }, { "epoch": 0.46, "learning_rate": 2.9609901707548574e-06, "loss": 1.141, "step": 24262 }, { "epoch": 0.46, "learning_rate": 2.9608400239808617e-06, "loss": 1.0624, "step": 24263 }, { "epoch": 0.46, "learning_rate": 2.9606898754861034e-06, "loss": 0.9798, "step": 24264 }, { "epoch": 0.46, "learning_rate": 2.9605397252711444e-06, "loss": 1.0432, "step": 24265 }, { "epoch": 0.46, "learning_rate": 2.9603895733365434e-06, "loss": 0.8546, "step": 24266 }, { "epoch": 0.46, "learning_rate": 2.9602394196828614e-06, "loss": 0.8713, "step": 24267 }, { "epoch": 0.46, "learning_rate": 2.9600892643106606e-06, "loss": 1.1044, "step": 24268 }, { "epoch": 0.46, "learning_rate": 2.9599391072204995e-06, "loss": 1.0248, "step": 24269 }, { "epoch": 0.46, "learning_rate": 2.9597889484129406e-06, "loss": 0.9736, "step": 24270 }, { "epoch": 0.46, "learning_rate": 2.959638787888544e-06, "loss": 0.8787, "step": 24271 }, { "epoch": 0.46, "learning_rate": 2.95948862564787e-06, "loss": 0.9606, "step": 24272 }, { "epoch": 0.46, "learning_rate": 2.9593384616914794e-06, "loss": 1.0063, "step": 24273 }, { "epoch": 0.46, "learning_rate": 2.959188296019933e-06, "loss": 0.8737, "step": 24274 }, { "epoch": 0.46, "learning_rate": 2.959038128633792e-06, "loss": 1.0058, "step": 24275 }, { "epoch": 0.46, "learning_rate": 2.958887959533616e-06, "loss": 0.7446, "step": 24276 }, { "epoch": 0.46, "learning_rate": 2.9587377887199674e-06, "loss": 0.8635, "step": 24277 }, { "epoch": 0.46, "learning_rate": 2.958587616193406e-06, "loss": 0.8806, "step": 24278 }, { "epoch": 0.46, "learning_rate": 2.9584374419544915e-06, "loss": 0.8328, "step": 24279 }, { "epoch": 0.46, "learning_rate": 2.958287266003786e-06, "loss": 0.9792, "step": 24280 }, { "epoch": 0.46, "learning_rate": 2.9581370883418498e-06, "loss": 1.0738, "step": 24281 }, { "epoch": 0.46, "learning_rate": 2.9579869089692444e-06, "loss": 0.9612, "step": 24282 }, { "epoch": 0.46, "learning_rate": 2.9578367278865295e-06, "loss": 0.8861, "step": 24283 }, { "epoch": 0.46, "learning_rate": 2.957686545094266e-06, "loss": 0.781, "step": 24284 }, { "epoch": 0.46, "learning_rate": 2.957536360593015e-06, "loss": 0.8786, "step": 24285 }, { "epoch": 0.46, "learning_rate": 2.957386174383338e-06, "loss": 0.967, "step": 24286 }, { "epoch": 0.46, "learning_rate": 2.957235986465795e-06, "loss": 1.1472, "step": 24287 }, { "epoch": 0.46, "learning_rate": 2.9570857968409455e-06, "loss": 1.0047, "step": 24288 }, { "epoch": 0.46, "learning_rate": 2.9569356055093534e-06, "loss": 0.9372, "step": 24289 }, { "epoch": 0.46, "learning_rate": 2.9567854124715765e-06, "loss": 0.899, "step": 24290 }, { "epoch": 0.46, "learning_rate": 2.9566352177281777e-06, "loss": 0.941, "step": 24291 }, { "epoch": 0.46, "learning_rate": 2.956485021279717e-06, "loss": 0.9296, "step": 24292 }, { "epoch": 0.46, "learning_rate": 2.956334823126755e-06, "loss": 1.211, "step": 24293 }, { "epoch": 0.46, "learning_rate": 2.956184623269852e-06, "loss": 1.0607, "step": 24294 }, { "epoch": 0.46, "learning_rate": 2.95603442170957e-06, "loss": 1.0339, "step": 24295 }, { "epoch": 0.46, "learning_rate": 2.95588421844647e-06, "loss": 0.884, "step": 24296 }, { "epoch": 0.46, "learning_rate": 2.9557340134811113e-06, "loss": 0.9121, "step": 24297 }, { "epoch": 0.46, "learning_rate": 2.9555838068140567e-06, "loss": 1.0201, "step": 24298 }, { "epoch": 0.46, "learning_rate": 2.955433598445866e-06, "loss": 0.974, "step": 24299 }, { "epoch": 0.46, "learning_rate": 2.9552833883770997e-06, "loss": 0.9704, "step": 24300 }, { "epoch": 0.46, "learning_rate": 2.9551331766083195e-06, "loss": 1.0642, "step": 24301 }, { "epoch": 0.46, "learning_rate": 2.9549829631400863e-06, "loss": 0.8755, "step": 24302 }, { "epoch": 0.46, "learning_rate": 2.95483274797296e-06, "loss": 0.8712, "step": 24303 }, { "epoch": 0.46, "learning_rate": 2.9546825311075034e-06, "loss": 0.6944, "step": 24304 }, { "epoch": 0.46, "learning_rate": 2.9545323125442747e-06, "loss": 1.1055, "step": 24305 }, { "epoch": 0.46, "learning_rate": 2.9543820922838372e-06, "loss": 1.2166, "step": 24306 }, { "epoch": 0.46, "learning_rate": 2.954231870326751e-06, "loss": 1.0363, "step": 24307 }, { "epoch": 0.46, "learning_rate": 2.9540816466735766e-06, "loss": 0.8415, "step": 24308 }, { "epoch": 0.46, "learning_rate": 2.953931421324874e-06, "loss": 0.8539, "step": 24309 }, { "epoch": 0.46, "learning_rate": 2.953781194281207e-06, "loss": 0.884, "step": 24310 }, { "epoch": 0.46, "learning_rate": 2.953630965543135e-06, "loss": 0.7747, "step": 24311 }, { "epoch": 0.46, "learning_rate": 2.9534807351112183e-06, "loss": 1.1797, "step": 24312 }, { "epoch": 0.46, "learning_rate": 2.953330502986019e-06, "loss": 0.9725, "step": 24313 }, { "epoch": 0.46, "learning_rate": 2.9531802691680965e-06, "loss": 0.6699, "step": 24314 }, { "epoch": 0.46, "learning_rate": 2.9530300336580132e-06, "loss": 0.9695, "step": 24315 }, { "epoch": 0.46, "learning_rate": 2.95287979645633e-06, "loss": 0.9129, "step": 24316 }, { "epoch": 0.46, "learning_rate": 2.9527295575636073e-06, "loss": 0.9736, "step": 24317 }, { "epoch": 0.46, "learning_rate": 2.952579316980406e-06, "loss": 1.2682, "step": 24318 }, { "epoch": 0.46, "learning_rate": 2.9524290747072883e-06, "loss": 1.0013, "step": 24319 }, { "epoch": 0.46, "learning_rate": 2.9522788307448136e-06, "loss": 0.9216, "step": 24320 }, { "epoch": 0.46, "learning_rate": 2.9521285850935437e-06, "loss": 0.9064, "step": 24321 }, { "epoch": 0.46, "learning_rate": 2.951978337754039e-06, "loss": 1.0761, "step": 24322 }, { "epoch": 0.46, "learning_rate": 2.9518280887268615e-06, "loss": 0.9836, "step": 24323 }, { "epoch": 0.46, "learning_rate": 2.951677838012572e-06, "loss": 1.0888, "step": 24324 }, { "epoch": 0.46, "learning_rate": 2.9515275856117315e-06, "loss": 1.101, "step": 24325 }, { "epoch": 0.46, "learning_rate": 2.9513773315249007e-06, "loss": 1.0051, "step": 24326 }, { "epoch": 0.46, "learning_rate": 2.9512270757526407e-06, "loss": 0.902, "step": 24327 }, { "epoch": 0.46, "learning_rate": 2.9510768182955124e-06, "loss": 0.8222, "step": 24328 }, { "epoch": 0.46, "learning_rate": 2.950926559154077e-06, "loss": 0.8975, "step": 24329 }, { "epoch": 0.46, "learning_rate": 2.9507762983288957e-06, "loss": 0.8959, "step": 24330 }, { "epoch": 0.46, "learning_rate": 2.9506260358205296e-06, "loss": 1.0168, "step": 24331 }, { "epoch": 0.46, "learning_rate": 2.9504757716295397e-06, "loss": 0.9736, "step": 24332 }, { "epoch": 0.46, "learning_rate": 2.9503255057564877e-06, "loss": 0.9048, "step": 24333 }, { "epoch": 0.46, "learning_rate": 2.9501752382019334e-06, "loss": 1.0031, "step": 24334 }, { "epoch": 0.46, "learning_rate": 2.9500249689664384e-06, "loss": 0.8355, "step": 24335 }, { "epoch": 0.46, "learning_rate": 2.9498746980505643e-06, "loss": 1.0939, "step": 24336 }, { "epoch": 0.46, "learning_rate": 2.949724425454872e-06, "loss": 1.1808, "step": 24337 }, { "epoch": 0.46, "learning_rate": 2.949574151179922e-06, "loss": 1.0664, "step": 24338 }, { "epoch": 0.46, "learning_rate": 2.9494238752262768e-06, "loss": 0.8873, "step": 24339 }, { "epoch": 0.46, "learning_rate": 2.9492735975944957e-06, "loss": 0.9589, "step": 24340 }, { "epoch": 0.46, "learning_rate": 2.949123318285141e-06, "loss": 0.7274, "step": 24341 }, { "epoch": 0.46, "learning_rate": 2.948973037298774e-06, "loss": 0.9507, "step": 24342 }, { "epoch": 0.46, "learning_rate": 2.948822754635955e-06, "loss": 1.0446, "step": 24343 }, { "epoch": 0.46, "learning_rate": 2.948672470297245e-06, "loss": 1.0396, "step": 24344 }, { "epoch": 0.46, "learning_rate": 2.9485221842832074e-06, "loss": 0.8885, "step": 24345 }, { "epoch": 0.46, "learning_rate": 2.948371896594401e-06, "loss": 0.8456, "step": 24346 }, { "epoch": 0.46, "learning_rate": 2.9482216072313867e-06, "loss": 0.8448, "step": 24347 }, { "epoch": 0.46, "learning_rate": 2.948071316194728e-06, "loss": 0.7997, "step": 24348 }, { "epoch": 0.46, "learning_rate": 2.9479210234849843e-06, "loss": 0.9777, "step": 24349 }, { "epoch": 0.46, "learning_rate": 2.9477707291027167e-06, "loss": 1.1447, "step": 24350 }, { "epoch": 0.46, "learning_rate": 2.9476204330484874e-06, "loss": 0.9043, "step": 24351 }, { "epoch": 0.46, "learning_rate": 2.9474701353228575e-06, "loss": 0.9574, "step": 24352 }, { "epoch": 0.46, "learning_rate": 2.947319835926387e-06, "loss": 0.9698, "step": 24353 }, { "epoch": 0.46, "learning_rate": 2.947169534859639e-06, "loss": 0.81, "step": 24354 }, { "epoch": 0.46, "learning_rate": 2.9470192321231728e-06, "loss": 0.8008, "step": 24355 }, { "epoch": 0.46, "learning_rate": 2.9468689277175506e-06, "loss": 1.2312, "step": 24356 }, { "epoch": 0.46, "learning_rate": 2.9467186216433336e-06, "loss": 1.1606, "step": 24357 }, { "epoch": 0.46, "learning_rate": 2.946568313901083e-06, "loss": 0.9376, "step": 24358 }, { "epoch": 0.46, "learning_rate": 2.94641800449136e-06, "loss": 0.8358, "step": 24359 }, { "epoch": 0.46, "learning_rate": 2.946267693414726e-06, "loss": 0.9062, "step": 24360 }, { "epoch": 0.46, "learning_rate": 2.946117380671742e-06, "loss": 0.8153, "step": 24361 }, { "epoch": 0.46, "learning_rate": 2.945967066262969e-06, "loss": 0.9251, "step": 24362 }, { "epoch": 0.46, "learning_rate": 2.94581675018897e-06, "loss": 1.1657, "step": 24363 }, { "epoch": 0.46, "learning_rate": 2.9456664324503033e-06, "loss": 0.9317, "step": 24364 }, { "epoch": 0.46, "learning_rate": 2.9455161130475324e-06, "loss": 0.9826, "step": 24365 }, { "epoch": 0.46, "learning_rate": 2.9453657919812185e-06, "loss": 0.9025, "step": 24366 }, { "epoch": 0.46, "learning_rate": 2.945215469251922e-06, "loss": 0.946, "step": 24367 }, { "epoch": 0.46, "learning_rate": 2.945065144860204e-06, "loss": 1.1649, "step": 24368 }, { "epoch": 0.46, "learning_rate": 2.9449148188066275e-06, "loss": 1.2225, "step": 24369 }, { "epoch": 0.46, "learning_rate": 2.944764491091752e-06, "loss": 1.058, "step": 24370 }, { "epoch": 0.46, "learning_rate": 2.9446141617161394e-06, "loss": 0.8532, "step": 24371 }, { "epoch": 0.46, "learning_rate": 2.9444638306803515e-06, "loss": 0.9302, "step": 24372 }, { "epoch": 0.46, "learning_rate": 2.944313497984949e-06, "loss": 0.9422, "step": 24373 }, { "epoch": 0.46, "learning_rate": 2.9441631636304936e-06, "loss": 1.0589, "step": 24374 }, { "epoch": 0.46, "learning_rate": 2.9440128276175473e-06, "loss": 0.9189, "step": 24375 }, { "epoch": 0.46, "learning_rate": 2.94386248994667e-06, "loss": 0.83, "step": 24376 }, { "epoch": 0.46, "learning_rate": 2.9437121506184235e-06, "loss": 0.8553, "step": 24377 }, { "epoch": 0.46, "learning_rate": 2.9435618096333697e-06, "loss": 1.0923, "step": 24378 }, { "epoch": 0.46, "learning_rate": 2.94341146699207e-06, "loss": 0.8804, "step": 24379 }, { "epoch": 0.46, "learning_rate": 2.943261122695085e-06, "loss": 0.9037, "step": 24380 }, { "epoch": 0.46, "learning_rate": 2.9431107767429774e-06, "loss": 0.9385, "step": 24381 }, { "epoch": 0.46, "learning_rate": 2.9429604291363066e-06, "loss": 0.9389, "step": 24382 }, { "epoch": 0.46, "learning_rate": 2.942810079875636e-06, "loss": 0.9329, "step": 24383 }, { "epoch": 0.46, "learning_rate": 2.9426597289615266e-06, "loss": 0.8399, "step": 24384 }, { "epoch": 0.46, "learning_rate": 2.9425093763945377e-06, "loss": 1.0063, "step": 24385 }, { "epoch": 0.46, "learning_rate": 2.942359022175233e-06, "loss": 0.9087, "step": 24386 }, { "epoch": 0.46, "learning_rate": 2.9422086663041745e-06, "loss": 1.1927, "step": 24387 }, { "epoch": 0.46, "learning_rate": 2.942058308781921e-06, "loss": 0.7746, "step": 24388 }, { "epoch": 0.46, "learning_rate": 2.941907949609036e-06, "loss": 0.9597, "step": 24389 }, { "epoch": 0.46, "learning_rate": 2.94175758878608e-06, "loss": 0.8343, "step": 24390 }, { "epoch": 0.46, "learning_rate": 2.941607226313615e-06, "loss": 0.686, "step": 24391 }, { "epoch": 0.46, "learning_rate": 2.9414568621922017e-06, "loss": 0.7982, "step": 24392 }, { "epoch": 0.46, "learning_rate": 2.941306496422402e-06, "loss": 1.1514, "step": 24393 }, { "epoch": 0.46, "learning_rate": 2.9411561290047776e-06, "loss": 1.1808, "step": 24394 }, { "epoch": 0.46, "learning_rate": 2.9410057599398895e-06, "loss": 0.8597, "step": 24395 }, { "epoch": 0.46, "learning_rate": 2.9408553892283e-06, "loss": 0.9995, "step": 24396 }, { "epoch": 0.46, "learning_rate": 2.94070501687057e-06, "loss": 0.9225, "step": 24397 }, { "epoch": 0.46, "learning_rate": 2.9405546428672604e-06, "loss": 0.9197, "step": 24398 }, { "epoch": 0.46, "learning_rate": 2.940404267218933e-06, "loss": 0.907, "step": 24399 }, { "epoch": 0.46, "learning_rate": 2.94025388992615e-06, "loss": 1.1599, "step": 24400 }, { "epoch": 0.46, "learning_rate": 2.940103510989473e-06, "loss": 1.0718, "step": 24401 }, { "epoch": 0.46, "learning_rate": 2.9399531304094623e-06, "loss": 1.0937, "step": 24402 }, { "epoch": 0.46, "learning_rate": 2.93980274818668e-06, "loss": 0.9616, "step": 24403 }, { "epoch": 0.46, "learning_rate": 2.9396523643216883e-06, "loss": 0.8208, "step": 24404 }, { "epoch": 0.46, "learning_rate": 2.939501978815048e-06, "loss": 0.9492, "step": 24405 }, { "epoch": 0.46, "learning_rate": 2.9393515916673205e-06, "loss": 1.0564, "step": 24406 }, { "epoch": 0.46, "learning_rate": 2.9392012028790674e-06, "loss": 0.9656, "step": 24407 }, { "epoch": 0.46, "learning_rate": 2.9390508124508517e-06, "loss": 0.7193, "step": 24408 }, { "epoch": 0.46, "learning_rate": 2.9389004203832326e-06, "loss": 0.7117, "step": 24409 }, { "epoch": 0.46, "learning_rate": 2.9387500266767733e-06, "loss": 0.8296, "step": 24410 }, { "epoch": 0.46, "learning_rate": 2.9385996313320345e-06, "loss": 0.9979, "step": 24411 }, { "epoch": 0.46, "learning_rate": 2.9384492343495783e-06, "loss": 1.0038, "step": 24412 }, { "epoch": 0.46, "learning_rate": 2.938298835729966e-06, "loss": 0.9022, "step": 24413 }, { "epoch": 0.46, "learning_rate": 2.9381484354737594e-06, "loss": 1.0388, "step": 24414 }, { "epoch": 0.46, "learning_rate": 2.9379980335815195e-06, "loss": 0.8193, "step": 24415 }, { "epoch": 0.46, "learning_rate": 2.937847630053809e-06, "loss": 0.8408, "step": 24416 }, { "epoch": 0.46, "learning_rate": 2.9376972248911887e-06, "loss": 0.8882, "step": 24417 }, { "epoch": 0.46, "learning_rate": 2.9375468180942206e-06, "loss": 1.009, "step": 24418 }, { "epoch": 0.46, "learning_rate": 2.9373964096634657e-06, "loss": 1.0688, "step": 24419 }, { "epoch": 0.46, "learning_rate": 2.937245999599486e-06, "loss": 0.9937, "step": 24420 }, { "epoch": 0.46, "learning_rate": 2.9370955879028435e-06, "loss": 0.9086, "step": 24421 }, { "epoch": 0.46, "learning_rate": 2.936945174574099e-06, "loss": 1.0165, "step": 24422 }, { "epoch": 0.46, "learning_rate": 2.9367947596138153e-06, "loss": 0.9948, "step": 24423 }, { "epoch": 0.46, "learning_rate": 2.9366443430225527e-06, "loss": 0.9257, "step": 24424 }, { "epoch": 0.46, "learning_rate": 2.936493924800874e-06, "loss": 0.9641, "step": 24425 }, { "epoch": 0.46, "learning_rate": 2.9363435049493406e-06, "loss": 0.6209, "step": 24426 }, { "epoch": 0.46, "learning_rate": 2.9361930834685125e-06, "loss": 0.9783, "step": 24427 }, { "epoch": 0.46, "learning_rate": 2.9360426603589544e-06, "loss": 0.9053, "step": 24428 }, { "epoch": 0.46, "learning_rate": 2.9358922356212254e-06, "loss": 0.9065, "step": 24429 }, { "epoch": 0.46, "learning_rate": 2.9357418092558887e-06, "loss": 0.9463, "step": 24430 }, { "epoch": 0.46, "learning_rate": 2.935591381263505e-06, "loss": 1.1519, "step": 24431 }, { "epoch": 0.46, "learning_rate": 2.9354409516446377e-06, "loss": 0.9406, "step": 24432 }, { "epoch": 0.46, "learning_rate": 2.9352905203998457e-06, "loss": 1.011, "step": 24433 }, { "epoch": 0.46, "learning_rate": 2.935140087529693e-06, "loss": 1.0184, "step": 24434 }, { "epoch": 0.46, "learning_rate": 2.93498965303474e-06, "loss": 0.85, "step": 24435 }, { "epoch": 0.46, "learning_rate": 2.9348392169155492e-06, "loss": 0.7854, "step": 24436 }, { "epoch": 0.46, "learning_rate": 2.9346887791726826e-06, "loss": 0.93, "step": 24437 }, { "epoch": 0.46, "learning_rate": 2.9345383398067005e-06, "loss": 0.9382, "step": 24438 }, { "epoch": 0.46, "learning_rate": 2.9343878988181662e-06, "loss": 0.9481, "step": 24439 }, { "epoch": 0.46, "learning_rate": 2.934237456207641e-06, "loss": 0.9618, "step": 24440 }, { "epoch": 0.46, "learning_rate": 2.934087011975686e-06, "loss": 0.7923, "step": 24441 }, { "epoch": 0.46, "learning_rate": 2.9339365661228633e-06, "loss": 0.7309, "step": 24442 }, { "epoch": 0.46, "learning_rate": 2.9337861186497353e-06, "loss": 1.1372, "step": 24443 }, { "epoch": 0.46, "learning_rate": 2.933635669556863e-06, "loss": 1.0201, "step": 24444 }, { "epoch": 0.46, "learning_rate": 2.933485218844808e-06, "loss": 0.7979, "step": 24445 }, { "epoch": 0.46, "learning_rate": 2.933334766514134e-06, "loss": 0.9032, "step": 24446 }, { "epoch": 0.46, "learning_rate": 2.9331843125653996e-06, "loss": 0.8031, "step": 24447 }, { "epoch": 0.46, "learning_rate": 2.933033856999168e-06, "loss": 0.9095, "step": 24448 }, { "epoch": 0.46, "learning_rate": 2.9328833998160022e-06, "loss": 0.9618, "step": 24449 }, { "epoch": 0.46, "learning_rate": 2.9327329410164628e-06, "loss": 1.1255, "step": 24450 }, { "epoch": 0.46, "learning_rate": 2.9325824806011122e-06, "loss": 0.9485, "step": 24451 }, { "epoch": 0.46, "learning_rate": 2.932432018570512e-06, "loss": 0.7644, "step": 24452 }, { "epoch": 0.46, "learning_rate": 2.932281554925224e-06, "loss": 0.9326, "step": 24453 }, { "epoch": 0.46, "learning_rate": 2.932131089665809e-06, "loss": 0.7824, "step": 24454 }, { "epoch": 0.46, "learning_rate": 2.93198062279283e-06, "loss": 1.0255, "step": 24455 }, { "epoch": 0.46, "learning_rate": 2.9318301543068482e-06, "loss": 0.9286, "step": 24456 }, { "epoch": 0.46, "learning_rate": 2.9316796842084267e-06, "loss": 0.8536, "step": 24457 }, { "epoch": 0.46, "learning_rate": 2.9315292124981264e-06, "loss": 1.0068, "step": 24458 }, { "epoch": 0.46, "learning_rate": 2.931378739176509e-06, "loss": 0.99, "step": 24459 }, { "epoch": 0.46, "learning_rate": 2.931228264244137e-06, "loss": 0.7572, "step": 24460 }, { "epoch": 0.46, "learning_rate": 2.9310777877015717e-06, "loss": 0.8251, "step": 24461 }, { "epoch": 0.46, "learning_rate": 2.9309273095493746e-06, "loss": 1.0941, "step": 24462 }, { "epoch": 0.46, "learning_rate": 2.9307768297881083e-06, "loss": 0.9281, "step": 24463 }, { "epoch": 0.46, "learning_rate": 2.9306263484183354e-06, "loss": 0.9315, "step": 24464 }, { "epoch": 0.46, "learning_rate": 2.930475865440616e-06, "loss": 0.9285, "step": 24465 }, { "epoch": 0.46, "learning_rate": 2.9303253808555137e-06, "loss": 0.978, "step": 24466 }, { "epoch": 0.46, "learning_rate": 2.9301748946635894e-06, "loss": 1.1197, "step": 24467 }, { "epoch": 0.46, "learning_rate": 2.930024406865405e-06, "loss": 1.1084, "step": 24468 }, { "epoch": 0.46, "learning_rate": 2.9298739174615222e-06, "loss": 1.0013, "step": 24469 }, { "epoch": 0.46, "learning_rate": 2.929723426452504e-06, "loss": 0.9621, "step": 24470 }, { "epoch": 0.46, "learning_rate": 2.929572933838912e-06, "loss": 0.8009, "step": 24471 }, { "epoch": 0.46, "learning_rate": 2.9294224396213068e-06, "loss": 0.912, "step": 24472 }, { "epoch": 0.46, "learning_rate": 2.9292719438002526e-06, "loss": 0.807, "step": 24473 }, { "epoch": 0.46, "learning_rate": 2.929121446376309e-06, "loss": 0.9081, "step": 24474 }, { "epoch": 0.46, "learning_rate": 2.9289709473500393e-06, "loss": 0.9911, "step": 24475 }, { "epoch": 0.46, "learning_rate": 2.9288204467220055e-06, "loss": 1.0211, "step": 24476 }, { "epoch": 0.46, "learning_rate": 2.9286699444927693e-06, "loss": 0.7474, "step": 24477 }, { "epoch": 0.46, "learning_rate": 2.9285194406628924e-06, "loss": 0.8466, "step": 24478 }, { "epoch": 0.46, "learning_rate": 2.928368935232938e-06, "loss": 0.9157, "step": 24479 }, { "epoch": 0.46, "learning_rate": 2.9282184282034663e-06, "loss": 0.8414, "step": 24480 }, { "epoch": 0.46, "learning_rate": 2.92806791957504e-06, "loss": 0.8379, "step": 24481 }, { "epoch": 0.46, "learning_rate": 2.9279174093482215e-06, "loss": 0.9762, "step": 24482 }, { "epoch": 0.46, "learning_rate": 2.9277668975235725e-06, "loss": 1.0313, "step": 24483 }, { "epoch": 0.46, "learning_rate": 2.927616384101655e-06, "loss": 0.8696, "step": 24484 }, { "epoch": 0.46, "learning_rate": 2.9274658690830313e-06, "loss": 0.8779, "step": 24485 }, { "epoch": 0.46, "learning_rate": 2.927315352468263e-06, "loss": 0.8018, "step": 24486 }, { "epoch": 0.46, "learning_rate": 2.9271648342579116e-06, "loss": 0.9061, "step": 24487 }, { "epoch": 0.46, "learning_rate": 2.927014314452541e-06, "loss": 0.9253, "step": 24488 }, { "epoch": 0.46, "learning_rate": 2.926863793052711e-06, "loss": 0.8241, "step": 24489 }, { "epoch": 0.46, "learning_rate": 2.9267132700589843e-06, "loss": 1.1365, "step": 24490 }, { "epoch": 0.46, "learning_rate": 2.9265627454719248e-06, "loss": 0.881, "step": 24491 }, { "epoch": 0.46, "learning_rate": 2.9264122192920925e-06, "loss": 1.017, "step": 24492 }, { "epoch": 0.46, "learning_rate": 2.9262616915200497e-06, "loss": 1.2237, "step": 24493 }, { "epoch": 0.46, "learning_rate": 2.92611116215636e-06, "loss": 1.0496, "step": 24494 }, { "epoch": 0.46, "learning_rate": 2.9259606312015833e-06, "loss": 0.9749, "step": 24495 }, { "epoch": 0.46, "learning_rate": 2.925810098656282e-06, "loss": 0.8024, "step": 24496 }, { "epoch": 0.46, "learning_rate": 2.9256595645210193e-06, "loss": 1.0819, "step": 24497 }, { "epoch": 0.46, "learning_rate": 2.9255090287963574e-06, "loss": 0.9476, "step": 24498 }, { "epoch": 0.46, "learning_rate": 2.9253584914828578e-06, "loss": 1.0367, "step": 24499 }, { "epoch": 0.46, "learning_rate": 2.925207952581083e-06, "loss": 0.9778, "step": 24500 }, { "epoch": 0.46, "learning_rate": 2.9250574120915937e-06, "loss": 0.9858, "step": 24501 }, { "epoch": 0.46, "learning_rate": 2.924906870014953e-06, "loss": 0.785, "step": 24502 }, { "epoch": 0.46, "learning_rate": 2.9247563263517238e-06, "loss": 1.1979, "step": 24503 }, { "epoch": 0.46, "learning_rate": 2.924605781102467e-06, "loss": 0.8931, "step": 24504 }, { "epoch": 0.46, "learning_rate": 2.924455234267745e-06, "loss": 1.079, "step": 24505 }, { "epoch": 0.46, "learning_rate": 2.924304685848122e-06, "loss": 1.0947, "step": 24506 }, { "epoch": 0.46, "learning_rate": 2.924154135844156e-06, "loss": 1.1161, "step": 24507 }, { "epoch": 0.46, "learning_rate": 2.9240035842564123e-06, "loss": 1.0515, "step": 24508 }, { "epoch": 0.46, "learning_rate": 2.923853031085453e-06, "loss": 0.8739, "step": 24509 }, { "epoch": 0.46, "learning_rate": 2.923702476331839e-06, "loss": 0.8392, "step": 24510 }, { "epoch": 0.46, "learning_rate": 2.923551919996132e-06, "loss": 0.9074, "step": 24511 }, { "epoch": 0.46, "learning_rate": 2.9234013620788964e-06, "loss": 1.1465, "step": 24512 }, { "epoch": 0.46, "learning_rate": 2.923250802580692e-06, "loss": 0.9717, "step": 24513 }, { "epoch": 0.46, "learning_rate": 2.9231002415020825e-06, "loss": 1.0302, "step": 24514 }, { "epoch": 0.46, "learning_rate": 2.922949678843631e-06, "loss": 0.8776, "step": 24515 }, { "epoch": 0.46, "learning_rate": 2.9227991146058964e-06, "loss": 0.9371, "step": 24516 }, { "epoch": 0.46, "learning_rate": 2.922648548789444e-06, "loss": 0.8609, "step": 24517 }, { "epoch": 0.46, "learning_rate": 2.9224979813948344e-06, "loss": 1.1177, "step": 24518 }, { "epoch": 0.46, "learning_rate": 2.9223474124226305e-06, "loss": 1.0041, "step": 24519 }, { "epoch": 0.46, "learning_rate": 2.9221968418733935e-06, "loss": 0.9788, "step": 24520 }, { "epoch": 0.46, "learning_rate": 2.922046269747688e-06, "loss": 0.819, "step": 24521 }, { "epoch": 0.46, "learning_rate": 2.9218956960460735e-06, "loss": 0.8645, "step": 24522 }, { "epoch": 0.46, "learning_rate": 2.921745120769114e-06, "loss": 0.7887, "step": 24523 }, { "epoch": 0.46, "learning_rate": 2.921594543917371e-06, "loss": 0.9382, "step": 24524 }, { "epoch": 0.46, "learning_rate": 2.921443965491406e-06, "loss": 0.8419, "step": 24525 }, { "epoch": 0.46, "learning_rate": 2.9212933854917834e-06, "loss": 0.9484, "step": 24526 }, { "epoch": 0.46, "learning_rate": 2.9211428039190644e-06, "loss": 1.1053, "step": 24527 }, { "epoch": 0.46, "learning_rate": 2.92099222077381e-06, "loss": 0.9759, "step": 24528 }, { "epoch": 0.46, "learning_rate": 2.920841636056584e-06, "loss": 0.817, "step": 24529 }, { "epoch": 0.46, "learning_rate": 2.9206910497679487e-06, "loss": 0.8431, "step": 24530 }, { "epoch": 0.46, "learning_rate": 2.9205404619084652e-06, "loss": 1.118, "step": 24531 }, { "epoch": 0.46, "learning_rate": 2.920389872478696e-06, "loss": 0.9949, "step": 24532 }, { "epoch": 0.46, "learning_rate": 2.920239281479205e-06, "loss": 1.0594, "step": 24533 }, { "epoch": 0.46, "learning_rate": 2.9200886889105535e-06, "loss": 0.8968, "step": 24534 }, { "epoch": 0.46, "learning_rate": 2.919938094773303e-06, "loss": 0.862, "step": 24535 }, { "epoch": 0.46, "learning_rate": 2.9197874990680176e-06, "loss": 0.7648, "step": 24536 }, { "epoch": 0.46, "learning_rate": 2.9196369017952575e-06, "loss": 1.0505, "step": 24537 }, { "epoch": 0.46, "learning_rate": 2.9194863029555864e-06, "loss": 1.0297, "step": 24538 }, { "epoch": 0.46, "learning_rate": 2.9193357025495663e-06, "loss": 1.081, "step": 24539 }, { "epoch": 0.46, "learning_rate": 2.9191851005777587e-06, "loss": 0.7759, "step": 24540 }, { "epoch": 0.46, "learning_rate": 2.919034497040728e-06, "loss": 0.9879, "step": 24541 }, { "epoch": 0.46, "learning_rate": 2.918883891939035e-06, "loss": 0.9218, "step": 24542 }, { "epoch": 0.46, "learning_rate": 2.9187332852732427e-06, "loss": 1.0804, "step": 24543 }, { "epoch": 0.46, "learning_rate": 2.9185826770439124e-06, "loss": 0.9249, "step": 24544 }, { "epoch": 0.46, "learning_rate": 2.9184320672516076e-06, "loss": 0.9352, "step": 24545 }, { "epoch": 0.46, "learning_rate": 2.9182814558968904e-06, "loss": 0.8466, "step": 24546 }, { "epoch": 0.46, "learning_rate": 2.9181308429803224e-06, "loss": 1.0345, "step": 24547 }, { "epoch": 0.46, "learning_rate": 2.9179802285024677e-06, "loss": 0.842, "step": 24548 }, { "epoch": 0.46, "learning_rate": 2.917829612463887e-06, "loss": 0.9855, "step": 24549 }, { "epoch": 0.46, "learning_rate": 2.9176789948651436e-06, "loss": 1.0076, "step": 24550 }, { "epoch": 0.46, "learning_rate": 2.9175283757067996e-06, "loss": 0.7818, "step": 24551 }, { "epoch": 0.46, "learning_rate": 2.917377754989417e-06, "loss": 0.9388, "step": 24552 }, { "epoch": 0.46, "learning_rate": 2.917227132713559e-06, "loss": 0.8446, "step": 24553 }, { "epoch": 0.46, "learning_rate": 2.917076508879788e-06, "loss": 0.7243, "step": 24554 }, { "epoch": 0.46, "learning_rate": 2.916925883488666e-06, "loss": 0.8405, "step": 24555 }, { "epoch": 0.46, "learning_rate": 2.9167752565407554e-06, "loss": 1.035, "step": 24556 }, { "epoch": 0.46, "learning_rate": 2.916624628036619e-06, "loss": 0.884, "step": 24557 }, { "epoch": 0.46, "learning_rate": 2.9164739979768187e-06, "loss": 0.8737, "step": 24558 }, { "epoch": 0.46, "learning_rate": 2.9163233663619166e-06, "loss": 0.7375, "step": 24559 }, { "epoch": 0.46, "learning_rate": 2.9161727331924766e-06, "loss": 0.7503, "step": 24560 }, { "epoch": 0.46, "learning_rate": 2.91602209846906e-06, "loss": 1.0315, "step": 24561 }, { "epoch": 0.46, "learning_rate": 2.9158714621922307e-06, "loss": 1.1643, "step": 24562 }, { "epoch": 0.46, "learning_rate": 2.915720824362549e-06, "loss": 1.1621, "step": 24563 }, { "epoch": 0.46, "learning_rate": 2.915570184980579e-06, "loss": 0.9627, "step": 24564 }, { "epoch": 0.46, "learning_rate": 2.9154195440468822e-06, "loss": 0.915, "step": 24565 }, { "epoch": 0.46, "learning_rate": 2.9152689015620216e-06, "loss": 0.9616, "step": 24566 }, { "epoch": 0.46, "learning_rate": 2.91511825752656e-06, "loss": 0.8372, "step": 24567 }, { "epoch": 0.46, "learning_rate": 2.9149676119410595e-06, "loss": 0.9971, "step": 24568 }, { "epoch": 0.46, "learning_rate": 2.9148169648060833e-06, "loss": 1.025, "step": 24569 }, { "epoch": 0.46, "learning_rate": 2.914666316122192e-06, "loss": 0.7531, "step": 24570 }, { "epoch": 0.46, "learning_rate": 2.91451566588995e-06, "loss": 0.9468, "step": 24571 }, { "epoch": 0.46, "learning_rate": 2.9143650141099194e-06, "loss": 1.0224, "step": 24572 }, { "epoch": 0.46, "learning_rate": 2.914214360782662e-06, "loss": 0.7554, "step": 24573 }, { "epoch": 0.46, "learning_rate": 2.914063705908742e-06, "loss": 1.1542, "step": 24574 }, { "epoch": 0.46, "learning_rate": 2.9139130494887198e-06, "loss": 1.0189, "step": 24575 }, { "epoch": 0.46, "learning_rate": 2.913762391523159e-06, "loss": 0.9172, "step": 24576 }, { "epoch": 0.46, "learning_rate": 2.913611732012622e-06, "loss": 0.8607, "step": 24577 }, { "epoch": 0.46, "learning_rate": 2.913461070957672e-06, "loss": 0.8728, "step": 24578 }, { "epoch": 0.46, "learning_rate": 2.913310408358871e-06, "loss": 0.9268, "step": 24579 }, { "epoch": 0.46, "learning_rate": 2.9131597442167816e-06, "loss": 1.0199, "step": 24580 }, { "epoch": 0.46, "learning_rate": 2.913009078531966e-06, "loss": 0.9801, "step": 24581 }, { "epoch": 0.46, "learning_rate": 2.9128584113049866e-06, "loss": 1.1202, "step": 24582 }, { "epoch": 0.46, "learning_rate": 2.912707742536408e-06, "loss": 0.9134, "step": 24583 }, { "epoch": 0.46, "learning_rate": 2.912557072226791e-06, "loss": 0.7822, "step": 24584 }, { "epoch": 0.46, "learning_rate": 2.9124064003766978e-06, "loss": 0.9346, "step": 24585 }, { "epoch": 0.46, "learning_rate": 2.912255726986692e-06, "loss": 1.132, "step": 24586 }, { "epoch": 0.46, "learning_rate": 2.9121050520573362e-06, "loss": 1.1191, "step": 24587 }, { "epoch": 0.46, "learning_rate": 2.9119543755891927e-06, "loss": 0.8254, "step": 24588 }, { "epoch": 0.46, "learning_rate": 2.9118036975828247e-06, "loss": 0.9563, "step": 24589 }, { "epoch": 0.46, "learning_rate": 2.9116530180387937e-06, "loss": 0.9469, "step": 24590 }, { "epoch": 0.46, "learning_rate": 2.9115023369576626e-06, "loss": 0.6006, "step": 24591 }, { "epoch": 0.46, "learning_rate": 2.9113516543399956e-06, "loss": 0.8257, "step": 24592 }, { "epoch": 0.46, "learning_rate": 2.911200970186353e-06, "loss": 1.0224, "step": 24593 }, { "epoch": 0.46, "learning_rate": 2.911050284497298e-06, "loss": 1.0146, "step": 24594 }, { "epoch": 0.46, "learning_rate": 2.9108995972733956e-06, "loss": 0.8518, "step": 24595 }, { "epoch": 0.46, "learning_rate": 2.9107489085152056e-06, "loss": 0.8753, "step": 24596 }, { "epoch": 0.46, "learning_rate": 2.910598218223292e-06, "loss": 0.8724, "step": 24597 }, { "epoch": 0.46, "learning_rate": 2.910447526398218e-06, "loss": 0.8304, "step": 24598 }, { "epoch": 0.46, "learning_rate": 2.9102968330405447e-06, "loss": 0.9405, "step": 24599 }, { "epoch": 0.46, "learning_rate": 2.9101461381508356e-06, "loss": 1.109, "step": 24600 }, { "epoch": 0.46, "learning_rate": 2.909995441729653e-06, "loss": 0.984, "step": 24601 }, { "epoch": 0.46, "learning_rate": 2.909844743777561e-06, "loss": 0.892, "step": 24602 }, { "epoch": 0.46, "learning_rate": 2.9096940442951205e-06, "loss": 0.9301, "step": 24603 }, { "epoch": 0.46, "learning_rate": 2.9095433432828955e-06, "loss": 0.7934, "step": 24604 }, { "epoch": 0.46, "learning_rate": 2.909392640741448e-06, "loss": 0.895, "step": 24605 }, { "epoch": 0.46, "learning_rate": 2.909241936671341e-06, "loss": 1.1439, "step": 24606 }, { "epoch": 0.46, "learning_rate": 2.9090912310731374e-06, "loss": 0.9313, "step": 24607 }, { "epoch": 0.46, "learning_rate": 2.908940523947399e-06, "loss": 0.9764, "step": 24608 }, { "epoch": 0.46, "learning_rate": 2.9087898152946895e-06, "loss": 0.8065, "step": 24609 }, { "epoch": 0.46, "learning_rate": 2.908639105115572e-06, "loss": 0.8227, "step": 24610 }, { "epoch": 0.46, "learning_rate": 2.908488393410608e-06, "loss": 0.8426, "step": 24611 }, { "epoch": 0.46, "learning_rate": 2.908337680180361e-06, "loss": 0.8842, "step": 24612 }, { "epoch": 0.46, "learning_rate": 2.9081869654253935e-06, "loss": 1.0958, "step": 24613 }, { "epoch": 0.46, "learning_rate": 2.9080362491462687e-06, "loss": 0.9695, "step": 24614 }, { "epoch": 0.46, "learning_rate": 2.9078855313435484e-06, "loss": 0.9301, "step": 24615 }, { "epoch": 0.46, "learning_rate": 2.9077348120177968e-06, "loss": 0.9672, "step": 24616 }, { "epoch": 0.46, "learning_rate": 2.907584091169575e-06, "loss": 0.9586, "step": 24617 }, { "epoch": 0.46, "learning_rate": 2.9074333687994477e-06, "loss": 0.8577, "step": 24618 }, { "epoch": 0.46, "learning_rate": 2.907282644907977e-06, "loss": 1.022, "step": 24619 }, { "epoch": 0.46, "learning_rate": 2.9071319194957243e-06, "loss": 0.9461, "step": 24620 }, { "epoch": 0.46, "learning_rate": 2.9069811925632534e-06, "loss": 0.8493, "step": 24621 }, { "epoch": 0.46, "learning_rate": 2.906830464111128e-06, "loss": 1.1265, "step": 24622 }, { "epoch": 0.46, "learning_rate": 2.9066797341399095e-06, "loss": 0.9058, "step": 24623 }, { "epoch": 0.46, "learning_rate": 2.9065290026501613e-06, "loss": 0.9343, "step": 24624 }, { "epoch": 0.46, "learning_rate": 2.906378269642447e-06, "loss": 0.9607, "step": 24625 }, { "epoch": 0.46, "learning_rate": 2.9062275351173287e-06, "loss": 0.8182, "step": 24626 }, { "epoch": 0.46, "learning_rate": 2.9060767990753684e-06, "loss": 0.7822, "step": 24627 }, { "epoch": 0.46, "learning_rate": 2.90592606151713e-06, "loss": 0.7985, "step": 24628 }, { "epoch": 0.46, "learning_rate": 2.9057753224431764e-06, "loss": 0.8957, "step": 24629 }, { "epoch": 0.46, "learning_rate": 2.90562458185407e-06, "loss": 0.8208, "step": 24630 }, { "epoch": 0.46, "learning_rate": 2.9054738397503747e-06, "loss": 1.1588, "step": 24631 }, { "epoch": 0.46, "learning_rate": 2.905323096132651e-06, "loss": 0.8749, "step": 24632 }, { "epoch": 0.46, "learning_rate": 2.9051723510014644e-06, "loss": 0.9698, "step": 24633 }, { "epoch": 0.46, "learning_rate": 2.9050216043573765e-06, "loss": 0.9129, "step": 24634 }, { "epoch": 0.46, "learning_rate": 2.90487085620095e-06, "loss": 0.9064, "step": 24635 }, { "epoch": 0.46, "learning_rate": 2.904720106532748e-06, "loss": 1.0544, "step": 24636 }, { "epoch": 0.46, "learning_rate": 2.9045693553533343e-06, "loss": 1.1287, "step": 24637 }, { "epoch": 0.46, "learning_rate": 2.9044186026632704e-06, "loss": 0.7358, "step": 24638 }, { "epoch": 0.46, "learning_rate": 2.9042678484631205e-06, "loss": 1.0196, "step": 24639 }, { "epoch": 0.46, "learning_rate": 2.9041170927534464e-06, "loss": 1.2302, "step": 24640 }, { "epoch": 0.46, "learning_rate": 2.9039663355348115e-06, "loss": 0.7438, "step": 24641 }, { "epoch": 0.46, "learning_rate": 2.9038155768077787e-06, "loss": 0.8605, "step": 24642 }, { "epoch": 0.46, "learning_rate": 2.9036648165729103e-06, "loss": 1.23, "step": 24643 }, { "epoch": 0.46, "learning_rate": 2.9035140548307705e-06, "loss": 1.1701, "step": 24644 }, { "epoch": 0.46, "learning_rate": 2.9033632915819217e-06, "loss": 0.7506, "step": 24645 }, { "epoch": 0.46, "learning_rate": 2.903212526826927e-06, "loss": 0.8953, "step": 24646 }, { "epoch": 0.47, "learning_rate": 2.9030617605663482e-06, "loss": 0.7179, "step": 24647 }, { "epoch": 0.47, "learning_rate": 2.902910992800749e-06, "loss": 0.7062, "step": 24648 }, { "epoch": 0.47, "learning_rate": 2.9027602235306935e-06, "loss": 1.1562, "step": 24649 }, { "epoch": 0.47, "learning_rate": 2.9026094527567426e-06, "loss": 1.052, "step": 24650 }, { "epoch": 0.47, "learning_rate": 2.9024586804794615e-06, "loss": 1.0559, "step": 24651 }, { "epoch": 0.47, "learning_rate": 2.902307906699412e-06, "loss": 0.7846, "step": 24652 }, { "epoch": 0.47, "learning_rate": 2.9021571314171565e-06, "loss": 0.9522, "step": 24653 }, { "epoch": 0.47, "learning_rate": 2.9020063546332582e-06, "loss": 0.8126, "step": 24654 }, { "epoch": 0.47, "learning_rate": 2.9018555763482812e-06, "loss": 0.9593, "step": 24655 }, { "epoch": 0.47, "learning_rate": 2.9017047965627883e-06, "loss": 0.876, "step": 24656 }, { "epoch": 0.47, "learning_rate": 2.9015540152773402e-06, "loss": 0.8964, "step": 24657 }, { "epoch": 0.47, "learning_rate": 2.9014032324925032e-06, "loss": 0.9115, "step": 24658 }, { "epoch": 0.47, "learning_rate": 2.901252448208839e-06, "loss": 0.9382, "step": 24659 }, { "epoch": 0.47, "learning_rate": 2.9011016624269096e-06, "loss": 0.9785, "step": 24660 }, { "epoch": 0.47, "learning_rate": 2.9009508751472796e-06, "loss": 0.9667, "step": 24661 }, { "epoch": 0.47, "learning_rate": 2.900800086370511e-06, "loss": 0.9803, "step": 24662 }, { "epoch": 0.47, "learning_rate": 2.9006492960971673e-06, "loss": 1.2019, "step": 24663 }, { "epoch": 0.47, "learning_rate": 2.9004985043278107e-06, "loss": 0.8288, "step": 24664 }, { "epoch": 0.47, "learning_rate": 2.9003477110630057e-06, "loss": 0.7906, "step": 24665 }, { "epoch": 0.47, "learning_rate": 2.900196916303314e-06, "loss": 0.8799, "step": 24666 }, { "epoch": 0.47, "learning_rate": 2.9000461200493e-06, "loss": 0.8997, "step": 24667 }, { "epoch": 0.47, "learning_rate": 2.8998953223015257e-06, "loss": 0.9511, "step": 24668 }, { "epoch": 0.47, "learning_rate": 2.8997445230605554e-06, "loss": 1.0905, "step": 24669 }, { "epoch": 0.47, "learning_rate": 2.89959372232695e-06, "loss": 0.7874, "step": 24670 }, { "epoch": 0.47, "learning_rate": 2.899442920101274e-06, "loss": 0.9813, "step": 24671 }, { "epoch": 0.47, "learning_rate": 2.8992921163840914e-06, "loss": 1.0595, "step": 24672 }, { "epoch": 0.47, "learning_rate": 2.899141311175964e-06, "loss": 0.7439, "step": 24673 }, { "epoch": 0.47, "learning_rate": 2.8989905044774542e-06, "loss": 0.8488, "step": 24674 }, { "epoch": 0.47, "learning_rate": 2.8988396962891276e-06, "loss": 1.2021, "step": 24675 }, { "epoch": 0.47, "learning_rate": 2.8986888866115442e-06, "loss": 0.8607, "step": 24676 }, { "epoch": 0.47, "learning_rate": 2.8985380754452696e-06, "loss": 0.7263, "step": 24677 }, { "epoch": 0.47, "learning_rate": 2.898387262790866e-06, "loss": 0.8921, "step": 24678 }, { "epoch": 0.47, "learning_rate": 2.8982364486488964e-06, "loss": 0.8332, "step": 24679 }, { "epoch": 0.47, "learning_rate": 2.8980856330199236e-06, "loss": 1.1133, "step": 24680 }, { "epoch": 0.47, "learning_rate": 2.897934815904512e-06, "loss": 1.3141, "step": 24681 }, { "epoch": 0.47, "learning_rate": 2.897783997303224e-06, "loss": 0.9688, "step": 24682 }, { "epoch": 0.47, "learning_rate": 2.8976331772166227e-06, "loss": 0.9233, "step": 24683 }, { "epoch": 0.47, "learning_rate": 2.8974823556452712e-06, "loss": 0.9664, "step": 24684 }, { "epoch": 0.47, "learning_rate": 2.897331532589733e-06, "loss": 0.961, "step": 24685 }, { "epoch": 0.47, "learning_rate": 2.8971807080505703e-06, "loss": 0.8699, "step": 24686 }, { "epoch": 0.47, "learning_rate": 2.8970298820283482e-06, "loss": 0.8998, "step": 24687 }, { "epoch": 0.47, "learning_rate": 2.8968790545236275e-06, "loss": 0.9983, "step": 24688 }, { "epoch": 0.47, "learning_rate": 2.8967282255369735e-06, "loss": 0.9204, "step": 24689 }, { "epoch": 0.47, "learning_rate": 2.896577395068948e-06, "loss": 0.5858, "step": 24690 }, { "epoch": 0.47, "learning_rate": 2.8964265631201146e-06, "loss": 0.7168, "step": 24691 }, { "epoch": 0.47, "learning_rate": 2.896275729691036e-06, "loss": 0.8511, "step": 24692 }, { "epoch": 0.47, "learning_rate": 2.8961248947822773e-06, "loss": 1.1197, "step": 24693 }, { "epoch": 0.47, "learning_rate": 2.8959740583943997e-06, "loss": 0.9612, "step": 24694 }, { "epoch": 0.47, "learning_rate": 2.8958232205279673e-06, "loss": 1.0709, "step": 24695 }, { "epoch": 0.47, "learning_rate": 2.895672381183543e-06, "loss": 0.8978, "step": 24696 }, { "epoch": 0.47, "learning_rate": 2.8955215403616905e-06, "loss": 0.9112, "step": 24697 }, { "epoch": 0.47, "learning_rate": 2.895370698062972e-06, "loss": 0.7483, "step": 24698 }, { "epoch": 0.47, "learning_rate": 2.895219854287952e-06, "loss": 0.8563, "step": 24699 }, { "epoch": 0.47, "learning_rate": 2.8950690090371925e-06, "loss": 1.1653, "step": 24700 }, { "epoch": 0.47, "learning_rate": 2.8949181623112584e-06, "loss": 0.9846, "step": 24701 }, { "epoch": 0.47, "learning_rate": 2.8947673141107115e-06, "loss": 0.8755, "step": 24702 }, { "epoch": 0.47, "learning_rate": 2.894616464436115e-06, "loss": 1.0592, "step": 24703 }, { "epoch": 0.47, "learning_rate": 2.894465613288034e-06, "loss": 0.806, "step": 24704 }, { "epoch": 0.47, "learning_rate": 2.8943147606670293e-06, "loss": 1.0872, "step": 24705 }, { "epoch": 0.47, "learning_rate": 2.894163906573666e-06, "loss": 1.0725, "step": 24706 }, { "epoch": 0.47, "learning_rate": 2.894013051008506e-06, "loss": 0.7732, "step": 24707 }, { "epoch": 0.47, "learning_rate": 2.8938621939721146e-06, "loss": 0.793, "step": 24708 }, { "epoch": 0.47, "learning_rate": 2.893711335465053e-06, "loss": 0.8563, "step": 24709 }, { "epoch": 0.47, "learning_rate": 2.8935604754878855e-06, "loss": 0.9792, "step": 24710 }, { "epoch": 0.47, "learning_rate": 2.893409614041176e-06, "loss": 0.9434, "step": 24711 }, { "epoch": 0.47, "learning_rate": 2.8932587511254857e-06, "loss": 1.1138, "step": 24712 }, { "epoch": 0.47, "learning_rate": 2.89310788674138e-06, "loss": 0.9534, "step": 24713 }, { "epoch": 0.47, "learning_rate": 2.8929570208894215e-06, "loss": 0.9146, "step": 24714 }, { "epoch": 0.47, "learning_rate": 2.8928061535701733e-06, "loss": 0.9245, "step": 24715 }, { "epoch": 0.47, "learning_rate": 2.8926552847841995e-06, "loss": 1.0147, "step": 24716 }, { "epoch": 0.47, "learning_rate": 2.8925044145320624e-06, "loss": 0.9429, "step": 24717 }, { "epoch": 0.47, "learning_rate": 2.8923535428143263e-06, "loss": 1.0588, "step": 24718 }, { "epoch": 0.47, "learning_rate": 2.8922026696315536e-06, "loss": 0.9474, "step": 24719 }, { "epoch": 0.47, "learning_rate": 2.892051794984308e-06, "loss": 0.9771, "step": 24720 }, { "epoch": 0.47, "learning_rate": 2.8919009188731533e-06, "loss": 0.8953, "step": 24721 }, { "epoch": 0.47, "learning_rate": 2.8917500412986527e-06, "loss": 0.8743, "step": 24722 }, { "epoch": 0.47, "learning_rate": 2.89159916226137e-06, "loss": 0.8287, "step": 24723 }, { "epoch": 0.47, "learning_rate": 2.8914482817618673e-06, "loss": 1.0864, "step": 24724 }, { "epoch": 0.47, "learning_rate": 2.891297399800709e-06, "loss": 1.0815, "step": 24725 }, { "epoch": 0.47, "learning_rate": 2.8911465163784576e-06, "loss": 1.0755, "step": 24726 }, { "epoch": 0.47, "learning_rate": 2.890995631495677e-06, "loss": 0.7581, "step": 24727 }, { "epoch": 0.47, "learning_rate": 2.8908447451529313e-06, "loss": 1.1411, "step": 24728 }, { "epoch": 0.47, "learning_rate": 2.890693857350784e-06, "loss": 0.7976, "step": 24729 }, { "epoch": 0.47, "learning_rate": 2.8905429680897966e-06, "loss": 1.0349, "step": 24730 }, { "epoch": 0.47, "learning_rate": 2.890392077370535e-06, "loss": 1.2352, "step": 24731 }, { "epoch": 0.47, "learning_rate": 2.8902411851935607e-06, "loss": 1.1188, "step": 24732 }, { "epoch": 0.47, "learning_rate": 2.890090291559437e-06, "loss": 0.8114, "step": 24733 }, { "epoch": 0.47, "learning_rate": 2.8899393964687284e-06, "loss": 0.9697, "step": 24734 }, { "epoch": 0.47, "learning_rate": 2.889788499921999e-06, "loss": 0.8262, "step": 24735 }, { "epoch": 0.47, "learning_rate": 2.8896376019198106e-06, "loss": 0.9831, "step": 24736 }, { "epoch": 0.47, "learning_rate": 2.889486702462727e-06, "loss": 1.1721, "step": 24737 }, { "epoch": 0.47, "learning_rate": 2.8893358015513128e-06, "loss": 0.9414, "step": 24738 }, { "epoch": 0.47, "learning_rate": 2.8891848991861306e-06, "loss": 0.8985, "step": 24739 }, { "epoch": 0.47, "learning_rate": 2.8890339953677436e-06, "loss": 0.9508, "step": 24740 }, { "epoch": 0.47, "learning_rate": 2.8888830900967153e-06, "loss": 0.838, "step": 24741 }, { "epoch": 0.47, "learning_rate": 2.8887321833736096e-06, "loss": 0.7062, "step": 24742 }, { "epoch": 0.47, "learning_rate": 2.88858127519899e-06, "loss": 1.039, "step": 24743 }, { "epoch": 0.47, "learning_rate": 2.8884303655734202e-06, "loss": 0.9814, "step": 24744 }, { "epoch": 0.47, "learning_rate": 2.888279454497463e-06, "loss": 1.0969, "step": 24745 }, { "epoch": 0.47, "learning_rate": 2.888128541971682e-06, "loss": 0.9959, "step": 24746 }, { "epoch": 0.47, "learning_rate": 2.887977627996641e-06, "loss": 0.8114, "step": 24747 }, { "epoch": 0.47, "learning_rate": 2.887826712572904e-06, "loss": 0.7506, "step": 24748 }, { "epoch": 0.47, "learning_rate": 2.887675795701033e-06, "loss": 0.9708, "step": 24749 }, { "epoch": 0.47, "learning_rate": 2.8875248773815932e-06, "loss": 1.299, "step": 24750 }, { "epoch": 0.47, "learning_rate": 2.887373957615147e-06, "loss": 0.8079, "step": 24751 }, { "epoch": 0.47, "learning_rate": 2.8872230364022587e-06, "loss": 0.7805, "step": 24752 }, { "epoch": 0.47, "learning_rate": 2.8870721137434914e-06, "loss": 0.9135, "step": 24753 }, { "epoch": 0.47, "learning_rate": 2.8869211896394077e-06, "loss": 1.0934, "step": 24754 }, { "epoch": 0.47, "learning_rate": 2.886770264090573e-06, "loss": 0.8488, "step": 24755 }, { "epoch": 0.47, "learning_rate": 2.8866193370975504e-06, "loss": 0.9236, "step": 24756 }, { "epoch": 0.47, "learning_rate": 2.886468408660903e-06, "loss": 1.082, "step": 24757 }, { "epoch": 0.47, "learning_rate": 2.886317478781194e-06, "loss": 0.7259, "step": 24758 }, { "epoch": 0.47, "learning_rate": 2.886166547458987e-06, "loss": 1.062, "step": 24759 }, { "epoch": 0.47, "learning_rate": 2.886015614694847e-06, "loss": 0.9496, "step": 24760 }, { "epoch": 0.47, "learning_rate": 2.885864680489335e-06, "loss": 0.9529, "step": 24761 }, { "epoch": 0.47, "learning_rate": 2.8857137448430172e-06, "loss": 0.9535, "step": 24762 }, { "epoch": 0.47, "learning_rate": 2.885562807756456e-06, "loss": 0.9193, "step": 24763 }, { "epoch": 0.47, "learning_rate": 2.8854118692302148e-06, "loss": 0.9565, "step": 24764 }, { "epoch": 0.47, "learning_rate": 2.885260929264858e-06, "loss": 1.0322, "step": 24765 }, { "epoch": 0.47, "learning_rate": 2.8851099878609485e-06, "loss": 0.7449, "step": 24766 }, { "epoch": 0.47, "learning_rate": 2.88495904501905e-06, "loss": 0.9448, "step": 24767 }, { "epoch": 0.47, "learning_rate": 2.884808100739726e-06, "loss": 1.2354, "step": 24768 }, { "epoch": 0.47, "learning_rate": 2.88465715502354e-06, "loss": 0.8797, "step": 24769 }, { "epoch": 0.47, "learning_rate": 2.884506207871057e-06, "loss": 0.9592, "step": 24770 }, { "epoch": 0.47, "learning_rate": 2.8843552592828394e-06, "loss": 0.8856, "step": 24771 }, { "epoch": 0.47, "learning_rate": 2.8842043092594506e-06, "loss": 0.7691, "step": 24772 }, { "epoch": 0.47, "learning_rate": 2.884053357801455e-06, "loss": 0.8165, "step": 24773 }, { "epoch": 0.47, "learning_rate": 2.8839024049094168e-06, "loss": 1.0764, "step": 24774 }, { "epoch": 0.47, "learning_rate": 2.883751450583897e-06, "loss": 0.9501, "step": 24775 }, { "epoch": 0.47, "learning_rate": 2.8836004948254612e-06, "loss": 1.0212, "step": 24776 }, { "epoch": 0.47, "learning_rate": 2.8834495376346744e-06, "loss": 0.9138, "step": 24777 }, { "epoch": 0.47, "learning_rate": 2.883298579012098e-06, "loss": 0.994, "step": 24778 }, { "epoch": 0.47, "learning_rate": 2.8831476189582964e-06, "loss": 0.9818, "step": 24779 }, { "epoch": 0.47, "learning_rate": 2.882996657473834e-06, "loss": 0.8746, "step": 24780 }, { "epoch": 0.47, "learning_rate": 2.8828456945592727e-06, "loss": 1.074, "step": 24781 }, { "epoch": 0.47, "learning_rate": 2.8826947302151774e-06, "loss": 0.8399, "step": 24782 }, { "epoch": 0.47, "learning_rate": 2.882543764442112e-06, "loss": 0.9369, "step": 24783 }, { "epoch": 0.47, "learning_rate": 2.88239279724064e-06, "loss": 1.0825, "step": 24784 }, { "epoch": 0.47, "learning_rate": 2.882241828611326e-06, "loss": 0.8524, "step": 24785 }, { "epoch": 0.47, "learning_rate": 2.882090858554731e-06, "loss": 1.0526, "step": 24786 }, { "epoch": 0.47, "learning_rate": 2.8819398870714217e-06, "loss": 1.0409, "step": 24787 }, { "epoch": 0.47, "learning_rate": 2.88178891416196e-06, "loss": 1.1248, "step": 24788 }, { "epoch": 0.47, "learning_rate": 2.88163793982691e-06, "loss": 0.9649, "step": 24789 }, { "epoch": 0.47, "learning_rate": 2.8814869640668364e-06, "loss": 0.9366, "step": 24790 }, { "epoch": 0.47, "learning_rate": 2.8813359868823023e-06, "loss": 0.9444, "step": 24791 }, { "epoch": 0.47, "learning_rate": 2.88118500827387e-06, "loss": 0.9501, "step": 24792 }, { "epoch": 0.47, "learning_rate": 2.8810340282421055e-06, "loss": 1.0214, "step": 24793 }, { "epoch": 0.47, "learning_rate": 2.8808830467875716e-06, "loss": 1.1842, "step": 24794 }, { "epoch": 0.47, "learning_rate": 2.880732063910832e-06, "loss": 0.8976, "step": 24795 }, { "epoch": 0.47, "learning_rate": 2.8805810796124502e-06, "loss": 0.9366, "step": 24796 }, { "epoch": 0.47, "learning_rate": 2.8804300938929906e-06, "loss": 0.9762, "step": 24797 }, { "epoch": 0.47, "learning_rate": 2.8802791067530165e-06, "loss": 0.8739, "step": 24798 }, { "epoch": 0.47, "learning_rate": 2.8801281181930916e-06, "loss": 0.9667, "step": 24799 }, { "epoch": 0.47, "learning_rate": 2.8799771282137814e-06, "loss": 1.1451, "step": 24800 }, { "epoch": 0.47, "learning_rate": 2.8798261368156473e-06, "loss": 0.9241, "step": 24801 }, { "epoch": 0.47, "learning_rate": 2.879675143999254e-06, "loss": 0.9145, "step": 24802 }, { "epoch": 0.47, "learning_rate": 2.879524149765165e-06, "loss": 0.9788, "step": 24803 }, { "epoch": 0.47, "learning_rate": 2.8793731541139447e-06, "loss": 0.8732, "step": 24804 }, { "epoch": 0.47, "learning_rate": 2.8792221570461566e-06, "loss": 0.7486, "step": 24805 }, { "epoch": 0.47, "learning_rate": 2.8790711585623654e-06, "loss": 1.0209, "step": 24806 }, { "epoch": 0.47, "learning_rate": 2.8789201586631334e-06, "loss": 1.0184, "step": 24807 }, { "epoch": 0.47, "learning_rate": 2.878769157349025e-06, "loss": 0.9168, "step": 24808 }, { "epoch": 0.47, "learning_rate": 2.8786181546206044e-06, "loss": 0.7203, "step": 24809 }, { "epoch": 0.47, "learning_rate": 2.8784671504784352e-06, "loss": 0.9721, "step": 24810 }, { "epoch": 0.47, "learning_rate": 2.878316144923081e-06, "loss": 0.9729, "step": 24811 }, { "epoch": 0.47, "learning_rate": 2.8781651379551066e-06, "loss": 1.168, "step": 24812 }, { "epoch": 0.47, "learning_rate": 2.8780141295750745e-06, "loss": 0.818, "step": 24813 }, { "epoch": 0.47, "learning_rate": 2.87786311978355e-06, "loss": 0.9595, "step": 24814 }, { "epoch": 0.47, "learning_rate": 2.8777121085810962e-06, "loss": 1.0388, "step": 24815 }, { "epoch": 0.47, "learning_rate": 2.8775610959682758e-06, "loss": 0.8091, "step": 24816 }, { "epoch": 0.47, "learning_rate": 2.877410081945654e-06, "loss": 0.8778, "step": 24817 }, { "epoch": 0.47, "learning_rate": 2.8772590665137957e-06, "loss": 1.1193, "step": 24818 }, { "epoch": 0.47, "learning_rate": 2.8771080496732627e-06, "loss": 1.1002, "step": 24819 }, { "epoch": 0.47, "learning_rate": 2.87695703142462e-06, "loss": 0.8225, "step": 24820 }, { "epoch": 0.47, "learning_rate": 2.876806011768432e-06, "loss": 0.8524, "step": 24821 }, { "epoch": 0.47, "learning_rate": 2.876654990705261e-06, "loss": 0.8035, "step": 24822 }, { "epoch": 0.47, "learning_rate": 2.876503968235672e-06, "loss": 1.0007, "step": 24823 }, { "epoch": 0.47, "learning_rate": 2.876352944360229e-06, "loss": 1.0275, "step": 24824 }, { "epoch": 0.47, "learning_rate": 2.8762019190794953e-06, "loss": 1.1021, "step": 24825 }, { "epoch": 0.47, "learning_rate": 2.876050892394035e-06, "loss": 0.952, "step": 24826 }, { "epoch": 0.47, "learning_rate": 2.8758998643044133e-06, "loss": 0.9137, "step": 24827 }, { "epoch": 0.47, "learning_rate": 2.8757488348111918e-06, "loss": 1.1196, "step": 24828 }, { "epoch": 0.47, "learning_rate": 2.8755978039149364e-06, "loss": 1.0089, "step": 24829 }, { "epoch": 0.47, "learning_rate": 2.87544677161621e-06, "loss": 1.0428, "step": 24830 }, { "epoch": 0.47, "learning_rate": 2.8752957379155765e-06, "loss": 1.0965, "step": 24831 }, { "epoch": 0.47, "learning_rate": 2.8751447028136005e-06, "loss": 1.0841, "step": 24832 }, { "epoch": 0.47, "learning_rate": 2.8749936663108464e-06, "loss": 1.0345, "step": 24833 }, { "epoch": 0.47, "learning_rate": 2.874842628407877e-06, "loss": 0.9458, "step": 24834 }, { "epoch": 0.47, "learning_rate": 2.874691589105256e-06, "loss": 0.9831, "step": 24835 }, { "epoch": 0.47, "learning_rate": 2.8745405484035492e-06, "loss": 0.9323, "step": 24836 }, { "epoch": 0.47, "learning_rate": 2.874389506303319e-06, "loss": 0.8712, "step": 24837 }, { "epoch": 0.47, "learning_rate": 2.874238462805129e-06, "loss": 0.912, "step": 24838 }, { "epoch": 0.47, "learning_rate": 2.874087417909546e-06, "loss": 0.812, "step": 24839 }, { "epoch": 0.47, "learning_rate": 2.8739363716171305e-06, "loss": 0.7932, "step": 24840 }, { "epoch": 0.47, "learning_rate": 2.8737853239284486e-06, "loss": 0.8879, "step": 24841 }, { "epoch": 0.47, "learning_rate": 2.8736342748440636e-06, "loss": 1.0445, "step": 24842 }, { "epoch": 0.47, "learning_rate": 2.87348322436454e-06, "loss": 1.0339, "step": 24843 }, { "epoch": 0.47, "learning_rate": 2.8733321724904404e-06, "loss": 0.9937, "step": 24844 }, { "epoch": 0.47, "learning_rate": 2.8731811192223314e-06, "loss": 0.8716, "step": 24845 }, { "epoch": 0.47, "learning_rate": 2.8730300645607744e-06, "loss": 0.8466, "step": 24846 }, { "epoch": 0.47, "learning_rate": 2.8728790085063353e-06, "loss": 0.8748, "step": 24847 }, { "epoch": 0.47, "learning_rate": 2.8727279510595772e-06, "loss": 0.8881, "step": 24848 }, { "epoch": 0.47, "learning_rate": 2.8725768922210644e-06, "loss": 0.7535, "step": 24849 }, { "epoch": 0.47, "learning_rate": 2.8724258319913606e-06, "loss": 1.2277, "step": 24850 }, { "epoch": 0.47, "learning_rate": 2.8722747703710303e-06, "loss": 1.0314, "step": 24851 }, { "epoch": 0.47, "learning_rate": 2.872123707360637e-06, "loss": 0.985, "step": 24852 }, { "epoch": 0.47, "learning_rate": 2.8719726429607457e-06, "loss": 0.8147, "step": 24853 }, { "epoch": 0.47, "learning_rate": 2.8718215771719206e-06, "loss": 0.9513, "step": 24854 }, { "epoch": 0.47, "learning_rate": 2.8716705099947246e-06, "loss": 1.0698, "step": 24855 }, { "epoch": 0.47, "learning_rate": 2.871519441429722e-06, "loss": 1.2729, "step": 24856 }, { "epoch": 0.47, "learning_rate": 2.8713683714774774e-06, "loss": 1.0324, "step": 24857 }, { "epoch": 0.47, "learning_rate": 2.8712173001385545e-06, "loss": 0.9815, "step": 24858 }, { "epoch": 0.47, "learning_rate": 2.8710662274135176e-06, "loss": 0.914, "step": 24859 }, { "epoch": 0.47, "learning_rate": 2.8709151533029313e-06, "loss": 0.8113, "step": 24860 }, { "epoch": 0.47, "learning_rate": 2.8707640778073585e-06, "loss": 0.8795, "step": 24861 }, { "epoch": 0.47, "learning_rate": 2.8706130009273645e-06, "loss": 0.9745, "step": 24862 }, { "epoch": 0.47, "learning_rate": 2.870461922663513e-06, "loss": 1.0399, "step": 24863 }, { "epoch": 0.47, "learning_rate": 2.870310843016368e-06, "loss": 1.028, "step": 24864 }, { "epoch": 0.47, "learning_rate": 2.8701597619864936e-06, "loss": 1.0214, "step": 24865 }, { "epoch": 0.47, "learning_rate": 2.870008679574454e-06, "loss": 0.9095, "step": 24866 }, { "epoch": 0.47, "learning_rate": 2.8698575957808126e-06, "loss": 0.9384, "step": 24867 }, { "epoch": 0.47, "learning_rate": 2.869706510606135e-06, "loss": 1.0771, "step": 24868 }, { "epoch": 0.47, "learning_rate": 2.8695554240509847e-06, "loss": 1.0657, "step": 24869 }, { "epoch": 0.47, "learning_rate": 2.869404336115925e-06, "loss": 1.0215, "step": 24870 }, { "epoch": 0.47, "learning_rate": 2.8692532468015217e-06, "loss": 0.833, "step": 24871 }, { "epoch": 0.47, "learning_rate": 2.8691021561083376e-06, "loss": 0.7337, "step": 24872 }, { "epoch": 0.47, "learning_rate": 2.8689510640369377e-06, "loss": 0.689, "step": 24873 }, { "epoch": 0.47, "learning_rate": 2.8687999705878854e-06, "loss": 0.9546, "step": 24874 }, { "epoch": 0.47, "learning_rate": 2.8686488757617464e-06, "loss": 1.1073, "step": 24875 }, { "epoch": 0.47, "learning_rate": 2.868497779559083e-06, "loss": 0.9139, "step": 24876 }, { "epoch": 0.47, "learning_rate": 2.86834668198046e-06, "loss": 0.8542, "step": 24877 }, { "epoch": 0.47, "learning_rate": 2.8681955830264423e-06, "loss": 0.6503, "step": 24878 }, { "epoch": 0.47, "learning_rate": 2.8680444826975927e-06, "loss": 0.7559, "step": 24879 }, { "epoch": 0.47, "learning_rate": 2.8678933809944766e-06, "loss": 0.9051, "step": 24880 }, { "epoch": 0.47, "learning_rate": 2.867742277917659e-06, "loss": 0.9921, "step": 24881 }, { "epoch": 0.47, "learning_rate": 2.867591173467702e-06, "loss": 0.9022, "step": 24882 }, { "epoch": 0.47, "learning_rate": 2.8674400676451706e-06, "loss": 0.7925, "step": 24883 }, { "epoch": 0.47, "learning_rate": 2.8672889604506302e-06, "loss": 0.8536, "step": 24884 }, { "epoch": 0.47, "learning_rate": 2.867137851884643e-06, "loss": 0.9509, "step": 24885 }, { "epoch": 0.47, "learning_rate": 2.8669867419477756e-06, "loss": 1.1702, "step": 24886 }, { "epoch": 0.47, "learning_rate": 2.86683563064059e-06, "loss": 1.1987, "step": 24887 }, { "epoch": 0.47, "learning_rate": 2.866684517963651e-06, "loss": 1.0978, "step": 24888 }, { "epoch": 0.47, "learning_rate": 2.866533403917524e-06, "loss": 0.9187, "step": 24889 }, { "epoch": 0.47, "learning_rate": 2.8663822885027724e-06, "loss": 0.8534, "step": 24890 }, { "epoch": 0.47, "learning_rate": 2.866231171719961e-06, "loss": 0.8894, "step": 24891 }, { "epoch": 0.47, "learning_rate": 2.8660800535696533e-06, "loss": 0.8865, "step": 24892 }, { "epoch": 0.47, "learning_rate": 2.8659289340524132e-06, "loss": 1.1283, "step": 24893 }, { "epoch": 0.47, "learning_rate": 2.8657778131688065e-06, "loss": 0.9703, "step": 24894 }, { "epoch": 0.47, "learning_rate": 2.8656266909193964e-06, "loss": 0.9238, "step": 24895 }, { "epoch": 0.47, "learning_rate": 2.8654755673047475e-06, "loss": 0.8234, "step": 24896 }, { "epoch": 0.47, "learning_rate": 2.865324442325424e-06, "loss": 0.8567, "step": 24897 }, { "epoch": 0.47, "learning_rate": 2.86517331598199e-06, "loss": 0.9404, "step": 24898 }, { "epoch": 0.47, "learning_rate": 2.8650221882750105e-06, "loss": 1.287, "step": 24899 }, { "epoch": 0.47, "learning_rate": 2.864871059205049e-06, "loss": 1.0641, "step": 24900 }, { "epoch": 0.47, "learning_rate": 2.86471992877267e-06, "loss": 0.7072, "step": 24901 }, { "epoch": 0.47, "learning_rate": 2.8645687969784386e-06, "loss": 0.8172, "step": 24902 }, { "epoch": 0.47, "learning_rate": 2.864417663822918e-06, "loss": 0.7712, "step": 24903 }, { "epoch": 0.47, "learning_rate": 2.864266529306674e-06, "loss": 0.8901, "step": 24904 }, { "epoch": 0.47, "learning_rate": 2.864115393430269e-06, "loss": 0.9987, "step": 24905 }, { "epoch": 0.47, "learning_rate": 2.8639642561942682e-06, "loss": 1.0514, "step": 24906 }, { "epoch": 0.47, "learning_rate": 2.8638131175992356e-06, "loss": 0.9438, "step": 24907 }, { "epoch": 0.47, "learning_rate": 2.863661977645737e-06, "loss": 0.9074, "step": 24908 }, { "epoch": 0.47, "learning_rate": 2.863510836334335e-06, "loss": 1.0177, "step": 24909 }, { "epoch": 0.47, "learning_rate": 2.8633596936655957e-06, "loss": 0.9983, "step": 24910 }, { "epoch": 0.47, "learning_rate": 2.863208549640081e-06, "loss": 1.0205, "step": 24911 }, { "epoch": 0.47, "learning_rate": 2.8630574042583576e-06, "loss": 1.1556, "step": 24912 }, { "epoch": 0.47, "learning_rate": 2.8629062575209887e-06, "loss": 1.0149, "step": 24913 }, { "epoch": 0.47, "learning_rate": 2.862755109428539e-06, "loss": 0.9069, "step": 24914 }, { "epoch": 0.47, "learning_rate": 2.862603959981573e-06, "loss": 0.9127, "step": 24915 }, { "epoch": 0.47, "learning_rate": 2.862452809180655e-06, "loss": 0.9301, "step": 24916 }, { "epoch": 0.47, "learning_rate": 2.8623016570263496e-06, "loss": 0.9202, "step": 24917 }, { "epoch": 0.47, "learning_rate": 2.8621505035192198e-06, "loss": 0.97, "step": 24918 }, { "epoch": 0.47, "learning_rate": 2.8619993486598324e-06, "loss": 1.1152, "step": 24919 }, { "epoch": 0.47, "learning_rate": 2.86184819244875e-06, "loss": 0.7874, "step": 24920 }, { "epoch": 0.47, "learning_rate": 2.861697034886537e-06, "loss": 0.982, "step": 24921 }, { "epoch": 0.47, "learning_rate": 2.861545875973759e-06, "loss": 0.961, "step": 24922 }, { "epoch": 0.47, "learning_rate": 2.8613947157109802e-06, "loss": 0.8346, "step": 24923 }, { "epoch": 0.47, "learning_rate": 2.8612435540987637e-06, "loss": 0.9977, "step": 24924 }, { "epoch": 0.47, "learning_rate": 2.8610923911376755e-06, "loss": 1.1464, "step": 24925 }, { "epoch": 0.47, "learning_rate": 2.8609412268282786e-06, "loss": 0.9543, "step": 24926 }, { "epoch": 0.47, "learning_rate": 2.8607900611711392e-06, "loss": 0.6766, "step": 24927 }, { "epoch": 0.47, "learning_rate": 2.86063889416682e-06, "loss": 0.7997, "step": 24928 }, { "epoch": 0.47, "learning_rate": 2.8604877258158865e-06, "loss": 0.9942, "step": 24929 }, { "epoch": 0.47, "learning_rate": 2.8603365561189027e-06, "loss": 0.9328, "step": 24930 }, { "epoch": 0.47, "learning_rate": 2.8601853850764337e-06, "loss": 1.0107, "step": 24931 }, { "epoch": 0.47, "learning_rate": 2.8600342126890437e-06, "loss": 0.8728, "step": 24932 }, { "epoch": 0.47, "learning_rate": 2.8598830389572963e-06, "loss": 0.9766, "step": 24933 }, { "epoch": 0.47, "learning_rate": 2.8597318638817566e-06, "loss": 0.8384, "step": 24934 }, { "epoch": 0.47, "learning_rate": 2.8595806874629895e-06, "loss": 0.7769, "step": 24935 }, { "epoch": 0.47, "learning_rate": 2.859429509701559e-06, "loss": 0.9132, "step": 24936 }, { "epoch": 0.47, "learning_rate": 2.8592783305980305e-06, "loss": 0.7885, "step": 24937 }, { "epoch": 0.47, "learning_rate": 2.8591271501529664e-06, "loss": 1.1385, "step": 24938 }, { "epoch": 0.47, "learning_rate": 2.858975968366933e-06, "loss": 1.0978, "step": 24939 }, { "epoch": 0.47, "learning_rate": 2.8588247852404956e-06, "loss": 1.0184, "step": 24940 }, { "epoch": 0.47, "learning_rate": 2.8586736007742163e-06, "loss": 0.7814, "step": 24941 }, { "epoch": 0.47, "learning_rate": 2.85852241496866e-06, "loss": 0.8804, "step": 24942 }, { "epoch": 0.47, "learning_rate": 2.8583712278243934e-06, "loss": 1.051, "step": 24943 }, { "epoch": 0.47, "learning_rate": 2.858220039341979e-06, "loss": 1.1293, "step": 24944 }, { "epoch": 0.47, "learning_rate": 2.858068849521982e-06, "loss": 0.8976, "step": 24945 }, { "epoch": 0.47, "learning_rate": 2.857917658364967e-06, "loss": 0.9874, "step": 24946 }, { "epoch": 0.47, "learning_rate": 2.857766465871499e-06, "loss": 0.9243, "step": 24947 }, { "epoch": 0.47, "learning_rate": 2.8576152720421406e-06, "loss": 0.8127, "step": 24948 }, { "epoch": 0.47, "learning_rate": 2.8574640768774587e-06, "loss": 0.8193, "step": 24949 }, { "epoch": 0.47, "learning_rate": 2.8573128803780163e-06, "loss": 1.0325, "step": 24950 }, { "epoch": 0.47, "learning_rate": 2.8571616825443792e-06, "loss": 0.9946, "step": 24951 }, { "epoch": 0.47, "learning_rate": 2.8570104833771113e-06, "loss": 0.7989, "step": 24952 }, { "epoch": 0.47, "learning_rate": 2.8568592828767774e-06, "loss": 1.0585, "step": 24953 }, { "epoch": 0.47, "learning_rate": 2.8567080810439408e-06, "loss": 0.7844, "step": 24954 }, { "epoch": 0.47, "learning_rate": 2.856556877879168e-06, "loss": 0.971, "step": 24955 }, { "epoch": 0.47, "learning_rate": 2.8564056733830224e-06, "loss": 1.0092, "step": 24956 }, { "epoch": 0.47, "learning_rate": 2.856254467556069e-06, "loss": 0.8749, "step": 24957 }, { "epoch": 0.47, "learning_rate": 2.856103260398873e-06, "loss": 0.8227, "step": 24958 }, { "epoch": 0.47, "learning_rate": 2.8559520519119975e-06, "loss": 0.8747, "step": 24959 }, { "epoch": 0.47, "learning_rate": 2.8558008420960084e-06, "loss": 0.9206, "step": 24960 }, { "epoch": 0.47, "learning_rate": 2.8556496309514705e-06, "loss": 0.8009, "step": 24961 }, { "epoch": 0.47, "learning_rate": 2.8554984184789463e-06, "loss": 1.0407, "step": 24962 }, { "epoch": 0.47, "learning_rate": 2.855347204679002e-06, "loss": 0.8864, "step": 24963 }, { "epoch": 0.47, "learning_rate": 2.855195989552203e-06, "loss": 0.8615, "step": 24964 }, { "epoch": 0.47, "learning_rate": 2.8550447730991125e-06, "loss": 1.0265, "step": 24965 }, { "epoch": 0.47, "learning_rate": 2.854893555320296e-06, "loss": 0.896, "step": 24966 }, { "epoch": 0.47, "learning_rate": 2.8547423362163185e-06, "loss": 0.946, "step": 24967 }, { "epoch": 0.47, "learning_rate": 2.854591115787744e-06, "loss": 0.9807, "step": 24968 }, { "epoch": 0.47, "learning_rate": 2.854439894035136e-06, "loss": 1.2396, "step": 24969 }, { "epoch": 0.47, "learning_rate": 2.854288670959061e-06, "loss": 1.0372, "step": 24970 }, { "epoch": 0.47, "learning_rate": 2.8541374465600823e-06, "loss": 0.9493, "step": 24971 }, { "epoch": 0.47, "learning_rate": 2.853986220838765e-06, "loss": 0.9224, "step": 24972 }, { "epoch": 0.47, "learning_rate": 2.8538349937956755e-06, "loss": 0.9659, "step": 24973 }, { "epoch": 0.47, "learning_rate": 2.8536837654313767e-06, "loss": 1.1046, "step": 24974 }, { "epoch": 0.47, "learning_rate": 2.853532535746433e-06, "loss": 1.1517, "step": 24975 }, { "epoch": 0.47, "learning_rate": 2.853381304741409e-06, "loss": 1.1025, "step": 24976 }, { "epoch": 0.47, "learning_rate": 2.8532300724168705e-06, "loss": 0.9128, "step": 24977 }, { "epoch": 0.47, "learning_rate": 2.853078838773382e-06, "loss": 0.7593, "step": 24978 }, { "epoch": 0.47, "learning_rate": 2.8529276038115085e-06, "loss": 0.8423, "step": 24979 }, { "epoch": 0.47, "learning_rate": 2.8527763675318134e-06, "loss": 0.9712, "step": 24980 }, { "epoch": 0.47, "learning_rate": 2.8526251299348622e-06, "loss": 1.1451, "step": 24981 }, { "epoch": 0.47, "learning_rate": 2.8524738910212204e-06, "loss": 0.9566, "step": 24982 }, { "epoch": 0.47, "learning_rate": 2.852322650791451e-06, "loss": 0.8843, "step": 24983 }, { "epoch": 0.47, "learning_rate": 2.852171409246119e-06, "loss": 0.9111, "step": 24984 }, { "epoch": 0.47, "learning_rate": 2.852020166385791e-06, "loss": 0.7572, "step": 24985 }, { "epoch": 0.47, "learning_rate": 2.85186892221103e-06, "loss": 0.8098, "step": 24986 }, { "epoch": 0.47, "learning_rate": 2.8517176767224013e-06, "loss": 1.0779, "step": 24987 }, { "epoch": 0.47, "learning_rate": 2.85156642992047e-06, "loss": 0.9834, "step": 24988 }, { "epoch": 0.47, "learning_rate": 2.8514151818058e-06, "loss": 1.0396, "step": 24989 }, { "epoch": 0.47, "learning_rate": 2.8512639323789563e-06, "loss": 0.8917, "step": 24990 }, { "epoch": 0.47, "learning_rate": 2.8511126816405037e-06, "loss": 0.9616, "step": 24991 }, { "epoch": 0.47, "learning_rate": 2.8509614295910076e-06, "loss": 0.8323, "step": 24992 }, { "epoch": 0.47, "learning_rate": 2.850810176231032e-06, "loss": 1.0787, "step": 24993 }, { "epoch": 0.47, "learning_rate": 2.8506589215611424e-06, "loss": 0.8265, "step": 24994 }, { "epoch": 0.47, "learning_rate": 2.850507665581903e-06, "loss": 1.0386, "step": 24995 }, { "epoch": 0.47, "learning_rate": 2.850356408293878e-06, "loss": 0.8737, "step": 24996 }, { "epoch": 0.47, "learning_rate": 2.850205149697634e-06, "loss": 0.9175, "step": 24997 }, { "epoch": 0.47, "learning_rate": 2.850053889793734e-06, "loss": 0.7861, "step": 24998 }, { "epoch": 0.47, "learning_rate": 2.8499026285827437e-06, "loss": 1.1659, "step": 24999 }, { "epoch": 0.47, "learning_rate": 2.849751366065228e-06, "loss": 1.0026, "step": 25000 }, { "epoch": 0.47, "learning_rate": 2.849600102241751e-06, "loss": 1.0271, "step": 25001 }, { "epoch": 0.47, "learning_rate": 2.849448837112878e-06, "loss": 0.858, "step": 25002 }, { "epoch": 0.47, "learning_rate": 2.849297570679174e-06, "loss": 1.1619, "step": 25003 }, { "epoch": 0.47, "learning_rate": 2.8491463029412035e-06, "loss": 0.8061, "step": 25004 }, { "epoch": 0.47, "learning_rate": 2.848995033899531e-06, "loss": 0.9411, "step": 25005 }, { "epoch": 0.47, "learning_rate": 2.848843763554722e-06, "loss": 1.1204, "step": 25006 }, { "epoch": 0.47, "learning_rate": 2.848692491907341e-06, "loss": 0.9908, "step": 25007 }, { "epoch": 0.47, "learning_rate": 2.848541218957953e-06, "loss": 1.0561, "step": 25008 }, { "epoch": 0.47, "learning_rate": 2.848389944707124e-06, "loss": 0.7674, "step": 25009 }, { "epoch": 0.47, "learning_rate": 2.848238669155416e-06, "loss": 0.8636, "step": 25010 }, { "epoch": 0.47, "learning_rate": 2.8480873923033957e-06, "loss": 0.8124, "step": 25011 }, { "epoch": 0.47, "learning_rate": 2.847936114151628e-06, "loss": 0.9045, "step": 25012 }, { "epoch": 0.47, "learning_rate": 2.8477848347006774e-06, "loss": 1.032, "step": 25013 }, { "epoch": 0.47, "learning_rate": 2.8476335539511093e-06, "loss": 0.9014, "step": 25014 }, { "epoch": 0.47, "learning_rate": 2.8474822719034877e-06, "loss": 0.8683, "step": 25015 }, { "epoch": 0.47, "learning_rate": 2.847330988558378e-06, "loss": 0.8821, "step": 25016 }, { "epoch": 0.47, "learning_rate": 2.847179703916346e-06, "loss": 0.9285, "step": 25017 }, { "epoch": 0.47, "learning_rate": 2.847028417977954e-06, "loss": 0.9886, "step": 25018 }, { "epoch": 0.47, "learning_rate": 2.846877130743769e-06, "loss": 0.8727, "step": 25019 }, { "epoch": 0.47, "learning_rate": 2.8467258422143566e-06, "loss": 0.7804, "step": 25020 }, { "epoch": 0.47, "learning_rate": 2.8465745523902797e-06, "loss": 1.042, "step": 25021 }, { "epoch": 0.47, "learning_rate": 2.846423261272104e-06, "loss": 0.838, "step": 25022 }, { "epoch": 0.47, "learning_rate": 2.8462719688603946e-06, "loss": 0.8879, "step": 25023 }, { "epoch": 0.47, "learning_rate": 2.8461206751557163e-06, "loss": 1.1161, "step": 25024 }, { "epoch": 0.47, "learning_rate": 2.8459693801586343e-06, "loss": 1.1029, "step": 25025 }, { "epoch": 0.47, "learning_rate": 2.8458180838697127e-06, "loss": 0.933, "step": 25026 }, { "epoch": 0.47, "learning_rate": 2.8456667862895164e-06, "loss": 1.0236, "step": 25027 }, { "epoch": 0.47, "learning_rate": 2.845515487418612e-06, "loss": 0.9139, "step": 25028 }, { "epoch": 0.47, "learning_rate": 2.8453641872575633e-06, "loss": 0.9674, "step": 25029 }, { "epoch": 0.47, "learning_rate": 2.845212885806935e-06, "loss": 0.8793, "step": 25030 }, { "epoch": 0.47, "learning_rate": 2.8450615830672923e-06, "loss": 1.2082, "step": 25031 }, { "epoch": 0.47, "learning_rate": 2.8449102790392005e-06, "loss": 1.091, "step": 25032 }, { "epoch": 0.47, "learning_rate": 2.8447589737232234e-06, "loss": 0.8163, "step": 25033 }, { "epoch": 0.47, "learning_rate": 2.8446076671199274e-06, "loss": 0.7651, "step": 25034 }, { "epoch": 0.47, "learning_rate": 2.8444563592298778e-06, "loss": 0.8235, "step": 25035 }, { "epoch": 0.47, "learning_rate": 2.844305050053638e-06, "loss": 0.801, "step": 25036 }, { "epoch": 0.47, "learning_rate": 2.8441537395917735e-06, "loss": 0.9933, "step": 25037 }, { "epoch": 0.47, "learning_rate": 2.8440024278448504e-06, "loss": 1.1414, "step": 25038 }, { "epoch": 0.47, "learning_rate": 2.843851114813431e-06, "loss": 0.9126, "step": 25039 }, { "epoch": 0.47, "learning_rate": 2.843699800498083e-06, "loss": 0.9109, "step": 25040 }, { "epoch": 0.47, "learning_rate": 2.8435484848993716e-06, "loss": 0.8867, "step": 25041 }, { "epoch": 0.47, "learning_rate": 2.8433971680178598e-06, "loss": 0.8442, "step": 25042 }, { "epoch": 0.47, "learning_rate": 2.8432458498541132e-06, "loss": 1.0741, "step": 25043 }, { "epoch": 0.47, "learning_rate": 2.843094530408698e-06, "loss": 1.0037, "step": 25044 }, { "epoch": 0.47, "learning_rate": 2.8429432096821773e-06, "loss": 0.8745, "step": 25045 }, { "epoch": 0.47, "learning_rate": 2.8427918876751175e-06, "loss": 1.0578, "step": 25046 }, { "epoch": 0.47, "learning_rate": 2.8426405643880833e-06, "loss": 0.8235, "step": 25047 }, { "epoch": 0.47, "learning_rate": 2.8424892398216397e-06, "loss": 0.8847, "step": 25048 }, { "epoch": 0.47, "learning_rate": 2.8423379139763517e-06, "loss": 0.8302, "step": 25049 }, { "epoch": 0.47, "learning_rate": 2.8421865868527855e-06, "loss": 1.1071, "step": 25050 }, { "epoch": 0.47, "learning_rate": 2.8420352584515036e-06, "loss": 1.0119, "step": 25051 }, { "epoch": 0.47, "learning_rate": 2.841883928773073e-06, "loss": 0.9368, "step": 25052 }, { "epoch": 0.47, "learning_rate": 2.8417325978180587e-06, "loss": 0.7344, "step": 25053 }, { "epoch": 0.47, "learning_rate": 2.841581265587025e-06, "loss": 0.6852, "step": 25054 }, { "epoch": 0.47, "learning_rate": 2.8414299320805373e-06, "loss": 0.802, "step": 25055 }, { "epoch": 0.47, "learning_rate": 2.8412785972991614e-06, "loss": 1.1562, "step": 25056 }, { "epoch": 0.47, "learning_rate": 2.841127261243461e-06, "loss": 1.0221, "step": 25057 }, { "epoch": 0.47, "learning_rate": 2.8409759239140015e-06, "loss": 1.0228, "step": 25058 }, { "epoch": 0.47, "learning_rate": 2.840824585311349e-06, "loss": 1.0245, "step": 25059 }, { "epoch": 0.47, "learning_rate": 2.8406732454360674e-06, "loss": 0.8405, "step": 25060 }, { "epoch": 0.47, "learning_rate": 2.8405219042887226e-06, "loss": 0.912, "step": 25061 }, { "epoch": 0.47, "learning_rate": 2.84037056186988e-06, "loss": 1.3212, "step": 25062 }, { "epoch": 0.47, "learning_rate": 2.8402192181801037e-06, "loss": 1.1423, "step": 25063 }, { "epoch": 0.47, "learning_rate": 2.840067873219959e-06, "loss": 0.9121, "step": 25064 }, { "epoch": 0.47, "learning_rate": 2.8399165269900127e-06, "loss": 1.1697, "step": 25065 }, { "epoch": 0.47, "learning_rate": 2.839765179490827e-06, "loss": 1.1356, "step": 25066 }, { "epoch": 0.47, "learning_rate": 2.8396138307229687e-06, "loss": 0.791, "step": 25067 }, { "epoch": 0.47, "learning_rate": 2.839462480687003e-06, "loss": 0.9544, "step": 25068 }, { "epoch": 0.47, "learning_rate": 2.8393111293834947e-06, "loss": 1.2214, "step": 25069 }, { "epoch": 0.47, "learning_rate": 2.839159776813009e-06, "loss": 0.7762, "step": 25070 }, { "epoch": 0.47, "learning_rate": 2.8390084229761116e-06, "loss": 0.9103, "step": 25071 }, { "epoch": 0.47, "learning_rate": 2.8388570678733666e-06, "loss": 0.9227, "step": 25072 }, { "epoch": 0.47, "learning_rate": 2.83870571150534e-06, "loss": 0.8172, "step": 25073 }, { "epoch": 0.47, "learning_rate": 2.838554353872596e-06, "loss": 1.0332, "step": 25074 }, { "epoch": 0.47, "learning_rate": 2.8384029949757013e-06, "loss": 0.8943, "step": 25075 }, { "epoch": 0.47, "learning_rate": 2.83825163481522e-06, "loss": 0.9424, "step": 25076 }, { "epoch": 0.47, "learning_rate": 2.838100273391717e-06, "loss": 0.8618, "step": 25077 }, { "epoch": 0.47, "learning_rate": 2.837948910705759e-06, "loss": 0.9173, "step": 25078 }, { "epoch": 0.47, "learning_rate": 2.837797546757909e-06, "loss": 0.712, "step": 25079 }, { "epoch": 0.47, "learning_rate": 2.8376461815487345e-06, "loss": 0.9074, "step": 25080 }, { "epoch": 0.47, "learning_rate": 2.837494815078798e-06, "loss": 1.0358, "step": 25081 }, { "epoch": 0.47, "learning_rate": 2.837343447348667e-06, "loss": 0.9984, "step": 25082 }, { "epoch": 0.47, "learning_rate": 2.8371920783589056e-06, "loss": 0.9935, "step": 25083 }, { "epoch": 0.47, "learning_rate": 2.83704070811008e-06, "loss": 1.0419, "step": 25084 }, { "epoch": 0.47, "learning_rate": 2.836889336602754e-06, "loss": 0.8317, "step": 25085 }, { "epoch": 0.47, "learning_rate": 2.836737963837494e-06, "loss": 1.0031, "step": 25086 }, { "epoch": 0.47, "learning_rate": 2.8365865898148648e-06, "loss": 0.9628, "step": 25087 }, { "epoch": 0.47, "learning_rate": 2.8364352145354312e-06, "loss": 0.7505, "step": 25088 }, { "epoch": 0.47, "learning_rate": 2.8362838379997593e-06, "loss": 0.8278, "step": 25089 }, { "epoch": 0.47, "learning_rate": 2.8361324602084136e-06, "loss": 0.6802, "step": 25090 }, { "epoch": 0.47, "learning_rate": 2.8359810811619594e-06, "loss": 1.0406, "step": 25091 }, { "epoch": 0.47, "learning_rate": 2.8358297008609626e-06, "loss": 0.8389, "step": 25092 }, { "epoch": 0.47, "learning_rate": 2.8356783193059877e-06, "loss": 1.023, "step": 25093 }, { "epoch": 0.47, "learning_rate": 2.8355269364976e-06, "loss": 1.051, "step": 25094 }, { "epoch": 0.47, "learning_rate": 2.8353755524363654e-06, "loss": 0.7312, "step": 25095 }, { "epoch": 0.47, "learning_rate": 2.8352241671228482e-06, "loss": 0.8681, "step": 25096 }, { "epoch": 0.47, "learning_rate": 2.8350727805576146e-06, "loss": 0.6864, "step": 25097 }, { "epoch": 0.47, "learning_rate": 2.83492139274123e-06, "loss": 0.8824, "step": 25098 }, { "epoch": 0.47, "learning_rate": 2.8347700036742586e-06, "loss": 0.854, "step": 25099 }, { "epoch": 0.47, "learning_rate": 2.8346186133572666e-06, "loss": 1.1097, "step": 25100 }, { "epoch": 0.47, "learning_rate": 2.8344672217908193e-06, "loss": 0.8728, "step": 25101 }, { "epoch": 0.47, "learning_rate": 2.8343158289754804e-06, "loss": 0.9055, "step": 25102 }, { "epoch": 0.47, "learning_rate": 2.834164434911817e-06, "loss": 0.9429, "step": 25103 }, { "epoch": 0.47, "learning_rate": 2.8340130396003946e-06, "loss": 1.0424, "step": 25104 }, { "epoch": 0.47, "learning_rate": 2.833861643041777e-06, "loss": 0.8287, "step": 25105 }, { "epoch": 0.47, "learning_rate": 2.8337102452365304e-06, "loss": 1.4061, "step": 25106 }, { "epoch": 0.47, "learning_rate": 2.8335588461852206e-06, "loss": 0.9468, "step": 25107 }, { "epoch": 0.47, "learning_rate": 2.833407445888412e-06, "loss": 0.8284, "step": 25108 }, { "epoch": 0.47, "learning_rate": 2.8332560443466692e-06, "loss": 0.89, "step": 25109 }, { "epoch": 0.47, "learning_rate": 2.8331046415605594e-06, "loss": 0.9503, "step": 25110 }, { "epoch": 0.47, "learning_rate": 2.8329532375306466e-06, "loss": 0.9683, "step": 25111 }, { "epoch": 0.47, "learning_rate": 2.8328018322574973e-06, "loss": 1.0881, "step": 25112 }, { "epoch": 0.47, "learning_rate": 2.8326504257416765e-06, "loss": 0.9367, "step": 25113 }, { "epoch": 0.47, "learning_rate": 2.8324990179837484e-06, "loss": 0.8502, "step": 25114 }, { "epoch": 0.47, "learning_rate": 2.8323476089842793e-06, "loss": 0.8061, "step": 25115 }, { "epoch": 0.47, "learning_rate": 2.832196198743834e-06, "loss": 0.7308, "step": 25116 }, { "epoch": 0.47, "learning_rate": 2.8320447872629784e-06, "loss": 0.8992, "step": 25117 }, { "epoch": 0.47, "learning_rate": 2.8318933745422784e-06, "loss": 0.9686, "step": 25118 }, { "epoch": 0.47, "learning_rate": 2.831741960582299e-06, "loss": 1.0984, "step": 25119 }, { "epoch": 0.47, "learning_rate": 2.8315905453836047e-06, "loss": 0.8556, "step": 25120 }, { "epoch": 0.47, "learning_rate": 2.8314391289467615e-06, "loss": 0.8347, "step": 25121 }, { "epoch": 0.47, "learning_rate": 2.8312877112723345e-06, "loss": 0.7089, "step": 25122 }, { "epoch": 0.47, "learning_rate": 2.8311362923608892e-06, "loss": 1.1467, "step": 25123 }, { "epoch": 0.47, "learning_rate": 2.8309848722129914e-06, "loss": 1.1271, "step": 25124 }, { "epoch": 0.47, "learning_rate": 2.8308334508292068e-06, "loss": 1.0591, "step": 25125 }, { "epoch": 0.47, "learning_rate": 2.8306820282101e-06, "loss": 0.9355, "step": 25126 }, { "epoch": 0.47, "learning_rate": 2.8305306043562357e-06, "loss": 0.9195, "step": 25127 }, { "epoch": 0.47, "learning_rate": 2.8303791792681816e-06, "loss": 0.8013, "step": 25128 }, { "epoch": 0.47, "learning_rate": 2.830227752946501e-06, "loss": 0.8604, "step": 25129 }, { "epoch": 0.47, "learning_rate": 2.83007632539176e-06, "loss": 0.9186, "step": 25130 }, { "epoch": 0.47, "learning_rate": 2.8299248966045243e-06, "loss": 1.1082, "step": 25131 }, { "epoch": 0.47, "learning_rate": 2.829773466585359e-06, "loss": 0.9461, "step": 25132 }, { "epoch": 0.47, "learning_rate": 2.8296220353348304e-06, "loss": 0.9598, "step": 25133 }, { "epoch": 0.47, "learning_rate": 2.829470602853503e-06, "loss": 0.8359, "step": 25134 }, { "epoch": 0.47, "learning_rate": 2.829319169141942e-06, "loss": 0.862, "step": 25135 }, { "epoch": 0.47, "learning_rate": 2.8291677342007134e-06, "loss": 0.7831, "step": 25136 }, { "epoch": 0.47, "learning_rate": 2.8290162980303826e-06, "loss": 1.0198, "step": 25137 }, { "epoch": 0.47, "learning_rate": 2.828864860631515e-06, "loss": 0.9518, "step": 25138 }, { "epoch": 0.47, "learning_rate": 2.8287134220046768e-06, "loss": 0.97, "step": 25139 }, { "epoch": 0.47, "learning_rate": 2.8285619821504325e-06, "loss": 0.9048, "step": 25140 }, { "epoch": 0.47, "learning_rate": 2.828410541069347e-06, "loss": 0.9597, "step": 25141 }, { "epoch": 0.47, "learning_rate": 2.828259098761987e-06, "loss": 0.9011, "step": 25142 }, { "epoch": 0.47, "learning_rate": 2.8281076552289183e-06, "loss": 1.1234, "step": 25143 }, { "epoch": 0.47, "learning_rate": 2.8279562104707043e-06, "loss": 0.9347, "step": 25144 }, { "epoch": 0.47, "learning_rate": 2.827804764487913e-06, "loss": 0.9023, "step": 25145 }, { "epoch": 0.47, "learning_rate": 2.8276533172811082e-06, "loss": 0.8322, "step": 25146 }, { "epoch": 0.47, "learning_rate": 2.827501868850856e-06, "loss": 0.9521, "step": 25147 }, { "epoch": 0.47, "learning_rate": 2.827350419197723e-06, "loss": 0.811, "step": 25148 }, { "epoch": 0.47, "learning_rate": 2.827198968322272e-06, "loss": 1.0042, "step": 25149 }, { "epoch": 0.47, "learning_rate": 2.827047516225071e-06, "loss": 1.1993, "step": 25150 }, { "epoch": 0.47, "learning_rate": 2.826896062906684e-06, "loss": 0.8768, "step": 25151 }, { "epoch": 0.47, "learning_rate": 2.8267446083676775e-06, "loss": 1.0142, "step": 25152 }, { "epoch": 0.47, "learning_rate": 2.8265931526086164e-06, "loss": 0.9037, "step": 25153 }, { "epoch": 0.47, "learning_rate": 2.826441695630067e-06, "loss": 0.9204, "step": 25154 }, { "epoch": 0.47, "learning_rate": 2.826290237432594e-06, "loss": 0.77, "step": 25155 }, { "epoch": 0.47, "learning_rate": 2.826138778016763e-06, "loss": 0.852, "step": 25156 }, { "epoch": 0.47, "learning_rate": 2.82598731738314e-06, "loss": 0.9785, "step": 25157 }, { "epoch": 0.47, "learning_rate": 2.82583585553229e-06, "loss": 0.8647, "step": 25158 }, { "epoch": 0.47, "learning_rate": 2.8256843924647793e-06, "loss": 0.7221, "step": 25159 }, { "epoch": 0.47, "learning_rate": 2.825532928181174e-06, "loss": 0.7986, "step": 25160 }, { "epoch": 0.47, "learning_rate": 2.8253814626820377e-06, "loss": 0.864, "step": 25161 }, { "epoch": 0.47, "learning_rate": 2.8252299959679365e-06, "loss": 1.0564, "step": 25162 }, { "epoch": 0.47, "learning_rate": 2.8250785280394377e-06, "loss": 1.0064, "step": 25163 }, { "epoch": 0.47, "learning_rate": 2.824927058897104e-06, "loss": 0.8614, "step": 25164 }, { "epoch": 0.47, "learning_rate": 2.8247755885415035e-06, "loss": 0.7317, "step": 25165 }, { "epoch": 0.47, "learning_rate": 2.8246241169732013e-06, "loss": 0.6689, "step": 25166 }, { "epoch": 0.47, "learning_rate": 2.8244726441927628e-06, "loss": 0.993, "step": 25167 }, { "epoch": 0.47, "learning_rate": 2.8243211702007525e-06, "loss": 1.0415, "step": 25168 }, { "epoch": 0.47, "learning_rate": 2.8241696949977374e-06, "loss": 1.0276, "step": 25169 }, { "epoch": 0.47, "learning_rate": 2.824018218584283e-06, "loss": 0.9052, "step": 25170 }, { "epoch": 0.47, "learning_rate": 2.8238667409609536e-06, "loss": 1.0269, "step": 25171 }, { "epoch": 0.47, "learning_rate": 2.823715262128316e-06, "loss": 0.8636, "step": 25172 }, { "epoch": 0.47, "learning_rate": 2.8235637820869353e-06, "loss": 0.8579, "step": 25173 }, { "epoch": 0.47, "learning_rate": 2.823412300837378e-06, "loss": 0.859, "step": 25174 }, { "epoch": 0.47, "learning_rate": 2.823260818380209e-06, "loss": 1.149, "step": 25175 }, { "epoch": 0.47, "learning_rate": 2.823109334715994e-06, "loss": 1.0703, "step": 25176 }, { "epoch": 0.48, "learning_rate": 2.822957849845298e-06, "loss": 0.9857, "step": 25177 }, { "epoch": 0.48, "learning_rate": 2.822806363768688e-06, "loss": 0.8984, "step": 25178 }, { "epoch": 0.48, "learning_rate": 2.8226548764867283e-06, "loss": 0.8748, "step": 25179 }, { "epoch": 0.48, "learning_rate": 2.8225033879999857e-06, "loss": 0.8214, "step": 25180 }, { "epoch": 0.48, "learning_rate": 2.822351898309026e-06, "loss": 1.1662, "step": 25181 }, { "epoch": 0.48, "learning_rate": 2.822200407414413e-06, "loss": 1.1809, "step": 25182 }, { "epoch": 0.48, "learning_rate": 2.822048915316714e-06, "loss": 0.9988, "step": 25183 }, { "epoch": 0.48, "learning_rate": 2.8218974220164945e-06, "loss": 0.8009, "step": 25184 }, { "epoch": 0.48, "learning_rate": 2.8217459275143187e-06, "loss": 1.001, "step": 25185 }, { "epoch": 0.48, "learning_rate": 2.8215944318107546e-06, "loss": 0.916, "step": 25186 }, { "epoch": 0.48, "learning_rate": 2.821442934906367e-06, "loss": 0.7861, "step": 25187 }, { "epoch": 0.48, "learning_rate": 2.8212914368017208e-06, "loss": 0.9262, "step": 25188 }, { "epoch": 0.48, "learning_rate": 2.821139937497382e-06, "loss": 0.9241, "step": 25189 }, { "epoch": 0.48, "learning_rate": 2.820988436993917e-06, "loss": 0.8736, "step": 25190 }, { "epoch": 0.48, "learning_rate": 2.8208369352918914e-06, "loss": 0.8571, "step": 25191 }, { "epoch": 0.48, "learning_rate": 2.8206854323918697e-06, "loss": 0.9713, "step": 25192 }, { "epoch": 0.48, "learning_rate": 2.8205339282944182e-06, "loss": 1.0109, "step": 25193 }, { "epoch": 0.48, "learning_rate": 2.820382423000103e-06, "loss": 1.1255, "step": 25194 }, { "epoch": 0.48, "learning_rate": 2.8202309165094904e-06, "loss": 1.0125, "step": 25195 }, { "epoch": 0.48, "learning_rate": 2.8200794088231455e-06, "loss": 0.9557, "step": 25196 }, { "epoch": 0.48, "learning_rate": 2.819927899941633e-06, "loss": 1.0502, "step": 25197 }, { "epoch": 0.48, "learning_rate": 2.8197763898655193e-06, "loss": 0.8004, "step": 25198 }, { "epoch": 0.48, "learning_rate": 2.8196248785953713e-06, "loss": 1.0948, "step": 25199 }, { "epoch": 0.48, "learning_rate": 2.819473366131753e-06, "loss": 1.2287, "step": 25200 }, { "epoch": 0.48, "learning_rate": 2.8193218524752316e-06, "loss": 0.874, "step": 25201 }, { "epoch": 0.48, "learning_rate": 2.8191703376263723e-06, "loss": 0.9662, "step": 25202 }, { "epoch": 0.48, "learning_rate": 2.8190188215857407e-06, "loss": 0.8911, "step": 25203 }, { "epoch": 0.48, "learning_rate": 2.818867304353902e-06, "loss": 0.8589, "step": 25204 }, { "epoch": 0.48, "learning_rate": 2.8187157859314235e-06, "loss": 0.8651, "step": 25205 }, { "epoch": 0.48, "learning_rate": 2.8185642663188683e-06, "loss": 1.1719, "step": 25206 }, { "epoch": 0.48, "learning_rate": 2.8184127455168052e-06, "loss": 1.1151, "step": 25207 }, { "epoch": 0.48, "learning_rate": 2.818261223525799e-06, "loss": 0.9734, "step": 25208 }, { "epoch": 0.48, "learning_rate": 2.8181097003464142e-06, "loss": 0.9572, "step": 25209 }, { "epoch": 0.48, "learning_rate": 2.817958175979218e-06, "loss": 0.9414, "step": 25210 }, { "epoch": 0.48, "learning_rate": 2.8178066504247766e-06, "loss": 0.9161, "step": 25211 }, { "epoch": 0.48, "learning_rate": 2.8176551236836535e-06, "loss": 1.2193, "step": 25212 }, { "epoch": 0.48, "learning_rate": 2.8175035957564162e-06, "loss": 1.2231, "step": 25213 }, { "epoch": 0.48, "learning_rate": 2.8173520666436306e-06, "loss": 0.8172, "step": 25214 }, { "epoch": 0.48, "learning_rate": 2.8172005363458615e-06, "loss": 1.0074, "step": 25215 }, { "epoch": 0.48, "learning_rate": 2.8170490048636756e-06, "loss": 1.0649, "step": 25216 }, { "epoch": 0.48, "learning_rate": 2.8168974721976393e-06, "loss": 0.9051, "step": 25217 }, { "epoch": 0.48, "learning_rate": 2.8167459383483165e-06, "loss": 0.8687, "step": 25218 }, { "epoch": 0.48, "learning_rate": 2.8165944033162745e-06, "loss": 1.2888, "step": 25219 }, { "epoch": 0.48, "learning_rate": 2.816442867102078e-06, "loss": 0.9931, "step": 25220 }, { "epoch": 0.48, "learning_rate": 2.8162913297062944e-06, "loss": 0.7907, "step": 25221 }, { "epoch": 0.48, "learning_rate": 2.8161397911294885e-06, "loss": 0.8676, "step": 25222 }, { "epoch": 0.48, "learning_rate": 2.815988251372227e-06, "loss": 0.8591, "step": 25223 }, { "epoch": 0.48, "learning_rate": 2.8158367104350736e-06, "loss": 1.0519, "step": 25224 }, { "epoch": 0.48, "learning_rate": 2.8156851683185966e-06, "loss": 1.0129, "step": 25225 }, { "epoch": 0.48, "learning_rate": 2.815533625023361e-06, "loss": 0.9473, "step": 25226 }, { "epoch": 0.48, "learning_rate": 2.8153820805499315e-06, "loss": 0.881, "step": 25227 }, { "epoch": 0.48, "learning_rate": 2.815230534898875e-06, "loss": 0.8699, "step": 25228 }, { "epoch": 0.48, "learning_rate": 2.8150789880707586e-06, "loss": 0.9136, "step": 25229 }, { "epoch": 0.48, "learning_rate": 2.8149274400661464e-06, "loss": 0.8034, "step": 25230 }, { "epoch": 0.48, "learning_rate": 2.8147758908856044e-06, "loss": 1.0947, "step": 25231 }, { "epoch": 0.48, "learning_rate": 2.8146243405296996e-06, "loss": 1.0081, "step": 25232 }, { "epoch": 0.48, "learning_rate": 2.8144727889989965e-06, "loss": 0.9067, "step": 25233 }, { "epoch": 0.48, "learning_rate": 2.814321236294062e-06, "loss": 1.1212, "step": 25234 }, { "epoch": 0.48, "learning_rate": 2.814169682415461e-06, "loss": 0.8921, "step": 25235 }, { "epoch": 0.48, "learning_rate": 2.8140181273637607e-06, "loss": 0.9623, "step": 25236 }, { "epoch": 0.48, "learning_rate": 2.8138665711395256e-06, "loss": 1.0796, "step": 25237 }, { "epoch": 0.48, "learning_rate": 2.8137150137433235e-06, "loss": 0.8897, "step": 25238 }, { "epoch": 0.48, "learning_rate": 2.8135634551757184e-06, "loss": 0.8763, "step": 25239 }, { "epoch": 0.48, "learning_rate": 2.813411895437277e-06, "loss": 1.0036, "step": 25240 }, { "epoch": 0.48, "learning_rate": 2.813260334528565e-06, "loss": 0.8546, "step": 25241 }, { "epoch": 0.48, "learning_rate": 2.8131087724501487e-06, "loss": 0.8045, "step": 25242 }, { "epoch": 0.48, "learning_rate": 2.8129572092025943e-06, "loss": 0.8789, "step": 25243 }, { "epoch": 0.48, "learning_rate": 2.8128056447864673e-06, "loss": 1.0464, "step": 25244 }, { "epoch": 0.48, "learning_rate": 2.812654079202333e-06, "loss": 0.9904, "step": 25245 }, { "epoch": 0.48, "learning_rate": 2.8125025124507583e-06, "loss": 0.8607, "step": 25246 }, { "epoch": 0.48, "learning_rate": 2.812350944532309e-06, "loss": 0.6764, "step": 25247 }, { "epoch": 0.48, "learning_rate": 2.81219937544755e-06, "loss": 0.8489, "step": 25248 }, { "epoch": 0.48, "learning_rate": 2.8120478051970483e-06, "loss": 1.0428, "step": 25249 }, { "epoch": 0.48, "learning_rate": 2.8118962337813704e-06, "loss": 1.0809, "step": 25250 }, { "epoch": 0.48, "learning_rate": 2.811744661201081e-06, "loss": 0.8684, "step": 25251 }, { "epoch": 0.48, "learning_rate": 2.811593087456747e-06, "loss": 0.8506, "step": 25252 }, { "epoch": 0.48, "learning_rate": 2.8114415125489342e-06, "loss": 0.6666, "step": 25253 }, { "epoch": 0.48, "learning_rate": 2.8112899364782077e-06, "loss": 0.6629, "step": 25254 }, { "epoch": 0.48, "learning_rate": 2.8111383592451343e-06, "loss": 1.0737, "step": 25255 }, { "epoch": 0.48, "learning_rate": 2.8109867808502794e-06, "loss": 1.2581, "step": 25256 }, { "epoch": 0.48, "learning_rate": 2.8108352012942096e-06, "loss": 0.9494, "step": 25257 }, { "epoch": 0.48, "learning_rate": 2.8106836205774913e-06, "loss": 0.9304, "step": 25258 }, { "epoch": 0.48, "learning_rate": 2.8105320387006898e-06, "loss": 0.8571, "step": 25259 }, { "epoch": 0.48, "learning_rate": 2.8103804556643705e-06, "loss": 0.846, "step": 25260 }, { "epoch": 0.48, "learning_rate": 2.8102288714691e-06, "loss": 1.1245, "step": 25261 }, { "epoch": 0.48, "learning_rate": 2.810077286115445e-06, "loss": 1.1668, "step": 25262 }, { "epoch": 0.48, "learning_rate": 2.809925699603971e-06, "loss": 1.0649, "step": 25263 }, { "epoch": 0.48, "learning_rate": 2.8097741119352438e-06, "loss": 0.9492, "step": 25264 }, { "epoch": 0.48, "learning_rate": 2.8096225231098295e-06, "loss": 0.9604, "step": 25265 }, { "epoch": 0.48, "learning_rate": 2.8094709331282936e-06, "loss": 0.9995, "step": 25266 }, { "epoch": 0.48, "learning_rate": 2.809319341991204e-06, "loss": 0.9902, "step": 25267 }, { "epoch": 0.48, "learning_rate": 2.809167749699125e-06, "loss": 0.9882, "step": 25268 }, { "epoch": 0.48, "learning_rate": 2.809016156252622e-06, "loss": 1.0381, "step": 25269 }, { "epoch": 0.48, "learning_rate": 2.8088645616522632e-06, "loss": 1.0434, "step": 25270 }, { "epoch": 0.48, "learning_rate": 2.8087129658986132e-06, "loss": 0.8049, "step": 25271 }, { "epoch": 0.48, "learning_rate": 2.8085613689922387e-06, "loss": 1.0117, "step": 25272 }, { "epoch": 0.48, "learning_rate": 2.808409770933706e-06, "loss": 0.9414, "step": 25273 }, { "epoch": 0.48, "learning_rate": 2.8082581717235803e-06, "loss": 0.8741, "step": 25274 }, { "epoch": 0.48, "learning_rate": 2.8081065713624273e-06, "loss": 0.9058, "step": 25275 }, { "epoch": 0.48, "learning_rate": 2.8079549698508146e-06, "loss": 0.9732, "step": 25276 }, { "epoch": 0.48, "learning_rate": 2.807803367189307e-06, "loss": 0.9073, "step": 25277 }, { "epoch": 0.48, "learning_rate": 2.807651763378471e-06, "loss": 0.8015, "step": 25278 }, { "epoch": 0.48, "learning_rate": 2.8075001584188736e-06, "loss": 0.7982, "step": 25279 }, { "epoch": 0.48, "learning_rate": 2.8073485523110794e-06, "loss": 0.788, "step": 25280 }, { "epoch": 0.48, "learning_rate": 2.8071969450556554e-06, "loss": 1.1, "step": 25281 }, { "epoch": 0.48, "learning_rate": 2.807045336653167e-06, "loss": 1.145, "step": 25282 }, { "epoch": 0.48, "learning_rate": 2.806893727104181e-06, "loss": 1.0358, "step": 25283 }, { "epoch": 0.48, "learning_rate": 2.8067421164092627e-06, "loss": 0.9778, "step": 25284 }, { "epoch": 0.48, "learning_rate": 2.80659050456898e-06, "loss": 1.0425, "step": 25285 }, { "epoch": 0.48, "learning_rate": 2.8064388915838967e-06, "loss": 1.016, "step": 25286 }, { "epoch": 0.48, "learning_rate": 2.80628727745458e-06, "loss": 1.0568, "step": 25287 }, { "epoch": 0.48, "learning_rate": 2.806135662181597e-06, "loss": 1.099, "step": 25288 }, { "epoch": 0.48, "learning_rate": 2.805984045765512e-06, "loss": 0.7126, "step": 25289 }, { "epoch": 0.48, "learning_rate": 2.805832428206892e-06, "loss": 0.967, "step": 25290 }, { "epoch": 0.48, "learning_rate": 2.805680809506303e-06, "loss": 0.813, "step": 25291 }, { "epoch": 0.48, "learning_rate": 2.805529189664311e-06, "loss": 1.027, "step": 25292 }, { "epoch": 0.48, "learning_rate": 2.8053775686814827e-06, "loss": 0.9548, "step": 25293 }, { "epoch": 0.48, "learning_rate": 2.8052259465583846e-06, "loss": 0.9843, "step": 25294 }, { "epoch": 0.48, "learning_rate": 2.8050743232955812e-06, "loss": 1.0008, "step": 25295 }, { "epoch": 0.48, "learning_rate": 2.80492269889364e-06, "loss": 0.8807, "step": 25296 }, { "epoch": 0.48, "learning_rate": 2.804771073353127e-06, "loss": 0.8521, "step": 25297 }, { "epoch": 0.48, "learning_rate": 2.8046194466746078e-06, "loss": 0.6919, "step": 25298 }, { "epoch": 0.48, "learning_rate": 2.8044678188586487e-06, "loss": 0.9859, "step": 25299 }, { "epoch": 0.48, "learning_rate": 2.8043161899058168e-06, "loss": 1.072, "step": 25300 }, { "epoch": 0.48, "learning_rate": 2.804164559816677e-06, "loss": 0.9556, "step": 25301 }, { "epoch": 0.48, "learning_rate": 2.8040129285917966e-06, "loss": 0.9449, "step": 25302 }, { "epoch": 0.48, "learning_rate": 2.8038612962317408e-06, "loss": 0.9596, "step": 25303 }, { "epoch": 0.48, "learning_rate": 2.8037096627370763e-06, "loss": 0.941, "step": 25304 }, { "epoch": 0.48, "learning_rate": 2.803558028108369e-06, "loss": 0.9948, "step": 25305 }, { "epoch": 0.48, "learning_rate": 2.803406392346186e-06, "loss": 0.961, "step": 25306 }, { "epoch": 0.48, "learning_rate": 2.8032547554510927e-06, "loss": 1.0127, "step": 25307 }, { "epoch": 0.48, "learning_rate": 2.803103117423655e-06, "loss": 1.0464, "step": 25308 }, { "epoch": 0.48, "learning_rate": 2.80295147826444e-06, "loss": 0.6806, "step": 25309 }, { "epoch": 0.48, "learning_rate": 2.8027998379740136e-06, "loss": 0.8951, "step": 25310 }, { "epoch": 0.48, "learning_rate": 2.8026481965529406e-06, "loss": 0.8861, "step": 25311 }, { "epoch": 0.48, "learning_rate": 2.80249655400179e-06, "loss": 1.1394, "step": 25312 }, { "epoch": 0.48, "learning_rate": 2.8023449103211258e-06, "loss": 0.9272, "step": 25313 }, { "epoch": 0.48, "learning_rate": 2.8021932655115152e-06, "loss": 0.9787, "step": 25314 }, { "epoch": 0.48, "learning_rate": 2.8020416195735246e-06, "loss": 0.8425, "step": 25315 }, { "epoch": 0.48, "learning_rate": 2.801889972507719e-06, "loss": 0.9018, "step": 25316 }, { "epoch": 0.48, "learning_rate": 2.8017383243146663e-06, "loss": 1.068, "step": 25317 }, { "epoch": 0.48, "learning_rate": 2.801586674994931e-06, "loss": 1.2015, "step": 25318 }, { "epoch": 0.48, "learning_rate": 2.8014350245490806e-06, "loss": 0.9282, "step": 25319 }, { "epoch": 0.48, "learning_rate": 2.801283372977682e-06, "loss": 0.8845, "step": 25320 }, { "epoch": 0.48, "learning_rate": 2.8011317202812997e-06, "loss": 0.8351, "step": 25321 }, { "epoch": 0.48, "learning_rate": 2.8009800664605007e-06, "loss": 1.022, "step": 25322 }, { "epoch": 0.48, "learning_rate": 2.8008284115158517e-06, "loss": 0.9256, "step": 25323 }, { "epoch": 0.48, "learning_rate": 2.8006767554479184e-06, "loss": 1.201, "step": 25324 }, { "epoch": 0.48, "learning_rate": 2.8005250982572675e-06, "loss": 0.7704, "step": 25325 }, { "epoch": 0.48, "learning_rate": 2.800373439944465e-06, "loss": 1.1123, "step": 25326 }, { "epoch": 0.48, "learning_rate": 2.800221780510078e-06, "loss": 1.0121, "step": 25327 }, { "epoch": 0.48, "learning_rate": 2.8000701199546707e-06, "loss": 0.8278, "step": 25328 }, { "epoch": 0.48, "learning_rate": 2.7999184582788114e-06, "loss": 0.9609, "step": 25329 }, { "epoch": 0.48, "learning_rate": 2.7997667954830665e-06, "loss": 0.8824, "step": 25330 }, { "epoch": 0.48, "learning_rate": 2.799615131568001e-06, "loss": 0.9366, "step": 25331 }, { "epoch": 0.48, "learning_rate": 2.7994634665341808e-06, "loss": 0.9948, "step": 25332 }, { "epoch": 0.48, "learning_rate": 2.7993118003821746e-06, "loss": 1.0168, "step": 25333 }, { "epoch": 0.48, "learning_rate": 2.799160133112547e-06, "loss": 0.8866, "step": 25334 }, { "epoch": 0.48, "learning_rate": 2.799008464725864e-06, "loss": 0.8386, "step": 25335 }, { "epoch": 0.48, "learning_rate": 2.7988567952226935e-06, "loss": 0.7767, "step": 25336 }, { "epoch": 0.48, "learning_rate": 2.7987051246036003e-06, "loss": 1.2653, "step": 25337 }, { "epoch": 0.48, "learning_rate": 2.7985534528691514e-06, "loss": 0.9698, "step": 25338 }, { "epoch": 0.48, "learning_rate": 2.798401780019913e-06, "loss": 0.6745, "step": 25339 }, { "epoch": 0.48, "learning_rate": 2.7982501060564514e-06, "loss": 0.9865, "step": 25340 }, { "epoch": 0.48, "learning_rate": 2.7980984309793335e-06, "loss": 0.698, "step": 25341 }, { "epoch": 0.48, "learning_rate": 2.7979467547891254e-06, "loss": 0.9442, "step": 25342 }, { "epoch": 0.48, "learning_rate": 2.7977950774863925e-06, "loss": 0.8733, "step": 25343 }, { "epoch": 0.48, "learning_rate": 2.7976433990717023e-06, "loss": 1.086, "step": 25344 }, { "epoch": 0.48, "learning_rate": 2.79749171954562e-06, "loss": 0.9266, "step": 25345 }, { "epoch": 0.48, "learning_rate": 2.7973400389087135e-06, "loss": 0.7545, "step": 25346 }, { "epoch": 0.48, "learning_rate": 2.7971883571615483e-06, "loss": 0.6482, "step": 25347 }, { "epoch": 0.48, "learning_rate": 2.7970366743046916e-06, "loss": 0.7677, "step": 25348 }, { "epoch": 0.48, "learning_rate": 2.796884990338708e-06, "loss": 1.2429, "step": 25349 }, { "epoch": 0.48, "learning_rate": 2.7967333052641653e-06, "loss": 1.2607, "step": 25350 }, { "epoch": 0.48, "learning_rate": 2.7965816190816302e-06, "loss": 0.864, "step": 25351 }, { "epoch": 0.48, "learning_rate": 2.7964299317916678e-06, "loss": 0.8962, "step": 25352 }, { "epoch": 0.48, "learning_rate": 2.796278243394844e-06, "loss": 0.9802, "step": 25353 }, { "epoch": 0.48, "learning_rate": 2.796126553891728e-06, "loss": 0.7938, "step": 25354 }, { "epoch": 0.48, "learning_rate": 2.7959748632828844e-06, "loss": 0.8828, "step": 25355 }, { "epoch": 0.48, "learning_rate": 2.795823171568879e-06, "loss": 1.0913, "step": 25356 }, { "epoch": 0.48, "learning_rate": 2.7956714787502796e-06, "loss": 0.8857, "step": 25357 }, { "epoch": 0.48, "learning_rate": 2.7955197848276515e-06, "loss": 0.9894, "step": 25358 }, { "epoch": 0.48, "learning_rate": 2.795368089801562e-06, "loss": 0.9107, "step": 25359 }, { "epoch": 0.48, "learning_rate": 2.7952163936725764e-06, "loss": 0.8211, "step": 25360 }, { "epoch": 0.48, "learning_rate": 2.795064696441262e-06, "loss": 0.9331, "step": 25361 }, { "epoch": 0.48, "learning_rate": 2.7949129981081852e-06, "loss": 1.118, "step": 25362 }, { "epoch": 0.48, "learning_rate": 2.7947612986739133e-06, "loss": 0.9438, "step": 25363 }, { "epoch": 0.48, "learning_rate": 2.79460959813901e-06, "loss": 0.7197, "step": 25364 }, { "epoch": 0.48, "learning_rate": 2.7944578965040446e-06, "loss": 0.9914, "step": 25365 }, { "epoch": 0.48, "learning_rate": 2.794306193769582e-06, "loss": 0.9037, "step": 25366 }, { "epoch": 0.48, "learning_rate": 2.7941544899361894e-06, "loss": 0.873, "step": 25367 }, { "epoch": 0.48, "learning_rate": 2.7940027850044326e-06, "loss": 1.1111, "step": 25368 }, { "epoch": 0.48, "learning_rate": 2.7938510789748793e-06, "loss": 0.9752, "step": 25369 }, { "epoch": 0.48, "learning_rate": 2.7936993718480943e-06, "loss": 0.9799, "step": 25370 }, { "epoch": 0.48, "learning_rate": 2.7935476636246455e-06, "loss": 1.1421, "step": 25371 }, { "epoch": 0.48, "learning_rate": 2.793395954305098e-06, "loss": 0.7811, "step": 25372 }, { "epoch": 0.48, "learning_rate": 2.7932442438900193e-06, "loss": 0.8651, "step": 25373 }, { "epoch": 0.48, "learning_rate": 2.793092532379975e-06, "loss": 1.1558, "step": 25374 }, { "epoch": 0.48, "learning_rate": 2.792940819775533e-06, "loss": 1.0759, "step": 25375 }, { "epoch": 0.48, "learning_rate": 2.792789106077258e-06, "loss": 0.9055, "step": 25376 }, { "epoch": 0.48, "learning_rate": 2.792637391285719e-06, "loss": 0.8119, "step": 25377 }, { "epoch": 0.48, "learning_rate": 2.7924856754014802e-06, "loss": 0.8703, "step": 25378 }, { "epoch": 0.48, "learning_rate": 2.7923339584251086e-06, "loss": 0.742, "step": 25379 }, { "epoch": 0.48, "learning_rate": 2.7921822403571706e-06, "loss": 0.9672, "step": 25380 }, { "epoch": 0.48, "learning_rate": 2.7920305211982334e-06, "loss": 1.1864, "step": 25381 }, { "epoch": 0.48, "learning_rate": 2.7918788009488633e-06, "loss": 0.9748, "step": 25382 }, { "epoch": 0.48, "learning_rate": 2.7917270796096274e-06, "loss": 0.8942, "step": 25383 }, { "epoch": 0.48, "learning_rate": 2.7915753571810905e-06, "loss": 0.861, "step": 25384 }, { "epoch": 0.48, "learning_rate": 2.7914236336638207e-06, "loss": 0.9121, "step": 25385 }, { "epoch": 0.48, "learning_rate": 2.7912719090583838e-06, "loss": 0.9418, "step": 25386 }, { "epoch": 0.48, "learning_rate": 2.7911201833653464e-06, "loss": 1.0522, "step": 25387 }, { "epoch": 0.48, "learning_rate": 2.790968456585275e-06, "loss": 0.845, "step": 25388 }, { "epoch": 0.48, "learning_rate": 2.7908167287187372e-06, "loss": 0.9328, "step": 25389 }, { "epoch": 0.48, "learning_rate": 2.7906649997662976e-06, "loss": 0.9579, "step": 25390 }, { "epoch": 0.48, "learning_rate": 2.790513269728524e-06, "loss": 0.9545, "step": 25391 }, { "epoch": 0.48, "learning_rate": 2.790361538605984e-06, "loss": 0.8378, "step": 25392 }, { "epoch": 0.48, "learning_rate": 2.7902098063992415e-06, "loss": 1.0304, "step": 25393 }, { "epoch": 0.48, "learning_rate": 2.790058073108865e-06, "loss": 1.1107, "step": 25394 }, { "epoch": 0.48, "learning_rate": 2.7899063387354203e-06, "loss": 1.0923, "step": 25395 }, { "epoch": 0.48, "learning_rate": 2.7897546032794744e-06, "loss": 0.9386, "step": 25396 }, { "epoch": 0.48, "learning_rate": 2.789602866741594e-06, "loss": 0.6688, "step": 25397 }, { "epoch": 0.48, "learning_rate": 2.7894511291223452e-06, "loss": 0.9545, "step": 25398 }, { "epoch": 0.48, "learning_rate": 2.7892993904222944e-06, "loss": 1.0722, "step": 25399 }, { "epoch": 0.48, "learning_rate": 2.7891476506420086e-06, "loss": 1.0259, "step": 25400 }, { "epoch": 0.48, "learning_rate": 2.7889959097820547e-06, "loss": 1.1274, "step": 25401 }, { "epoch": 0.48, "learning_rate": 2.7888441678429982e-06, "loss": 0.8534, "step": 25402 }, { "epoch": 0.48, "learning_rate": 2.788692424825407e-06, "loss": 0.8806, "step": 25403 }, { "epoch": 0.48, "learning_rate": 2.7885406807298475e-06, "loss": 0.8538, "step": 25404 }, { "epoch": 0.48, "learning_rate": 2.7883889355568857e-06, "loss": 0.9954, "step": 25405 }, { "epoch": 0.48, "learning_rate": 2.788237189307088e-06, "loss": 1.0953, "step": 25406 }, { "epoch": 0.48, "learning_rate": 2.788085441981022e-06, "loss": 1.0859, "step": 25407 }, { "epoch": 0.48, "learning_rate": 2.7879336935792534e-06, "loss": 0.8931, "step": 25408 }, { "epoch": 0.48, "learning_rate": 2.787781944102349e-06, "loss": 0.7953, "step": 25409 }, { "epoch": 0.48, "learning_rate": 2.7876301935508763e-06, "loss": 0.7863, "step": 25410 }, { "epoch": 0.48, "learning_rate": 2.7874784419254013e-06, "loss": 0.5436, "step": 25411 }, { "epoch": 0.48, "learning_rate": 2.78732668922649e-06, "loss": 0.9746, "step": 25412 }, { "epoch": 0.48, "learning_rate": 2.7871749354547106e-06, "loss": 1.0295, "step": 25413 }, { "epoch": 0.48, "learning_rate": 2.787023180610628e-06, "loss": 0.8256, "step": 25414 }, { "epoch": 0.48, "learning_rate": 2.7868714246948097e-06, "loss": 0.9459, "step": 25415 }, { "epoch": 0.48, "learning_rate": 2.7867196677078225e-06, "loss": 0.8684, "step": 25416 }, { "epoch": 0.48, "learning_rate": 2.7865679096502326e-06, "loss": 0.8395, "step": 25417 }, { "epoch": 0.48, "learning_rate": 2.7864161505226067e-06, "loss": 1.3043, "step": 25418 }, { "epoch": 0.48, "learning_rate": 2.7862643903255128e-06, "loss": 1.1911, "step": 25419 }, { "epoch": 0.48, "learning_rate": 2.7861126290595154e-06, "loss": 0.7553, "step": 25420 }, { "epoch": 0.48, "learning_rate": 2.7859608667251824e-06, "loss": 0.8697, "step": 25421 }, { "epoch": 0.48, "learning_rate": 2.7858091033230806e-06, "loss": 0.8282, "step": 25422 }, { "epoch": 0.48, "learning_rate": 2.7856573388537756e-06, "loss": 0.8106, "step": 25423 }, { "epoch": 0.48, "learning_rate": 2.7855055733178356e-06, "loss": 1.0536, "step": 25424 }, { "epoch": 0.48, "learning_rate": 2.7853538067158263e-06, "loss": 1.0283, "step": 25425 }, { "epoch": 0.48, "learning_rate": 2.7852020390483147e-06, "loss": 0.8362, "step": 25426 }, { "epoch": 0.48, "learning_rate": 2.7850502703158675e-06, "loss": 1.142, "step": 25427 }, { "epoch": 0.48, "learning_rate": 2.784898500519052e-06, "loss": 0.8361, "step": 25428 }, { "epoch": 0.48, "learning_rate": 2.7847467296584324e-06, "loss": 0.7894, "step": 25429 }, { "epoch": 0.48, "learning_rate": 2.784594957734579e-06, "loss": 0.9849, "step": 25430 }, { "epoch": 0.48, "learning_rate": 2.784443184748056e-06, "loss": 0.8617, "step": 25431 }, { "epoch": 0.48, "learning_rate": 2.784291410699431e-06, "loss": 1.1473, "step": 25432 }, { "epoch": 0.48, "learning_rate": 2.7841396355892703e-06, "loss": 0.8487, "step": 25433 }, { "epoch": 0.48, "learning_rate": 2.7839878594181417e-06, "loss": 1.0621, "step": 25434 }, { "epoch": 0.48, "learning_rate": 2.7838360821866104e-06, "loss": 0.811, "step": 25435 }, { "epoch": 0.48, "learning_rate": 2.783684303895244e-06, "loss": 0.9266, "step": 25436 }, { "epoch": 0.48, "learning_rate": 2.7835325245446095e-06, "loss": 1.1347, "step": 25437 }, { "epoch": 0.48, "learning_rate": 2.7833807441352724e-06, "loss": 1.2759, "step": 25438 }, { "epoch": 0.48, "learning_rate": 2.7832289626678005e-06, "loss": 1.0042, "step": 25439 }, { "epoch": 0.48, "learning_rate": 2.7830771801427614e-06, "loss": 0.8658, "step": 25440 }, { "epoch": 0.48, "learning_rate": 2.78292539656072e-06, "loss": 0.8691, "step": 25441 }, { "epoch": 0.48, "learning_rate": 2.782773611922244e-06, "loss": 0.9127, "step": 25442 }, { "epoch": 0.48, "learning_rate": 2.7826218262278993e-06, "loss": 0.8541, "step": 25443 }, { "epoch": 0.48, "learning_rate": 2.7824700394782537e-06, "loss": 1.1724, "step": 25444 }, { "epoch": 0.48, "learning_rate": 2.782318251673874e-06, "loss": 0.9719, "step": 25445 }, { "epoch": 0.48, "learning_rate": 2.782166462815327e-06, "loss": 0.8501, "step": 25446 }, { "epoch": 0.48, "learning_rate": 2.782014672903178e-06, "loss": 0.8279, "step": 25447 }, { "epoch": 0.48, "learning_rate": 2.7818628819379957e-06, "loss": 0.726, "step": 25448 }, { "epoch": 0.48, "learning_rate": 2.7817110899203465e-06, "loss": 1.1405, "step": 25449 }, { "epoch": 0.48, "learning_rate": 2.7815592968507954e-06, "loss": 1.1625, "step": 25450 }, { "epoch": 0.48, "learning_rate": 2.781407502729911e-06, "loss": 1.0031, "step": 25451 }, { "epoch": 0.48, "learning_rate": 2.7812557075582603e-06, "loss": 0.9742, "step": 25452 }, { "epoch": 0.48, "learning_rate": 2.7811039113364087e-06, "loss": 0.877, "step": 25453 }, { "epoch": 0.48, "learning_rate": 2.7809521140649237e-06, "loss": 0.8326, "step": 25454 }, { "epoch": 0.48, "learning_rate": 2.7808003157443727e-06, "loss": 1.1641, "step": 25455 }, { "epoch": 0.48, "learning_rate": 2.780648516375321e-06, "loss": 0.9669, "step": 25456 }, { "epoch": 0.48, "learning_rate": 2.780496715958337e-06, "loss": 0.8423, "step": 25457 }, { "epoch": 0.48, "learning_rate": 2.7803449144939866e-06, "loss": 0.8253, "step": 25458 }, { "epoch": 0.48, "learning_rate": 2.7801931119828367e-06, "loss": 1.0021, "step": 25459 }, { "epoch": 0.48, "learning_rate": 2.7800413084254545e-06, "loss": 0.984, "step": 25460 }, { "epoch": 0.48, "learning_rate": 2.779889503822407e-06, "loss": 0.8328, "step": 25461 }, { "epoch": 0.48, "learning_rate": 2.779737698174261e-06, "loss": 0.9381, "step": 25462 }, { "epoch": 0.48, "learning_rate": 2.779585891481582e-06, "loss": 0.9977, "step": 25463 }, { "epoch": 0.48, "learning_rate": 2.7794340837449385e-06, "loss": 0.9578, "step": 25464 }, { "epoch": 0.48, "learning_rate": 2.7792822749648964e-06, "loss": 0.8131, "step": 25465 }, { "epoch": 0.48, "learning_rate": 2.7791304651420225e-06, "loss": 0.8064, "step": 25466 }, { "epoch": 0.48, "learning_rate": 2.7789786542768848e-06, "loss": 0.6949, "step": 25467 }, { "epoch": 0.48, "learning_rate": 2.7788268423700494e-06, "loss": 1.1204, "step": 25468 }, { "epoch": 0.48, "learning_rate": 2.778675029422082e-06, "loss": 1.0937, "step": 25469 }, { "epoch": 0.48, "learning_rate": 2.778523215433552e-06, "loss": 0.7721, "step": 25470 }, { "epoch": 0.48, "learning_rate": 2.778371400405023e-06, "loss": 0.8791, "step": 25471 }, { "epoch": 0.48, "learning_rate": 2.778219584337065e-06, "loss": 0.9156, "step": 25472 }, { "epoch": 0.48, "learning_rate": 2.778067767230244e-06, "loss": 0.8181, "step": 25473 }, { "epoch": 0.48, "learning_rate": 2.777915949085126e-06, "loss": 0.9794, "step": 25474 }, { "epoch": 0.48, "learning_rate": 2.7777641299022782e-06, "loss": 0.9471, "step": 25475 }, { "epoch": 0.48, "learning_rate": 2.777612309682268e-06, "loss": 0.9954, "step": 25476 }, { "epoch": 0.48, "learning_rate": 2.777460488425662e-06, "loss": 1.063, "step": 25477 }, { "epoch": 0.48, "learning_rate": 2.777308666133026e-06, "loss": 0.7405, "step": 25478 }, { "epoch": 0.48, "learning_rate": 2.7771568428049293e-06, "loss": 0.7838, "step": 25479 }, { "epoch": 0.48, "learning_rate": 2.7770050184419365e-06, "loss": 0.9013, "step": 25480 }, { "epoch": 0.48, "learning_rate": 2.7768531930446157e-06, "loss": 1.1175, "step": 25481 }, { "epoch": 0.48, "learning_rate": 2.7767013666135345e-06, "loss": 1.1035, "step": 25482 }, { "epoch": 0.48, "learning_rate": 2.776549539149258e-06, "loss": 0.7986, "step": 25483 }, { "epoch": 0.48, "learning_rate": 2.7763977106523536e-06, "loss": 0.9214, "step": 25484 }, { "epoch": 0.48, "learning_rate": 2.7762458811233895e-06, "loss": 0.816, "step": 25485 }, { "epoch": 0.48, "learning_rate": 2.7760940505629307e-06, "loss": 0.8469, "step": 25486 }, { "epoch": 0.48, "learning_rate": 2.775942218971547e-06, "loss": 1.0351, "step": 25487 }, { "epoch": 0.48, "learning_rate": 2.775790386349802e-06, "loss": 0.8058, "step": 25488 }, { "epoch": 0.48, "learning_rate": 2.775638552698264e-06, "loss": 0.7807, "step": 25489 }, { "epoch": 0.48, "learning_rate": 2.7754867180175012e-06, "loss": 0.9706, "step": 25490 }, { "epoch": 0.48, "learning_rate": 2.775334882308078e-06, "loss": 0.7444, "step": 25491 }, { "epoch": 0.48, "learning_rate": 2.7751830455705634e-06, "loss": 0.895, "step": 25492 }, { "epoch": 0.48, "learning_rate": 2.775031207805525e-06, "loss": 1.0127, "step": 25493 }, { "epoch": 0.48, "learning_rate": 2.7748793690135275e-06, "loss": 1.0177, "step": 25494 }, { "epoch": 0.48, "learning_rate": 2.7747275291951383e-06, "loss": 0.823, "step": 25495 }, { "epoch": 0.48, "learning_rate": 2.774575688350926e-06, "loss": 0.772, "step": 25496 }, { "epoch": 0.48, "learning_rate": 2.774423846481456e-06, "loss": 0.7767, "step": 25497 }, { "epoch": 0.48, "learning_rate": 2.7742720035872954e-06, "loss": 0.7811, "step": 25498 }, { "epoch": 0.48, "learning_rate": 2.7741201596690123e-06, "loss": 0.9631, "step": 25499 }, { "epoch": 0.48, "learning_rate": 2.773968314727172e-06, "loss": 0.8336, "step": 25500 }, { "epoch": 0.48, "learning_rate": 2.7738164687623424e-06, "loss": 1.0876, "step": 25501 }, { "epoch": 0.48, "learning_rate": 2.7736646217750916e-06, "loss": 0.8135, "step": 25502 }, { "epoch": 0.48, "learning_rate": 2.773512773765985e-06, "loss": 0.991, "step": 25503 }, { "epoch": 0.48, "learning_rate": 2.77336092473559e-06, "loss": 0.7423, "step": 25504 }, { "epoch": 0.48, "learning_rate": 2.773209074684474e-06, "loss": 0.9367, "step": 25505 }, { "epoch": 0.48, "learning_rate": 2.7730572236132033e-06, "loss": 1.1432, "step": 25506 }, { "epoch": 0.48, "learning_rate": 2.7729053715223447e-06, "loss": 0.9654, "step": 25507 }, { "epoch": 0.48, "learning_rate": 2.772753518412467e-06, "loss": 0.8558, "step": 25508 }, { "epoch": 0.48, "learning_rate": 2.772601664284135e-06, "loss": 0.8462, "step": 25509 }, { "epoch": 0.48, "learning_rate": 2.772449809137918e-06, "loss": 0.9213, "step": 25510 }, { "epoch": 0.48, "learning_rate": 2.772297952974381e-06, "loss": 0.8321, "step": 25511 }, { "epoch": 0.48, "learning_rate": 2.7721460957940914e-06, "loss": 1.2341, "step": 25512 }, { "epoch": 0.48, "learning_rate": 2.7719942375976165e-06, "loss": 0.9716, "step": 25513 }, { "epoch": 0.48, "learning_rate": 2.7718423783855246e-06, "loss": 0.9205, "step": 25514 }, { "epoch": 0.48, "learning_rate": 2.771690518158381e-06, "loss": 0.7686, "step": 25515 }, { "epoch": 0.48, "learning_rate": 2.7715386569167536e-06, "loss": 0.9325, "step": 25516 }, { "epoch": 0.48, "learning_rate": 2.7713867946612087e-06, "loss": 0.8431, "step": 25517 }, { "epoch": 0.48, "learning_rate": 2.7712349313923143e-06, "loss": 0.9142, "step": 25518 }, { "epoch": 0.48, "learning_rate": 2.7710830671106366e-06, "loss": 0.9403, "step": 25519 }, { "epoch": 0.48, "learning_rate": 2.7709312018167435e-06, "loss": 0.9592, "step": 25520 }, { "epoch": 0.48, "learning_rate": 2.770779335511201e-06, "loss": 0.9807, "step": 25521 }, { "epoch": 0.48, "learning_rate": 2.7706274681945765e-06, "loss": 1.0112, "step": 25522 }, { "epoch": 0.48, "learning_rate": 2.770475599867438e-06, "loss": 0.8556, "step": 25523 }, { "epoch": 0.48, "learning_rate": 2.770323730530352e-06, "loss": 0.8764, "step": 25524 }, { "epoch": 0.48, "learning_rate": 2.770171860183885e-06, "loss": 0.9435, "step": 25525 }, { "epoch": 0.48, "learning_rate": 2.770019988828605e-06, "loss": 0.9064, "step": 25526 }, { "epoch": 0.48, "learning_rate": 2.769868116465078e-06, "loss": 0.677, "step": 25527 }, { "epoch": 0.48, "learning_rate": 2.7697162430938725e-06, "loss": 0.911, "step": 25528 }, { "epoch": 0.48, "learning_rate": 2.769564368715555e-06, "loss": 0.7623, "step": 25529 }, { "epoch": 0.48, "learning_rate": 2.7694124933306914e-06, "loss": 1.068, "step": 25530 }, { "epoch": 0.48, "learning_rate": 2.7692606169398506e-06, "loss": 1.0866, "step": 25531 }, { "epoch": 0.48, "learning_rate": 2.769108739543599e-06, "loss": 0.8663, "step": 25532 }, { "epoch": 0.48, "learning_rate": 2.768956861142502e-06, "loss": 0.9442, "step": 25533 }, { "epoch": 0.48, "learning_rate": 2.76880498173713e-06, "loss": 0.8995, "step": 25534 }, { "epoch": 0.48, "learning_rate": 2.768653101328048e-06, "loss": 0.9828, "step": 25535 }, { "epoch": 0.48, "learning_rate": 2.768501219915824e-06, "loss": 0.7773, "step": 25536 }, { "epoch": 0.48, "learning_rate": 2.7683493375010238e-06, "loss": 1.098, "step": 25537 }, { "epoch": 0.48, "learning_rate": 2.7681974540842166e-06, "loss": 1.0458, "step": 25538 }, { "epoch": 0.48, "learning_rate": 2.7680455696659674e-06, "loss": 0.9142, "step": 25539 }, { "epoch": 0.48, "learning_rate": 2.767893684246844e-06, "loss": 0.7461, "step": 25540 }, { "epoch": 0.48, "learning_rate": 2.7677417978274145e-06, "loss": 0.9003, "step": 25541 }, { "epoch": 0.48, "learning_rate": 2.767589910408245e-06, "loss": 0.8983, "step": 25542 }, { "epoch": 0.48, "learning_rate": 2.7674380219899026e-06, "loss": 1.1475, "step": 25543 }, { "epoch": 0.48, "learning_rate": 2.7672861325729562e-06, "loss": 0.847, "step": 25544 }, { "epoch": 0.48, "learning_rate": 2.76713424215797e-06, "loss": 0.684, "step": 25545 }, { "epoch": 0.48, "learning_rate": 2.7669823507455136e-06, "loss": 0.8471, "step": 25546 }, { "epoch": 0.48, "learning_rate": 2.7668304583361527e-06, "loss": 1.0349, "step": 25547 }, { "epoch": 0.48, "learning_rate": 2.766678564930456e-06, "loss": 0.9376, "step": 25548 }, { "epoch": 0.48, "learning_rate": 2.7665266705289883e-06, "loss": 1.1404, "step": 25549 }, { "epoch": 0.48, "learning_rate": 2.7663747751323196e-06, "loss": 1.0513, "step": 25550 }, { "epoch": 0.48, "learning_rate": 2.766222878741015e-06, "loss": 0.9406, "step": 25551 }, { "epoch": 0.48, "learning_rate": 2.7660709813556426e-06, "loss": 0.8467, "step": 25552 }, { "epoch": 0.48, "learning_rate": 2.765919082976769e-06, "loss": 0.899, "step": 25553 }, { "epoch": 0.48, "learning_rate": 2.7657671836049614e-06, "loss": 1.0153, "step": 25554 }, { "epoch": 0.48, "learning_rate": 2.7656152832407872e-06, "loss": 0.8729, "step": 25555 }, { "epoch": 0.48, "learning_rate": 2.765463381884815e-06, "loss": 0.9816, "step": 25556 }, { "epoch": 0.48, "learning_rate": 2.7653114795376095e-06, "loss": 0.9489, "step": 25557 }, { "epoch": 0.48, "learning_rate": 2.76515957619974e-06, "loss": 0.8899, "step": 25558 }, { "epoch": 0.48, "learning_rate": 2.765007671871772e-06, "loss": 0.8262, "step": 25559 }, { "epoch": 0.48, "learning_rate": 2.7648557665542736e-06, "loss": 0.8026, "step": 25560 }, { "epoch": 0.48, "learning_rate": 2.764703860247812e-06, "loss": 0.7144, "step": 25561 }, { "epoch": 0.48, "learning_rate": 2.764551952952954e-06, "loss": 1.0941, "step": 25562 }, { "epoch": 0.48, "learning_rate": 2.7644000446702672e-06, "loss": 0.9095, "step": 25563 }, { "epoch": 0.48, "learning_rate": 2.764248135400319e-06, "loss": 0.9399, "step": 25564 }, { "epoch": 0.48, "learning_rate": 2.7640962251436764e-06, "loss": 0.7673, "step": 25565 }, { "epoch": 0.48, "learning_rate": 2.7639443139009064e-06, "loss": 0.8988, "step": 25566 }, { "epoch": 0.48, "learning_rate": 2.7637924016725763e-06, "loss": 1.0878, "step": 25567 }, { "epoch": 0.48, "learning_rate": 2.7636404884592537e-06, "loss": 1.2039, "step": 25568 }, { "epoch": 0.48, "learning_rate": 2.763488574261506e-06, "loss": 1.027, "step": 25569 }, { "epoch": 0.48, "learning_rate": 2.7633366590798993e-06, "loss": 0.9612, "step": 25570 }, { "epoch": 0.48, "learning_rate": 2.7631847429150023e-06, "loss": 0.8501, "step": 25571 }, { "epoch": 0.48, "learning_rate": 2.763032825767381e-06, "loss": 0.9412, "step": 25572 }, { "epoch": 0.48, "learning_rate": 2.762880907637603e-06, "loss": 0.6699, "step": 25573 }, { "epoch": 0.48, "learning_rate": 2.7627289885262365e-06, "loss": 1.0248, "step": 25574 }, { "epoch": 0.48, "learning_rate": 2.762577068433847e-06, "loss": 1.0216, "step": 25575 }, { "epoch": 0.48, "learning_rate": 2.762425147361003e-06, "loss": 1.0238, "step": 25576 }, { "epoch": 0.48, "learning_rate": 2.762273225308273e-06, "loss": 0.9152, "step": 25577 }, { "epoch": 0.48, "learning_rate": 2.762121302276221e-06, "loss": 1.0764, "step": 25578 }, { "epoch": 0.48, "learning_rate": 2.7619693782654174e-06, "loss": 1.0115, "step": 25579 }, { "epoch": 0.48, "learning_rate": 2.7618174532764276e-06, "loss": 0.8216, "step": 25580 }, { "epoch": 0.48, "learning_rate": 2.761665527309819e-06, "loss": 1.0657, "step": 25581 }, { "epoch": 0.48, "learning_rate": 2.7615136003661604e-06, "loss": 1.0887, "step": 25582 }, { "epoch": 0.48, "learning_rate": 2.761361672446017e-06, "loss": 0.785, "step": 25583 }, { "epoch": 0.48, "learning_rate": 2.7612097435499575e-06, "loss": 0.8734, "step": 25584 }, { "epoch": 0.48, "learning_rate": 2.7610578136785487e-06, "loss": 0.9127, "step": 25585 }, { "epoch": 0.48, "learning_rate": 2.7609058828323586e-06, "loss": 0.9892, "step": 25586 }, { "epoch": 0.48, "learning_rate": 2.7607539510119536e-06, "loss": 1.3419, "step": 25587 }, { "epoch": 0.48, "learning_rate": 2.760602018217901e-06, "loss": 1.0779, "step": 25588 }, { "epoch": 0.48, "learning_rate": 2.7604500844507688e-06, "loss": 0.8009, "step": 25589 }, { "epoch": 0.48, "learning_rate": 2.7602981497111236e-06, "loss": 0.6776, "step": 25590 }, { "epoch": 0.48, "learning_rate": 2.7601462139995335e-06, "loss": 0.7775, "step": 25591 }, { "epoch": 0.48, "learning_rate": 2.7599942773165656e-06, "loss": 0.8643, "step": 25592 }, { "epoch": 0.48, "learning_rate": 2.7598423396627865e-06, "loss": 1.0181, "step": 25593 }, { "epoch": 0.48, "learning_rate": 2.7596904010387643e-06, "loss": 1.1351, "step": 25594 }, { "epoch": 0.48, "learning_rate": 2.7595384614450663e-06, "loss": 0.892, "step": 25595 }, { "epoch": 0.48, "learning_rate": 2.759386520882259e-06, "loss": 0.6892, "step": 25596 }, { "epoch": 0.48, "learning_rate": 2.7592345793509113e-06, "loss": 1.0618, "step": 25597 }, { "epoch": 0.48, "learning_rate": 2.7590826368515892e-06, "loss": 0.9347, "step": 25598 }, { "epoch": 0.48, "learning_rate": 2.7589306933848602e-06, "loss": 0.9482, "step": 25599 }, { "epoch": 0.48, "learning_rate": 2.7587787489512923e-06, "loss": 1.1283, "step": 25600 }, { "epoch": 0.48, "learning_rate": 2.758626803551453e-06, "loss": 0.9758, "step": 25601 }, { "epoch": 0.48, "learning_rate": 2.758474857185908e-06, "loss": 0.928, "step": 25602 }, { "epoch": 0.48, "learning_rate": 2.7583229098552266e-06, "loss": 0.9484, "step": 25603 }, { "epoch": 0.48, "learning_rate": 2.758170961559975e-06, "loss": 0.8111, "step": 25604 }, { "epoch": 0.48, "learning_rate": 2.7580190123007213e-06, "loss": 0.7613, "step": 25605 }, { "epoch": 0.48, "learning_rate": 2.7578670620780325e-06, "loss": 1.1533, "step": 25606 }, { "epoch": 0.48, "learning_rate": 2.7577151108924753e-06, "loss": 0.9526, "step": 25607 }, { "epoch": 0.48, "learning_rate": 2.7575631587446182e-06, "loss": 0.9429, "step": 25608 }, { "epoch": 0.48, "learning_rate": 2.757411205635028e-06, "loss": 0.9434, "step": 25609 }, { "epoch": 0.48, "learning_rate": 2.7572592515642725e-06, "loss": 0.9918, "step": 25610 }, { "epoch": 0.48, "learning_rate": 2.757107296532919e-06, "loss": 0.8829, "step": 25611 }, { "epoch": 0.48, "learning_rate": 2.756955340541535e-06, "loss": 1.0051, "step": 25612 }, { "epoch": 0.48, "learning_rate": 2.7568033835906866e-06, "loss": 1.0102, "step": 25613 }, { "epoch": 0.48, "learning_rate": 2.756651425680943e-06, "loss": 1.0264, "step": 25614 }, { "epoch": 0.48, "learning_rate": 2.756499466812871e-06, "loss": 0.8324, "step": 25615 }, { "epoch": 0.48, "learning_rate": 2.7563475069870377e-06, "loss": 0.9448, "step": 25616 }, { "epoch": 0.48, "learning_rate": 2.7561955462040097e-06, "loss": 0.6436, "step": 25617 }, { "epoch": 0.48, "learning_rate": 2.7560435844643563e-06, "loss": 0.9063, "step": 25618 }, { "epoch": 0.48, "learning_rate": 2.7558916217686436e-06, "loss": 0.9968, "step": 25619 }, { "epoch": 0.48, "learning_rate": 2.75573965811744e-06, "loss": 0.9334, "step": 25620 }, { "epoch": 0.48, "learning_rate": 2.7555876935113124e-06, "loss": 0.9804, "step": 25621 }, { "epoch": 0.48, "learning_rate": 2.7554357279508275e-06, "loss": 0.8549, "step": 25622 }, { "epoch": 0.48, "learning_rate": 2.755283761436554e-06, "loss": 0.7422, "step": 25623 }, { "epoch": 0.48, "learning_rate": 2.7551317939690588e-06, "loss": 1.035, "step": 25624 }, { "epoch": 0.48, "learning_rate": 2.7549798255489085e-06, "loss": 1.0368, "step": 25625 }, { "epoch": 0.48, "learning_rate": 2.7548278561766717e-06, "loss": 0.9486, "step": 25626 }, { "epoch": 0.48, "learning_rate": 2.754675885852916e-06, "loss": 0.8115, "step": 25627 }, { "epoch": 0.48, "learning_rate": 2.754523914578208e-06, "loss": 0.7459, "step": 25628 }, { "epoch": 0.48, "learning_rate": 2.7543719423531157e-06, "loss": 0.7782, "step": 25629 }, { "epoch": 0.48, "learning_rate": 2.754219969178206e-06, "loss": 0.9871, "step": 25630 }, { "epoch": 0.48, "learning_rate": 2.7540679950540467e-06, "loss": 1.0435, "step": 25631 }, { "epoch": 0.48, "learning_rate": 2.7539160199812053e-06, "loss": 0.867, "step": 25632 }, { "epoch": 0.48, "learning_rate": 2.7537640439602502e-06, "loss": 0.855, "step": 25633 }, { "epoch": 0.48, "learning_rate": 2.753612066991747e-06, "loss": 0.8513, "step": 25634 }, { "epoch": 0.48, "learning_rate": 2.7534600890762647e-06, "loss": 0.8796, "step": 25635 }, { "epoch": 0.48, "learning_rate": 2.75330811021437e-06, "loss": 0.9674, "step": 25636 }, { "epoch": 0.48, "learning_rate": 2.7531561304066305e-06, "loss": 1.1868, "step": 25637 }, { "epoch": 0.48, "learning_rate": 2.7530041496536132e-06, "loss": 1.0818, "step": 25638 }, { "epoch": 0.48, "learning_rate": 2.7528521679558866e-06, "loss": 0.9498, "step": 25639 }, { "epoch": 0.48, "learning_rate": 2.752700185314018e-06, "loss": 0.9667, "step": 25640 }, { "epoch": 0.48, "learning_rate": 2.7525482017285743e-06, "loss": 0.9064, "step": 25641 }, { "epoch": 0.48, "learning_rate": 2.752396217200124e-06, "loss": 0.9087, "step": 25642 }, { "epoch": 0.48, "learning_rate": 2.7522442317292337e-06, "loss": 1.0088, "step": 25643 }, { "epoch": 0.48, "learning_rate": 2.7520922453164706e-06, "loss": 0.7993, "step": 25644 }, { "epoch": 0.48, "learning_rate": 2.751940257962403e-06, "loss": 0.9055, "step": 25645 }, { "epoch": 0.48, "learning_rate": 2.7517882696675985e-06, "loss": 0.8973, "step": 25646 }, { "epoch": 0.48, "learning_rate": 2.751636280432624e-06, "loss": 0.9883, "step": 25647 }, { "epoch": 0.48, "learning_rate": 2.751484290258048e-06, "loss": 0.908, "step": 25648 }, { "epoch": 0.48, "learning_rate": 2.751332299144437e-06, "loss": 1.225, "step": 25649 }, { "epoch": 0.48, "learning_rate": 2.7511803070923586e-06, "loss": 1.0815, "step": 25650 }, { "epoch": 0.48, "learning_rate": 2.751028314102381e-06, "loss": 0.8582, "step": 25651 }, { "epoch": 0.48, "learning_rate": 2.750876320175071e-06, "loss": 1.0334, "step": 25652 }, { "epoch": 0.48, "learning_rate": 2.750724325310997e-06, "loss": 1.0311, "step": 25653 }, { "epoch": 0.48, "learning_rate": 2.7505723295107256e-06, "loss": 0.9858, "step": 25654 }, { "epoch": 0.48, "learning_rate": 2.7504203327748247e-06, "loss": 0.9905, "step": 25655 }, { "epoch": 0.48, "learning_rate": 2.750268335103862e-06, "loss": 1.2752, "step": 25656 }, { "epoch": 0.48, "learning_rate": 2.750116336498406e-06, "loss": 0.9253, "step": 25657 }, { "epoch": 0.48, "learning_rate": 2.7499643369590223e-06, "loss": 0.7863, "step": 25658 }, { "epoch": 0.48, "learning_rate": 2.7498123364862793e-06, "loss": 0.8569, "step": 25659 }, { "epoch": 0.48, "learning_rate": 2.7496603350807454e-06, "loss": 0.8695, "step": 25660 }, { "epoch": 0.48, "learning_rate": 2.749508332742987e-06, "loss": 0.8975, "step": 25661 }, { "epoch": 0.48, "learning_rate": 2.749356329473572e-06, "loss": 0.9554, "step": 25662 }, { "epoch": 0.48, "learning_rate": 2.749204325273069e-06, "loss": 0.955, "step": 25663 }, { "epoch": 0.48, "learning_rate": 2.749052320142044e-06, "loss": 0.9165, "step": 25664 }, { "epoch": 0.48, "learning_rate": 2.748900314081065e-06, "loss": 0.915, "step": 25665 }, { "epoch": 0.48, "learning_rate": 2.7487483070907e-06, "loss": 0.8711, "step": 25666 }, { "epoch": 0.48, "learning_rate": 2.7485962991715166e-06, "loss": 0.8951, "step": 25667 }, { "epoch": 0.48, "learning_rate": 2.748444290324082e-06, "loss": 1.0581, "step": 25668 }, { "epoch": 0.48, "learning_rate": 2.748292280548965e-06, "loss": 0.9501, "step": 25669 }, { "epoch": 0.48, "learning_rate": 2.7481402698467313e-06, "loss": 0.8717, "step": 25670 }, { "epoch": 0.48, "learning_rate": 2.7479882582179494e-06, "loss": 0.7558, "step": 25671 }, { "epoch": 0.48, "learning_rate": 2.7478362456631873e-06, "loss": 0.8879, "step": 25672 }, { "epoch": 0.48, "learning_rate": 2.747684232183012e-06, "loss": 0.8319, "step": 25673 }, { "epoch": 0.48, "learning_rate": 2.7475322177779915e-06, "loss": 0.7948, "step": 25674 }, { "epoch": 0.48, "learning_rate": 2.747380202448694e-06, "loss": 1.2737, "step": 25675 }, { "epoch": 0.48, "learning_rate": 2.7472281861956855e-06, "loss": 1.0717, "step": 25676 }, { "epoch": 0.48, "learning_rate": 2.7470761690195345e-06, "loss": 1.0395, "step": 25677 }, { "epoch": 0.48, "learning_rate": 2.74692415092081e-06, "loss": 0.9651, "step": 25678 }, { "epoch": 0.48, "learning_rate": 2.7467721319000766e-06, "loss": 0.8813, "step": 25679 }, { "epoch": 0.48, "learning_rate": 2.746620111957904e-06, "loss": 0.7152, "step": 25680 }, { "epoch": 0.48, "learning_rate": 2.74646809109486e-06, "loss": 1.1969, "step": 25681 }, { "epoch": 0.48, "learning_rate": 2.7463160693115116e-06, "loss": 1.0468, "step": 25682 }, { "epoch": 0.48, "learning_rate": 2.746164046608426e-06, "loss": 0.9868, "step": 25683 }, { "epoch": 0.48, "learning_rate": 2.7460120229861723e-06, "loss": 0.9286, "step": 25684 }, { "epoch": 0.48, "learning_rate": 2.7458599984453168e-06, "loss": 0.7728, "step": 25685 }, { "epoch": 0.48, "learning_rate": 2.7457079729864274e-06, "loss": 0.7287, "step": 25686 }, { "epoch": 0.48, "learning_rate": 2.7455559466100718e-06, "loss": 1.0316, "step": 25687 }, { "epoch": 0.48, "learning_rate": 2.745403919316818e-06, "loss": 1.0401, "step": 25688 }, { "epoch": 0.48, "learning_rate": 2.7452518911072334e-06, "loss": 0.843, "step": 25689 }, { "epoch": 0.48, "learning_rate": 2.7450998619818865e-06, "loss": 0.8315, "step": 25690 }, { "epoch": 0.48, "learning_rate": 2.7449478319413434e-06, "loss": 0.8517, "step": 25691 }, { "epoch": 0.48, "learning_rate": 2.744795800986173e-06, "loss": 0.824, "step": 25692 }, { "epoch": 0.48, "learning_rate": 2.7446437691169424e-06, "loss": 0.9456, "step": 25693 }, { "epoch": 0.48, "learning_rate": 2.7444917363342195e-06, "loss": 1.2267, "step": 25694 }, { "epoch": 0.48, "learning_rate": 2.744339702638572e-06, "loss": 1.1424, "step": 25695 }, { "epoch": 0.48, "learning_rate": 2.744187668030568e-06, "loss": 0.9799, "step": 25696 }, { "epoch": 0.48, "learning_rate": 2.7440356325107744e-06, "loss": 1.0177, "step": 25697 }, { "epoch": 0.48, "learning_rate": 2.743883596079759e-06, "loss": 0.8599, "step": 25698 }, { "epoch": 0.48, "learning_rate": 2.74373155873809e-06, "loss": 0.9102, "step": 25699 }, { "epoch": 0.48, "learning_rate": 2.7435795204863347e-06, "loss": 1.2736, "step": 25700 }, { "epoch": 0.48, "learning_rate": 2.74342748132506e-06, "loss": 0.9394, "step": 25701 }, { "epoch": 0.48, "learning_rate": 2.7432754412548364e-06, "loss": 0.8154, "step": 25702 }, { "epoch": 0.48, "learning_rate": 2.7431234002762287e-06, "loss": 0.9176, "step": 25703 }, { "epoch": 0.48, "learning_rate": 2.7429713583898053e-06, "loss": 1.0166, "step": 25704 }, { "epoch": 0.48, "learning_rate": 2.742819315596135e-06, "loss": 0.8021, "step": 25705 }, { "epoch": 0.48, "learning_rate": 2.7426672718957848e-06, "loss": 0.9924, "step": 25706 }, { "epoch": 0.49, "learning_rate": 2.7425152272893226e-06, "loss": 0.9294, "step": 25707 }, { "epoch": 0.49, "learning_rate": 2.7423631817773157e-06, "loss": 0.7318, "step": 25708 }, { "epoch": 0.49, "learning_rate": 2.7422111353603317e-06, "loss": 0.9666, "step": 25709 }, { "epoch": 0.49, "learning_rate": 2.7420590880389387e-06, "loss": 0.9536, "step": 25710 }, { "epoch": 0.49, "learning_rate": 2.7419070398137053e-06, "loss": 0.7851, "step": 25711 }, { "epoch": 0.49, "learning_rate": 2.741754990685198e-06, "loss": 0.9596, "step": 25712 }, { "epoch": 0.49, "learning_rate": 2.741602940653985e-06, "loss": 0.8848, "step": 25713 }, { "epoch": 0.49, "learning_rate": 2.7414508897206336e-06, "loss": 0.9318, "step": 25714 }, { "epoch": 0.49, "learning_rate": 2.7412988378857125e-06, "loss": 0.8844, "step": 25715 }, { "epoch": 0.49, "learning_rate": 2.7411467851497886e-06, "loss": 0.8238, "step": 25716 }, { "epoch": 0.49, "learning_rate": 2.7409947315134313e-06, "loss": 1.0087, "step": 25717 }, { "epoch": 0.49, "learning_rate": 2.7408426769772057e-06, "loss": 0.9967, "step": 25718 }, { "epoch": 0.49, "learning_rate": 2.740690621541681e-06, "loss": 1.1194, "step": 25719 }, { "epoch": 0.49, "learning_rate": 2.7405385652074255e-06, "loss": 0.8933, "step": 25720 }, { "epoch": 0.49, "learning_rate": 2.740386507975006e-06, "loss": 0.8536, "step": 25721 }, { "epoch": 0.49, "learning_rate": 2.7402344498449907e-06, "loss": 0.9282, "step": 25722 }, { "epoch": 0.49, "learning_rate": 2.7400823908179468e-06, "loss": 0.9927, "step": 25723 }, { "epoch": 0.49, "learning_rate": 2.739930330894443e-06, "loss": 0.9159, "step": 25724 }, { "epoch": 0.49, "learning_rate": 2.7397782700750473e-06, "loss": 0.8163, "step": 25725 }, { "epoch": 0.49, "learning_rate": 2.7396262083603263e-06, "loss": 0.7372, "step": 25726 }, { "epoch": 0.49, "learning_rate": 2.7394741457508484e-06, "loss": 0.7408, "step": 25727 }, { "epoch": 0.49, "learning_rate": 2.7393220822471816e-06, "loss": 0.9862, "step": 25728 }, { "epoch": 0.49, "learning_rate": 2.7391700178498933e-06, "loss": 1.0573, "step": 25729 }, { "epoch": 0.49, "learning_rate": 2.739017952559551e-06, "loss": 0.8493, "step": 25730 }, { "epoch": 0.49, "learning_rate": 2.738865886376724e-06, "loss": 0.9635, "step": 25731 }, { "epoch": 0.49, "learning_rate": 2.7387138193019787e-06, "loss": 1.0536, "step": 25732 }, { "epoch": 0.49, "learning_rate": 2.738561751335883e-06, "loss": 1.0865, "step": 25733 }, { "epoch": 0.49, "learning_rate": 2.7384096824790057e-06, "loss": 1.006, "step": 25734 }, { "epoch": 0.49, "learning_rate": 2.738257612731913e-06, "loss": 0.8913, "step": 25735 }, { "epoch": 0.49, "learning_rate": 2.738105542095174e-06, "loss": 0.851, "step": 25736 }, { "epoch": 0.49, "learning_rate": 2.737953470569357e-06, "loss": 0.9289, "step": 25737 }, { "epoch": 0.49, "learning_rate": 2.7378013981550283e-06, "loss": 1.046, "step": 25738 }, { "epoch": 0.49, "learning_rate": 2.7376493248527564e-06, "loss": 0.9763, "step": 25739 }, { "epoch": 0.49, "learning_rate": 2.7374972506631104e-06, "loss": 0.9011, "step": 25740 }, { "epoch": 0.49, "learning_rate": 2.7373451755866556e-06, "loss": 0.7353, "step": 25741 }, { "epoch": 0.49, "learning_rate": 2.7371930996239616e-06, "loss": 0.8434, "step": 25742 }, { "epoch": 0.49, "learning_rate": 2.7370410227755956e-06, "loss": 0.9995, "step": 25743 }, { "epoch": 0.49, "learning_rate": 2.7368889450421255e-06, "loss": 0.9299, "step": 25744 }, { "epoch": 0.49, "learning_rate": 2.73673686642412e-06, "loss": 0.9137, "step": 25745 }, { "epoch": 0.49, "learning_rate": 2.7365847869221464e-06, "loss": 0.9351, "step": 25746 }, { "epoch": 0.49, "learning_rate": 2.736432706536772e-06, "loss": 0.8799, "step": 25747 }, { "epoch": 0.49, "learning_rate": 2.7362806252685652e-06, "loss": 0.8431, "step": 25748 }, { "epoch": 0.49, "learning_rate": 2.7361285431180936e-06, "loss": 1.1652, "step": 25749 }, { "epoch": 0.49, "learning_rate": 2.735976460085925e-06, "loss": 1.0969, "step": 25750 }, { "epoch": 0.49, "learning_rate": 2.7358243761726283e-06, "loss": 0.9911, "step": 25751 }, { "epoch": 0.49, "learning_rate": 2.735672291378771e-06, "loss": 0.8414, "step": 25752 }, { "epoch": 0.49, "learning_rate": 2.7355202057049197e-06, "loss": 0.835, "step": 25753 }, { "epoch": 0.49, "learning_rate": 2.735368119151643e-06, "loss": 1.1512, "step": 25754 }, { "epoch": 0.49, "learning_rate": 2.73521603171951e-06, "loss": 0.8797, "step": 25755 }, { "epoch": 0.49, "learning_rate": 2.735063943409086e-06, "loss": 1.0562, "step": 25756 }, { "epoch": 0.49, "learning_rate": 2.734911854220941e-06, "loss": 1.0679, "step": 25757 }, { "epoch": 0.49, "learning_rate": 2.7347597641556434e-06, "loss": 0.9454, "step": 25758 }, { "epoch": 0.49, "learning_rate": 2.7346076732137596e-06, "loss": 0.9764, "step": 25759 }, { "epoch": 0.49, "learning_rate": 2.7344555813958574e-06, "loss": 0.8018, "step": 25760 }, { "epoch": 0.49, "learning_rate": 2.7343034887025056e-06, "loss": 0.7883, "step": 25761 }, { "epoch": 0.49, "learning_rate": 2.7341513951342716e-06, "loss": 0.9929, "step": 25762 }, { "epoch": 0.49, "learning_rate": 2.7339993006917235e-06, "loss": 0.9341, "step": 25763 }, { "epoch": 0.49, "learning_rate": 2.7338472053754287e-06, "loss": 1.0267, "step": 25764 }, { "epoch": 0.49, "learning_rate": 2.7336951091859565e-06, "loss": 0.8271, "step": 25765 }, { "epoch": 0.49, "learning_rate": 2.733543012123873e-06, "loss": 1.0497, "step": 25766 }, { "epoch": 0.49, "learning_rate": 2.7333909141897487e-06, "loss": 0.8549, "step": 25767 }, { "epoch": 0.49, "learning_rate": 2.7332388153841483e-06, "loss": 0.9218, "step": 25768 }, { "epoch": 0.49, "learning_rate": 2.7330867157076417e-06, "loss": 1.1486, "step": 25769 }, { "epoch": 0.49, "learning_rate": 2.7329346151607965e-06, "loss": 1.0169, "step": 25770 }, { "epoch": 0.49, "learning_rate": 2.7327825137441806e-06, "loss": 0.7569, "step": 25771 }, { "epoch": 0.49, "learning_rate": 2.732630411458362e-06, "loss": 0.7836, "step": 25772 }, { "epoch": 0.49, "learning_rate": 2.7324783083039084e-06, "loss": 0.7737, "step": 25773 }, { "epoch": 0.49, "learning_rate": 2.7323262042813884e-06, "loss": 0.8152, "step": 25774 }, { "epoch": 0.49, "learning_rate": 2.732174099391369e-06, "loss": 1.1545, "step": 25775 }, { "epoch": 0.49, "learning_rate": 2.7320219936344187e-06, "loss": 0.6772, "step": 25776 }, { "epoch": 0.49, "learning_rate": 2.7318698870111056e-06, "loss": 0.9499, "step": 25777 }, { "epoch": 0.49, "learning_rate": 2.7317177795219966e-06, "loss": 0.8207, "step": 25778 }, { "epoch": 0.49, "learning_rate": 2.731565671167662e-06, "loss": 0.9776, "step": 25779 }, { "epoch": 0.49, "learning_rate": 2.7314135619486678e-06, "loss": 0.9089, "step": 25780 }, { "epoch": 0.49, "learning_rate": 2.7312614518655817e-06, "loss": 1.1494, "step": 25781 }, { "epoch": 0.49, "learning_rate": 2.731109340918973e-06, "loss": 0.9778, "step": 25782 }, { "epoch": 0.49, "learning_rate": 2.7309572291094095e-06, "loss": 0.8122, "step": 25783 }, { "epoch": 0.49, "learning_rate": 2.730805116437457e-06, "loss": 0.9302, "step": 25784 }, { "epoch": 0.49, "learning_rate": 2.7306530029036875e-06, "loss": 0.8354, "step": 25785 }, { "epoch": 0.49, "learning_rate": 2.730500888508666e-06, "loss": 0.9369, "step": 25786 }, { "epoch": 0.49, "learning_rate": 2.7303487732529606e-06, "loss": 0.9678, "step": 25787 }, { "epoch": 0.49, "learning_rate": 2.7301966571371407e-06, "loss": 0.9104, "step": 25788 }, { "epoch": 0.49, "learning_rate": 2.730044540161773e-06, "loss": 0.8827, "step": 25789 }, { "epoch": 0.49, "learning_rate": 2.7298924223274267e-06, "loss": 1.0208, "step": 25790 }, { "epoch": 0.49, "learning_rate": 2.7297403036346687e-06, "loss": 0.7141, "step": 25791 }, { "epoch": 0.49, "learning_rate": 2.729588184084067e-06, "loss": 0.9687, "step": 25792 }, { "epoch": 0.49, "learning_rate": 2.7294360636761908e-06, "loss": 1.1013, "step": 25793 }, { "epoch": 0.49, "learning_rate": 2.7292839424116075e-06, "loss": 0.9471, "step": 25794 }, { "epoch": 0.49, "learning_rate": 2.7291318202908847e-06, "loss": 0.9423, "step": 25795 }, { "epoch": 0.49, "learning_rate": 2.7289796973145906e-06, "loss": 1.0768, "step": 25796 }, { "epoch": 0.49, "learning_rate": 2.7288275734832933e-06, "loss": 0.9827, "step": 25797 }, { "epoch": 0.49, "learning_rate": 2.7286754487975604e-06, "loss": 0.7897, "step": 25798 }, { "epoch": 0.49, "learning_rate": 2.7285233232579607e-06, "loss": 1.0238, "step": 25799 }, { "epoch": 0.49, "learning_rate": 2.7283711968650626e-06, "loss": 1.0154, "step": 25800 }, { "epoch": 0.49, "learning_rate": 2.7282190696194327e-06, "loss": 0.8842, "step": 25801 }, { "epoch": 0.49, "learning_rate": 2.7280669415216398e-06, "loss": 0.8317, "step": 25802 }, { "epoch": 0.49, "learning_rate": 2.727914812572253e-06, "loss": 0.9972, "step": 25803 }, { "epoch": 0.49, "learning_rate": 2.7277626827718383e-06, "loss": 0.8931, "step": 25804 }, { "epoch": 0.49, "learning_rate": 2.7276105521209645e-06, "loss": 1.0444, "step": 25805 }, { "epoch": 0.49, "learning_rate": 2.7274584206202006e-06, "loss": 1.2744, "step": 25806 }, { "epoch": 0.49, "learning_rate": 2.7273062882701134e-06, "loss": 0.9942, "step": 25807 }, { "epoch": 0.49, "learning_rate": 2.7271541550712716e-06, "loss": 1.0164, "step": 25808 }, { "epoch": 0.49, "learning_rate": 2.7270020210242437e-06, "loss": 0.7393, "step": 25809 }, { "epoch": 0.49, "learning_rate": 2.7268498861295967e-06, "loss": 0.9474, "step": 25810 }, { "epoch": 0.49, "learning_rate": 2.726697750387899e-06, "loss": 0.8595, "step": 25811 }, { "epoch": 0.49, "learning_rate": 2.726545613799719e-06, "loss": 1.0825, "step": 25812 }, { "epoch": 0.49, "learning_rate": 2.7263934763656246e-06, "loss": 1.1986, "step": 25813 }, { "epoch": 0.49, "learning_rate": 2.726241338086184e-06, "loss": 0.7489, "step": 25814 }, { "epoch": 0.49, "learning_rate": 2.726089198961965e-06, "loss": 0.888, "step": 25815 }, { "epoch": 0.49, "learning_rate": 2.725937058993536e-06, "loss": 1.011, "step": 25816 }, { "epoch": 0.49, "learning_rate": 2.7257849181814653e-06, "loss": 0.9091, "step": 25817 }, { "epoch": 0.49, "learning_rate": 2.72563277652632e-06, "loss": 1.0797, "step": 25818 }, { "epoch": 0.49, "learning_rate": 2.7254806340286694e-06, "loss": 0.9641, "step": 25819 }, { "epoch": 0.49, "learning_rate": 2.725328490689081e-06, "loss": 0.9463, "step": 25820 }, { "epoch": 0.49, "learning_rate": 2.7251763465081225e-06, "loss": 0.8589, "step": 25821 }, { "epoch": 0.49, "learning_rate": 2.725024201486363e-06, "loss": 0.7733, "step": 25822 }, { "epoch": 0.49, "learning_rate": 2.7248720556243695e-06, "loss": 0.8557, "step": 25823 }, { "epoch": 0.49, "learning_rate": 2.7247199089227113e-06, "loss": 0.9968, "step": 25824 }, { "epoch": 0.49, "learning_rate": 2.7245677613819555e-06, "loss": 0.9481, "step": 25825 }, { "epoch": 0.49, "learning_rate": 2.7244156130026693e-06, "loss": 0.719, "step": 25826 }, { "epoch": 0.49, "learning_rate": 2.7242634637854236e-06, "loss": 1.0773, "step": 25827 }, { "epoch": 0.49, "learning_rate": 2.7241113137307846e-06, "loss": 0.9808, "step": 25828 }, { "epoch": 0.49, "learning_rate": 2.7239591628393207e-06, "loss": 0.8918, "step": 25829 }, { "epoch": 0.49, "learning_rate": 2.723807011111601e-06, "loss": 0.976, "step": 25830 }, { "epoch": 0.49, "learning_rate": 2.723654858548192e-06, "loss": 0.9576, "step": 25831 }, { "epoch": 0.49, "learning_rate": 2.7235027051496625e-06, "loss": 0.9926, "step": 25832 }, { "epoch": 0.49, "learning_rate": 2.7233505509165807e-06, "loss": 0.8868, "step": 25833 }, { "epoch": 0.49, "learning_rate": 2.723198395849515e-06, "loss": 1.051, "step": 25834 }, { "epoch": 0.49, "learning_rate": 2.7230462399490332e-06, "loss": 0.777, "step": 25835 }, { "epoch": 0.49, "learning_rate": 2.722894083215704e-06, "loss": 0.8163, "step": 25836 }, { "epoch": 0.49, "learning_rate": 2.7227419256500954e-06, "loss": 1.1193, "step": 25837 }, { "epoch": 0.49, "learning_rate": 2.722589767252775e-06, "loss": 0.8955, "step": 25838 }, { "epoch": 0.49, "learning_rate": 2.7224376080243103e-06, "loss": 0.9149, "step": 25839 }, { "epoch": 0.49, "learning_rate": 2.722285447965271e-06, "loss": 0.8361, "step": 25840 }, { "epoch": 0.49, "learning_rate": 2.7221332870762252e-06, "loss": 0.9106, "step": 25841 }, { "epoch": 0.49, "learning_rate": 2.72198112535774e-06, "loss": 0.9634, "step": 25842 }, { "epoch": 0.49, "learning_rate": 2.7218289628103837e-06, "loss": 1.0536, "step": 25843 }, { "epoch": 0.49, "learning_rate": 2.721676799434726e-06, "loss": 0.9048, "step": 25844 }, { "epoch": 0.49, "learning_rate": 2.721524635231333e-06, "loss": 0.8176, "step": 25845 }, { "epoch": 0.49, "learning_rate": 2.7213724702007737e-06, "loss": 1.1766, "step": 25846 }, { "epoch": 0.49, "learning_rate": 2.721220304343617e-06, "loss": 0.9305, "step": 25847 }, { "epoch": 0.49, "learning_rate": 2.72106813766043e-06, "loss": 0.8669, "step": 25848 }, { "epoch": 0.49, "learning_rate": 2.7209159701517813e-06, "loss": 0.8762, "step": 25849 }, { "epoch": 0.49, "learning_rate": 2.72076380181824e-06, "loss": 1.0987, "step": 25850 }, { "epoch": 0.49, "learning_rate": 2.720611632660373e-06, "loss": 0.9345, "step": 25851 }, { "epoch": 0.49, "learning_rate": 2.7204594626787484e-06, "loss": 0.7801, "step": 25852 }, { "epoch": 0.49, "learning_rate": 2.720307291873935e-06, "loss": 1.0829, "step": 25853 }, { "epoch": 0.49, "learning_rate": 2.720155120246501e-06, "loss": 0.8906, "step": 25854 }, { "epoch": 0.49, "learning_rate": 2.720002947797015e-06, "loss": 1.0726, "step": 25855 }, { "epoch": 0.49, "learning_rate": 2.7198507745260442e-06, "loss": 1.1835, "step": 25856 }, { "epoch": 0.49, "learning_rate": 2.719698600434158e-06, "loss": 0.9636, "step": 25857 }, { "epoch": 0.49, "learning_rate": 2.719546425521923e-06, "loss": 0.8183, "step": 25858 }, { "epoch": 0.49, "learning_rate": 2.7193942497899094e-06, "loss": 0.9231, "step": 25859 }, { "epoch": 0.49, "learning_rate": 2.719242073238684e-06, "loss": 0.8857, "step": 25860 }, { "epoch": 0.49, "learning_rate": 2.719089895868815e-06, "loss": 0.8908, "step": 25861 }, { "epoch": 0.49, "learning_rate": 2.7189377176808716e-06, "loss": 0.9329, "step": 25862 }, { "epoch": 0.49, "learning_rate": 2.7187855386754215e-06, "loss": 1.0391, "step": 25863 }, { "epoch": 0.49, "learning_rate": 2.7186333588530323e-06, "loss": 0.5641, "step": 25864 }, { "epoch": 0.49, "learning_rate": 2.7184811782142735e-06, "loss": 0.9206, "step": 25865 }, { "epoch": 0.49, "learning_rate": 2.7183289967597128e-06, "loss": 0.856, "step": 25866 }, { "epoch": 0.49, "learning_rate": 2.718176814489917e-06, "loss": 0.7758, "step": 25867 }, { "epoch": 0.49, "learning_rate": 2.718024631405457e-06, "loss": 0.8781, "step": 25868 }, { "epoch": 0.49, "learning_rate": 2.717872447506899e-06, "loss": 1.0726, "step": 25869 }, { "epoch": 0.49, "learning_rate": 2.7177202627948124e-06, "loss": 0.8632, "step": 25870 }, { "epoch": 0.49, "learning_rate": 2.7175680772697653e-06, "loss": 0.9571, "step": 25871 }, { "epoch": 0.49, "learning_rate": 2.717415890932325e-06, "loss": 0.807, "step": 25872 }, { "epoch": 0.49, "learning_rate": 2.7172637037830607e-06, "loss": 0.9456, "step": 25873 }, { "epoch": 0.49, "learning_rate": 2.7171115158225403e-06, "loss": 1.0441, "step": 25874 }, { "epoch": 0.49, "learning_rate": 2.716959327051332e-06, "loss": 1.202, "step": 25875 }, { "epoch": 0.49, "learning_rate": 2.7168071374700045e-06, "loss": 1.1751, "step": 25876 }, { "epoch": 0.49, "learning_rate": 2.716654947079126e-06, "loss": 0.8812, "step": 25877 }, { "epoch": 0.49, "learning_rate": 2.7165027558792643e-06, "loss": 0.8549, "step": 25878 }, { "epoch": 0.49, "learning_rate": 2.7163505638709873e-06, "loss": 0.8655, "step": 25879 }, { "epoch": 0.49, "learning_rate": 2.7161983710548658e-06, "loss": 0.9197, "step": 25880 }, { "epoch": 0.49, "learning_rate": 2.7160461774314638e-06, "loss": 1.1914, "step": 25881 }, { "epoch": 0.49, "learning_rate": 2.715893983001353e-06, "loss": 1.1851, "step": 25882 }, { "epoch": 0.49, "learning_rate": 2.7157417877651017e-06, "loss": 0.8855, "step": 25883 }, { "epoch": 0.49, "learning_rate": 2.7155895917232763e-06, "loss": 0.7911, "step": 25884 }, { "epoch": 0.49, "learning_rate": 2.7154373948764455e-06, "loss": 1.0483, "step": 25885 }, { "epoch": 0.49, "learning_rate": 2.715285197225179e-06, "loss": 0.9531, "step": 25886 }, { "epoch": 0.49, "learning_rate": 2.715132998770044e-06, "loss": 1.2201, "step": 25887 }, { "epoch": 0.49, "learning_rate": 2.714980799511609e-06, "loss": 1.0996, "step": 25888 }, { "epoch": 0.49, "learning_rate": 2.714828599450442e-06, "loss": 0.8211, "step": 25889 }, { "epoch": 0.49, "learning_rate": 2.714676398587111e-06, "loss": 0.8769, "step": 25890 }, { "epoch": 0.49, "learning_rate": 2.7145241969221856e-06, "loss": 0.9328, "step": 25891 }, { "epoch": 0.49, "learning_rate": 2.714371994456234e-06, "loss": 0.801, "step": 25892 }, { "epoch": 0.49, "learning_rate": 2.714219791189823e-06, "loss": 0.9978, "step": 25893 }, { "epoch": 0.49, "learning_rate": 2.7140675871235222e-06, "loss": 0.9209, "step": 25894 }, { "epoch": 0.49, "learning_rate": 2.7139153822578996e-06, "loss": 0.998, "step": 25895 }, { "epoch": 0.49, "learning_rate": 2.7137631765935236e-06, "loss": 0.8427, "step": 25896 }, { "epoch": 0.49, "learning_rate": 2.7136109701309622e-06, "loss": 0.9021, "step": 25897 }, { "epoch": 0.49, "learning_rate": 2.7134587628707842e-06, "loss": 0.6829, "step": 25898 }, { "epoch": 0.49, "learning_rate": 2.713306554813558e-06, "loss": 0.9157, "step": 25899 }, { "epoch": 0.49, "learning_rate": 2.713154345959851e-06, "loss": 1.1824, "step": 25900 }, { "epoch": 0.49, "learning_rate": 2.7130021363102333e-06, "loss": 0.9613, "step": 25901 }, { "epoch": 0.49, "learning_rate": 2.7128499258652702e-06, "loss": 0.8585, "step": 25902 }, { "epoch": 0.49, "learning_rate": 2.7126977146255333e-06, "loss": 0.9, "step": 25903 }, { "epoch": 0.49, "learning_rate": 2.71254550259159e-06, "loss": 0.881, "step": 25904 }, { "epoch": 0.49, "learning_rate": 2.712393289764008e-06, "loss": 1.1079, "step": 25905 }, { "epoch": 0.49, "learning_rate": 2.7122410761433552e-06, "loss": 1.1713, "step": 25906 }, { "epoch": 0.49, "learning_rate": 2.712088861730202e-06, "loss": 0.9104, "step": 25907 }, { "epoch": 0.49, "learning_rate": 2.711936646525115e-06, "loss": 0.8017, "step": 25908 }, { "epoch": 0.49, "learning_rate": 2.711784430528663e-06, "loss": 0.9212, "step": 25909 }, { "epoch": 0.49, "learning_rate": 2.711632213741414e-06, "loss": 0.956, "step": 25910 }, { "epoch": 0.49, "learning_rate": 2.711479996163937e-06, "loss": 0.7362, "step": 25911 }, { "epoch": 0.49, "learning_rate": 2.7113277777968e-06, "loss": 0.7845, "step": 25912 }, { "epoch": 0.49, "learning_rate": 2.7111755586405725e-06, "loss": 1.0694, "step": 25913 }, { "epoch": 0.49, "learning_rate": 2.711023338695821e-06, "loss": 0.8066, "step": 25914 }, { "epoch": 0.49, "learning_rate": 2.7108711179631153e-06, "loss": 0.7946, "step": 25915 }, { "epoch": 0.49, "learning_rate": 2.7107188964430233e-06, "loss": 0.7973, "step": 25916 }, { "epoch": 0.49, "learning_rate": 2.710566674136113e-06, "loss": 0.9481, "step": 25917 }, { "epoch": 0.49, "learning_rate": 2.710414451042953e-06, "loss": 0.947, "step": 25918 }, { "epoch": 0.49, "learning_rate": 2.710262227164113e-06, "loss": 0.9312, "step": 25919 }, { "epoch": 0.49, "learning_rate": 2.7101100025001596e-06, "loss": 0.9604, "step": 25920 }, { "epoch": 0.49, "learning_rate": 2.7099577770516617e-06, "loss": 0.9439, "step": 25921 }, { "epoch": 0.49, "learning_rate": 2.7098055508191887e-06, "loss": 0.8145, "step": 25922 }, { "epoch": 0.49, "learning_rate": 2.709653323803307e-06, "loss": 0.8398, "step": 25923 }, { "epoch": 0.49, "learning_rate": 2.709501096004587e-06, "loss": 0.9915, "step": 25924 }, { "epoch": 0.49, "learning_rate": 2.709348867423596e-06, "loss": 1.4153, "step": 25925 }, { "epoch": 0.49, "learning_rate": 2.709196638060903e-06, "loss": 0.8916, "step": 25926 }, { "epoch": 0.49, "learning_rate": 2.7090444079170763e-06, "loss": 0.9149, "step": 25927 }, { "epoch": 0.49, "learning_rate": 2.7088921769926845e-06, "loss": 0.9229, "step": 25928 }, { "epoch": 0.49, "learning_rate": 2.7087399452882952e-06, "loss": 0.903, "step": 25929 }, { "epoch": 0.49, "learning_rate": 2.708587712804477e-06, "loss": 0.7514, "step": 25930 }, { "epoch": 0.49, "learning_rate": 2.708435479541799e-06, "loss": 0.8453, "step": 25931 }, { "epoch": 0.49, "learning_rate": 2.708283245500829e-06, "loss": 1.0432, "step": 25932 }, { "epoch": 0.49, "learning_rate": 2.7081310106821364e-06, "loss": 0.7195, "step": 25933 }, { "epoch": 0.49, "learning_rate": 2.707978775086289e-06, "loss": 0.869, "step": 25934 }, { "epoch": 0.49, "learning_rate": 2.707826538713855e-06, "loss": 0.969, "step": 25935 }, { "epoch": 0.49, "learning_rate": 2.7076743015654023e-06, "loss": 0.9415, "step": 25936 }, { "epoch": 0.49, "learning_rate": 2.7075220636415013e-06, "loss": 1.0641, "step": 25937 }, { "epoch": 0.49, "learning_rate": 2.7073698249427184e-06, "loss": 0.919, "step": 25938 }, { "epoch": 0.49, "learning_rate": 2.7072175854696233e-06, "loss": 0.947, "step": 25939 }, { "epoch": 0.49, "learning_rate": 2.707065345222784e-06, "loss": 1.0555, "step": 25940 }, { "epoch": 0.49, "learning_rate": 2.7069131042027695e-06, "loss": 0.924, "step": 25941 }, { "epoch": 0.49, "learning_rate": 2.706760862410147e-06, "loss": 0.7272, "step": 25942 }, { "epoch": 0.49, "learning_rate": 2.7066086198454868e-06, "loss": 1.1577, "step": 25943 }, { "epoch": 0.49, "learning_rate": 2.7064563765093556e-06, "loss": 0.986, "step": 25944 }, { "epoch": 0.49, "learning_rate": 2.7063041324023224e-06, "loss": 0.8146, "step": 25945 }, { "epoch": 0.49, "learning_rate": 2.7061518875249564e-06, "loss": 0.9417, "step": 25946 }, { "epoch": 0.49, "learning_rate": 2.7059996418778254e-06, "loss": 0.9312, "step": 25947 }, { "epoch": 0.49, "learning_rate": 2.7058473954614984e-06, "loss": 0.7377, "step": 25948 }, { "epoch": 0.49, "learning_rate": 2.7056951482765435e-06, "loss": 0.8262, "step": 25949 }, { "epoch": 0.49, "learning_rate": 2.705542900323529e-06, "loss": 0.9924, "step": 25950 }, { "epoch": 0.49, "learning_rate": 2.7053906516030235e-06, "loss": 0.8903, "step": 25951 }, { "epoch": 0.49, "learning_rate": 2.705238402115596e-06, "loss": 1.1499, "step": 25952 }, { "epoch": 0.49, "learning_rate": 2.7050861518618137e-06, "loss": 0.8628, "step": 25953 }, { "epoch": 0.49, "learning_rate": 2.704933900842247e-06, "loss": 0.8159, "step": 25954 }, { "epoch": 0.49, "learning_rate": 2.704781649057463e-06, "loss": 1.0645, "step": 25955 }, { "epoch": 0.49, "learning_rate": 2.7046293965080307e-06, "loss": 1.2326, "step": 25956 }, { "epoch": 0.49, "learning_rate": 2.7044771431945185e-06, "loss": 1.0248, "step": 25957 }, { "epoch": 0.49, "learning_rate": 2.7043248891174945e-06, "loss": 0.9064, "step": 25958 }, { "epoch": 0.49, "learning_rate": 2.7041726342775277e-06, "loss": 0.9883, "step": 25959 }, { "epoch": 0.49, "learning_rate": 2.704020378675187e-06, "loss": 0.8649, "step": 25960 }, { "epoch": 0.49, "learning_rate": 2.70386812231104e-06, "loss": 1.0539, "step": 25961 }, { "epoch": 0.49, "learning_rate": 2.7037158651856564e-06, "loss": 0.9872, "step": 25962 }, { "epoch": 0.49, "learning_rate": 2.703563607299604e-06, "loss": 1.2555, "step": 25963 }, { "epoch": 0.49, "learning_rate": 2.7034113486534507e-06, "loss": 1.0317, "step": 25964 }, { "epoch": 0.49, "learning_rate": 2.703259089247765e-06, "loss": 0.7585, "step": 25965 }, { "epoch": 0.49, "learning_rate": 2.7031068290831173e-06, "loss": 0.8571, "step": 25966 }, { "epoch": 0.49, "learning_rate": 2.7029545681600746e-06, "loss": 0.9981, "step": 25967 }, { "epoch": 0.49, "learning_rate": 2.702802306479206e-06, "loss": 1.0258, "step": 25968 }, { "epoch": 0.49, "learning_rate": 2.70265004404108e-06, "loss": 1.0775, "step": 25969 }, { "epoch": 0.49, "learning_rate": 2.702497780846264e-06, "loss": 0.7602, "step": 25970 }, { "epoch": 0.49, "learning_rate": 2.7023455168953277e-06, "loss": 1.0085, "step": 25971 }, { "epoch": 0.49, "learning_rate": 2.70219325218884e-06, "loss": 0.7274, "step": 25972 }, { "epoch": 0.49, "learning_rate": 2.7020409867273683e-06, "loss": 0.8632, "step": 25973 }, { "epoch": 0.49, "learning_rate": 2.7018887205114818e-06, "loss": 1.0828, "step": 25974 }, { "epoch": 0.49, "learning_rate": 2.70173645354175e-06, "loss": 1.1594, "step": 25975 }, { "epoch": 0.49, "learning_rate": 2.7015841858187397e-06, "loss": 0.8034, "step": 25976 }, { "epoch": 0.49, "learning_rate": 2.7014319173430205e-06, "loss": 0.8108, "step": 25977 }, { "epoch": 0.49, "learning_rate": 2.70127964811516e-06, "loss": 0.8568, "step": 25978 }, { "epoch": 0.49, "learning_rate": 2.701127378135728e-06, "loss": 0.786, "step": 25979 }, { "epoch": 0.49, "learning_rate": 2.700975107405292e-06, "loss": 0.8526, "step": 25980 }, { "epoch": 0.49, "learning_rate": 2.700822835924422e-06, "loss": 1.0505, "step": 25981 }, { "epoch": 0.49, "learning_rate": 2.700670563693685e-06, "loss": 0.946, "step": 25982 }, { "epoch": 0.49, "learning_rate": 2.7005182907136505e-06, "loss": 0.9447, "step": 25983 }, { "epoch": 0.49, "learning_rate": 2.700366016984888e-06, "loss": 0.8608, "step": 25984 }, { "epoch": 0.49, "learning_rate": 2.700213742507963e-06, "loss": 0.9356, "step": 25985 }, { "epoch": 0.49, "learning_rate": 2.7000614672834463e-06, "loss": 0.894, "step": 25986 }, { "epoch": 0.49, "learning_rate": 2.6999091913119074e-06, "loss": 0.9893, "step": 25987 }, { "epoch": 0.49, "learning_rate": 2.699756914593913e-06, "loss": 0.9324, "step": 25988 }, { "epoch": 0.49, "learning_rate": 2.699604637130032e-06, "loss": 0.881, "step": 25989 }, { "epoch": 0.49, "learning_rate": 2.699452358920835e-06, "loss": 0.8945, "step": 25990 }, { "epoch": 0.49, "learning_rate": 2.6993000799668874e-06, "loss": 0.78, "step": 25991 }, { "epoch": 0.49, "learning_rate": 2.69914780026876e-06, "loss": 0.8363, "step": 25992 }, { "epoch": 0.49, "learning_rate": 2.698995519827021e-06, "loss": 1.0353, "step": 25993 }, { "epoch": 0.49, "learning_rate": 2.698843238642238e-06, "loss": 0.9406, "step": 25994 }, { "epoch": 0.49, "learning_rate": 2.698690956714981e-06, "loss": 0.9623, "step": 25995 }, { "epoch": 0.49, "learning_rate": 2.6985386740458185e-06, "loss": 0.864, "step": 25996 }, { "epoch": 0.49, "learning_rate": 2.698386390635318e-06, "loss": 0.9482, "step": 25997 }, { "epoch": 0.49, "learning_rate": 2.698234106484049e-06, "loss": 0.8802, "step": 25998 }, { "epoch": 0.49, "learning_rate": 2.6980818215925797e-06, "loss": 1.2873, "step": 25999 }, { "epoch": 0.49, "learning_rate": 2.6979295359614795e-06, "loss": 1.3266, "step": 26000 }, { "epoch": 0.49, "learning_rate": 2.6977772495913156e-06, "loss": 0.988, "step": 26001 }, { "epoch": 0.49, "learning_rate": 2.6976249624826588e-06, "loss": 0.9457, "step": 26002 }, { "epoch": 0.49, "learning_rate": 2.6974726746360758e-06, "loss": 1.0104, "step": 26003 }, { "epoch": 0.49, "learning_rate": 2.6973203860521358e-06, "loss": 0.8409, "step": 26004 }, { "epoch": 0.49, "learning_rate": 2.697168096731408e-06, "loss": 0.8501, "step": 26005 }, { "epoch": 0.49, "learning_rate": 2.69701580667446e-06, "loss": 0.9181, "step": 26006 }, { "epoch": 0.49, "learning_rate": 2.6968635158818603e-06, "loss": 1.0407, "step": 26007 }, { "epoch": 0.49, "learning_rate": 2.696711224354179e-06, "loss": 0.7779, "step": 26008 }, { "epoch": 0.49, "learning_rate": 2.6965589320919842e-06, "loss": 0.8852, "step": 26009 }, { "epoch": 0.49, "learning_rate": 2.6964066390958445e-06, "loss": 0.8388, "step": 26010 }, { "epoch": 0.49, "learning_rate": 2.696254345366329e-06, "loss": 1.0775, "step": 26011 }, { "epoch": 0.49, "learning_rate": 2.6961020509040047e-06, "loss": 0.8893, "step": 26012 }, { "epoch": 0.49, "learning_rate": 2.695949755709442e-06, "loss": 0.979, "step": 26013 }, { "epoch": 0.49, "learning_rate": 2.695797459783208e-06, "loss": 0.9285, "step": 26014 }, { "epoch": 0.49, "learning_rate": 2.695645163125873e-06, "loss": 0.9194, "step": 26015 }, { "epoch": 0.49, "learning_rate": 2.6954928657380047e-06, "loss": 0.6837, "step": 26016 }, { "epoch": 0.49, "learning_rate": 2.6953405676201727e-06, "loss": 0.8439, "step": 26017 }, { "epoch": 0.49, "learning_rate": 2.695188268772944e-06, "loss": 1.1193, "step": 26018 }, { "epoch": 0.49, "learning_rate": 2.695035969196889e-06, "loss": 0.9861, "step": 26019 }, { "epoch": 0.49, "learning_rate": 2.6948836688925757e-06, "loss": 0.7802, "step": 26020 }, { "epoch": 0.49, "learning_rate": 2.6947313678605725e-06, "loss": 0.7462, "step": 26021 }, { "epoch": 0.49, "learning_rate": 2.694579066101448e-06, "loss": 0.8908, "step": 26022 }, { "epoch": 0.49, "learning_rate": 2.6944267636157724e-06, "loss": 0.927, "step": 26023 }, { "epoch": 0.49, "learning_rate": 2.694274460404112e-06, "loss": 1.1298, "step": 26024 }, { "epoch": 0.49, "learning_rate": 2.694122156467037e-06, "loss": 0.8862, "step": 26025 }, { "epoch": 0.49, "learning_rate": 2.6939698518051166e-06, "loss": 0.8453, "step": 26026 }, { "epoch": 0.49, "learning_rate": 2.6938175464189178e-06, "loss": 0.9021, "step": 26027 }, { "epoch": 0.49, "learning_rate": 2.6936652403090097e-06, "loss": 0.8336, "step": 26028 }, { "epoch": 0.49, "learning_rate": 2.693512933475963e-06, "loss": 0.8074, "step": 26029 }, { "epoch": 0.49, "learning_rate": 2.693360625920344e-06, "loss": 0.9896, "step": 26030 }, { "epoch": 0.49, "learning_rate": 2.6932083176427226e-06, "loss": 1.1354, "step": 26031 }, { "epoch": 0.49, "learning_rate": 2.693056008643668e-06, "loss": 0.8855, "step": 26032 }, { "epoch": 0.49, "learning_rate": 2.692903698923747e-06, "loss": 1.0367, "step": 26033 }, { "epoch": 0.49, "learning_rate": 2.6927513884835297e-06, "loss": 0.9451, "step": 26034 }, { "epoch": 0.49, "learning_rate": 2.692599077323585e-06, "loss": 0.9907, "step": 26035 }, { "epoch": 0.49, "learning_rate": 2.6924467654444813e-06, "loss": 1.0267, "step": 26036 }, { "epoch": 0.49, "learning_rate": 2.692294452846787e-06, "loss": 0.9827, "step": 26037 }, { "epoch": 0.49, "learning_rate": 2.6921421395310715e-06, "loss": 1.0034, "step": 26038 }, { "epoch": 0.49, "learning_rate": 2.6919898254979034e-06, "loss": 0.9201, "step": 26039 }, { "epoch": 0.49, "learning_rate": 2.69183751074785e-06, "loss": 0.8268, "step": 26040 }, { "epoch": 0.49, "learning_rate": 2.691685195281482e-06, "loss": 0.8877, "step": 26041 }, { "epoch": 0.49, "learning_rate": 2.691532879099367e-06, "loss": 0.8683, "step": 26042 }, { "epoch": 0.49, "learning_rate": 2.6913805622020743e-06, "loss": 1.2582, "step": 26043 }, { "epoch": 0.49, "learning_rate": 2.691228244590173e-06, "loss": 1.0369, "step": 26044 }, { "epoch": 0.49, "learning_rate": 2.6910759262642307e-06, "loss": 0.7805, "step": 26045 }, { "epoch": 0.49, "learning_rate": 2.6909236072248166e-06, "loss": 0.8184, "step": 26046 }, { "epoch": 0.49, "learning_rate": 2.6907712874725007e-06, "loss": 0.9775, "step": 26047 }, { "epoch": 0.49, "learning_rate": 2.690618967007849e-06, "loss": 0.7199, "step": 26048 }, { "epoch": 0.49, "learning_rate": 2.6904666458314326e-06, "loss": 0.8987, "step": 26049 }, { "epoch": 0.49, "learning_rate": 2.69031432394382e-06, "loss": 1.002, "step": 26050 }, { "epoch": 0.49, "learning_rate": 2.690162001345579e-06, "loss": 0.886, "step": 26051 }, { "epoch": 0.49, "learning_rate": 2.690009678037279e-06, "loss": 0.9702, "step": 26052 }, { "epoch": 0.49, "learning_rate": 2.6898573540194893e-06, "loss": 0.8161, "step": 26053 }, { "epoch": 0.49, "learning_rate": 2.689705029292778e-06, "loss": 0.722, "step": 26054 }, { "epoch": 0.49, "learning_rate": 2.6895527038577133e-06, "loss": 0.6979, "step": 26055 }, { "epoch": 0.49, "learning_rate": 2.689400377714865e-06, "loss": 1.0306, "step": 26056 }, { "epoch": 0.49, "learning_rate": 2.689248050864801e-06, "loss": 1.1329, "step": 26057 }, { "epoch": 0.49, "learning_rate": 2.689095723308091e-06, "loss": 0.9453, "step": 26058 }, { "epoch": 0.49, "learning_rate": 2.6889433950453037e-06, "loss": 0.9238, "step": 26059 }, { "epoch": 0.49, "learning_rate": 2.688791066077007e-06, "loss": 0.8978, "step": 26060 }, { "epoch": 0.49, "learning_rate": 2.6886387364037703e-06, "loss": 0.7528, "step": 26061 }, { "epoch": 0.49, "learning_rate": 2.688486406026162e-06, "loss": 0.8647, "step": 26062 }, { "epoch": 0.49, "learning_rate": 2.6883340749447525e-06, "loss": 1.0175, "step": 26063 }, { "epoch": 0.49, "learning_rate": 2.688181743160108e-06, "loss": 0.9843, "step": 26064 }, { "epoch": 0.49, "learning_rate": 2.6880294106728e-06, "loss": 1.0651, "step": 26065 }, { "epoch": 0.49, "learning_rate": 2.6878770774833944e-06, "loss": 0.8993, "step": 26066 }, { "epoch": 0.49, "learning_rate": 2.6877247435924625e-06, "loss": 0.8918, "step": 26067 }, { "epoch": 0.49, "learning_rate": 2.6875724090005723e-06, "loss": 0.7911, "step": 26068 }, { "epoch": 0.49, "learning_rate": 2.687420073708292e-06, "loss": 1.0549, "step": 26069 }, { "epoch": 0.49, "learning_rate": 2.6872677377161903e-06, "loss": 0.849, "step": 26070 }, { "epoch": 0.49, "learning_rate": 2.687115401024838e-06, "loss": 0.8698, "step": 26071 }, { "epoch": 0.49, "learning_rate": 2.6869630636348014e-06, "loss": 0.9073, "step": 26072 }, { "epoch": 0.49, "learning_rate": 2.686810725546652e-06, "loss": 0.9124, "step": 26073 }, { "epoch": 0.49, "learning_rate": 2.686658386760956e-06, "loss": 1.1229, "step": 26074 }, { "epoch": 0.49, "learning_rate": 2.686506047278283e-06, "loss": 0.9727, "step": 26075 }, { "epoch": 0.49, "learning_rate": 2.6863537070992025e-06, "loss": 0.8343, "step": 26076 }, { "epoch": 0.49, "learning_rate": 2.6862013662242823e-06, "loss": 1.0181, "step": 26077 }, { "epoch": 0.49, "learning_rate": 2.6860490246540926e-06, "loss": 0.9674, "step": 26078 }, { "epoch": 0.49, "learning_rate": 2.685896682389202e-06, "loss": 0.8086, "step": 26079 }, { "epoch": 0.49, "learning_rate": 2.685744339430178e-06, "loss": 1.2151, "step": 26080 }, { "epoch": 0.49, "learning_rate": 2.6855919957775907e-06, "loss": 0.9589, "step": 26081 }, { "epoch": 0.49, "learning_rate": 2.6854396514320085e-06, "loss": 0.9016, "step": 26082 }, { "epoch": 0.49, "learning_rate": 2.6852873063940006e-06, "loss": 0.8425, "step": 26083 }, { "epoch": 0.49, "learning_rate": 2.6851349606641345e-06, "loss": 0.7758, "step": 26084 }, { "epoch": 0.49, "learning_rate": 2.684982614242982e-06, "loss": 0.7028, "step": 26085 }, { "epoch": 0.49, "learning_rate": 2.6848302671311087e-06, "loss": 0.9383, "step": 26086 }, { "epoch": 0.49, "learning_rate": 2.684677919329085e-06, "loss": 1.154, "step": 26087 }, { "epoch": 0.49, "learning_rate": 2.6845255708374806e-06, "loss": 1.1697, "step": 26088 }, { "epoch": 0.49, "learning_rate": 2.6843732216568624e-06, "loss": 0.8259, "step": 26089 }, { "epoch": 0.49, "learning_rate": 2.6842208717878e-06, "loss": 0.8841, "step": 26090 }, { "epoch": 0.49, "learning_rate": 2.684068521230863e-06, "loss": 0.9833, "step": 26091 }, { "epoch": 0.49, "learning_rate": 2.68391616998662e-06, "loss": 0.8708, "step": 26092 }, { "epoch": 0.49, "learning_rate": 2.683763818055639e-06, "loss": 0.9138, "step": 26093 }, { "epoch": 0.49, "learning_rate": 2.6836114654384907e-06, "loss": 1.0845, "step": 26094 }, { "epoch": 0.49, "learning_rate": 2.6834591121357422e-06, "loss": 0.7659, "step": 26095 }, { "epoch": 0.49, "learning_rate": 2.6833067581479626e-06, "loss": 1.0356, "step": 26096 }, { "epoch": 0.49, "learning_rate": 2.683154403475721e-06, "loss": 0.921, "step": 26097 }, { "epoch": 0.49, "learning_rate": 2.6830020481195873e-06, "loss": 1.0185, "step": 26098 }, { "epoch": 0.49, "learning_rate": 2.682849692080129e-06, "loss": 1.2684, "step": 26099 }, { "epoch": 0.49, "learning_rate": 2.6826973353579162e-06, "loss": 0.877, "step": 26100 }, { "epoch": 0.49, "learning_rate": 2.6825449779535166e-06, "loss": 1.0119, "step": 26101 }, { "epoch": 0.49, "learning_rate": 2.6823926198674997e-06, "loss": 0.938, "step": 26102 }, { "epoch": 0.49, "learning_rate": 2.6822402611004346e-06, "loss": 0.8927, "step": 26103 }, { "epoch": 0.49, "learning_rate": 2.6820879016528894e-06, "loss": 0.9412, "step": 26104 }, { "epoch": 0.49, "learning_rate": 2.6819355415254338e-06, "loss": 0.9023, "step": 26105 }, { "epoch": 0.49, "learning_rate": 2.6817831807186374e-06, "loss": 0.9401, "step": 26106 }, { "epoch": 0.49, "learning_rate": 2.681630819233067e-06, "loss": 0.7312, "step": 26107 }, { "epoch": 0.49, "learning_rate": 2.681478457069293e-06, "loss": 0.853, "step": 26108 }, { "epoch": 0.49, "learning_rate": 2.6813260942278845e-06, "loss": 1.0251, "step": 26109 }, { "epoch": 0.49, "learning_rate": 2.681173730709409e-06, "loss": 0.8322, "step": 26110 }, { "epoch": 0.49, "learning_rate": 2.681021366514436e-06, "loss": 1.0378, "step": 26111 }, { "epoch": 0.49, "learning_rate": 2.680869001643537e-06, "loss": 1.1026, "step": 26112 }, { "epoch": 0.49, "learning_rate": 2.680716636097277e-06, "loss": 1.0423, "step": 26113 }, { "epoch": 0.49, "learning_rate": 2.6805642698762265e-06, "loss": 0.7999, "step": 26114 }, { "epoch": 0.49, "learning_rate": 2.6804119029809556e-06, "loss": 0.8347, "step": 26115 }, { "epoch": 0.49, "learning_rate": 2.6802595354120314e-06, "loss": 0.7542, "step": 26116 }, { "epoch": 0.49, "learning_rate": 2.6801071671700235e-06, "loss": 0.8371, "step": 26117 }, { "epoch": 0.49, "learning_rate": 2.6799547982555015e-06, "loss": 1.2294, "step": 26118 }, { "epoch": 0.49, "learning_rate": 2.6798024286690333e-06, "loss": 1.2639, "step": 26119 }, { "epoch": 0.49, "learning_rate": 2.6796500584111886e-06, "loss": 0.8197, "step": 26120 }, { "epoch": 0.49, "learning_rate": 2.679497687482536e-06, "loss": 0.8208, "step": 26121 }, { "epoch": 0.49, "learning_rate": 2.6793453158836447e-06, "loss": 0.9193, "step": 26122 }, { "epoch": 0.49, "learning_rate": 2.679192943615083e-06, "loss": 1.004, "step": 26123 }, { "epoch": 0.49, "learning_rate": 2.679040570677421e-06, "loss": 1.145, "step": 26124 }, { "epoch": 0.49, "learning_rate": 2.6788881970712267e-06, "loss": 1.4303, "step": 26125 }, { "epoch": 0.49, "learning_rate": 2.6787358227970694e-06, "loss": 1.1158, "step": 26126 }, { "epoch": 0.49, "learning_rate": 2.6785834478555184e-06, "loss": 0.9788, "step": 26127 }, { "epoch": 0.49, "learning_rate": 2.678431072247142e-06, "loss": 1.0035, "step": 26128 }, { "epoch": 0.49, "learning_rate": 2.6782786959725088e-06, "loss": 0.9836, "step": 26129 }, { "epoch": 0.49, "learning_rate": 2.6781263190321895e-06, "loss": 0.9097, "step": 26130 }, { "epoch": 0.49, "learning_rate": 2.6779739414267516e-06, "loss": 1.0286, "step": 26131 }, { "epoch": 0.49, "learning_rate": 2.6778215631567633e-06, "loss": 0.9513, "step": 26132 }, { "epoch": 0.49, "learning_rate": 2.6776691842227966e-06, "loss": 0.8683, "step": 26133 }, { "epoch": 0.49, "learning_rate": 2.6775168046254175e-06, "loss": 0.9255, "step": 26134 }, { "epoch": 0.49, "learning_rate": 2.677364424365196e-06, "loss": 0.936, "step": 26135 }, { "epoch": 0.49, "learning_rate": 2.677212043442702e-06, "loss": 1.2176, "step": 26136 }, { "epoch": 0.49, "learning_rate": 2.6770596618585033e-06, "loss": 1.0838, "step": 26137 }, { "epoch": 0.49, "learning_rate": 2.676907279613169e-06, "loss": 0.7847, "step": 26138 }, { "epoch": 0.49, "learning_rate": 2.676754896707268e-06, "loss": 0.9966, "step": 26139 }, { "epoch": 0.49, "learning_rate": 2.6766025131413703e-06, "loss": 0.8836, "step": 26140 }, { "epoch": 0.49, "learning_rate": 2.6764501289160437e-06, "loss": 0.8514, "step": 26141 }, { "epoch": 0.49, "learning_rate": 2.676297744031859e-06, "loss": 0.9587, "step": 26142 }, { "epoch": 0.49, "learning_rate": 2.6761453584893827e-06, "loss": 1.0162, "step": 26143 }, { "epoch": 0.49, "learning_rate": 2.6759929722891853e-06, "loss": 0.9498, "step": 26144 }, { "epoch": 0.49, "learning_rate": 2.675840585431835e-06, "loss": 0.7572, "step": 26145 }, { "epoch": 0.49, "learning_rate": 2.6756881979179024e-06, "loss": 0.9982, "step": 26146 }, { "epoch": 0.49, "learning_rate": 2.6755358097479545e-06, "loss": 0.8769, "step": 26147 }, { "epoch": 0.49, "learning_rate": 2.6753834209225623e-06, "loss": 1.0099, "step": 26148 }, { "epoch": 0.49, "learning_rate": 2.675231031442293e-06, "loss": 1.0905, "step": 26149 }, { "epoch": 0.49, "learning_rate": 2.675078641307717e-06, "loss": 0.9941, "step": 26150 }, { "epoch": 0.49, "learning_rate": 2.6749262505194024e-06, "loss": 0.9574, "step": 26151 }, { "epoch": 0.49, "learning_rate": 2.674773859077918e-06, "loss": 0.8936, "step": 26152 }, { "epoch": 0.49, "learning_rate": 2.6746214669838338e-06, "loss": 0.8849, "step": 26153 }, { "epoch": 0.49, "learning_rate": 2.6744690742377188e-06, "loss": 0.9069, "step": 26154 }, { "epoch": 0.49, "learning_rate": 2.674316680840141e-06, "loss": 1.0677, "step": 26155 }, { "epoch": 0.49, "learning_rate": 2.6741642867916704e-06, "loss": 1.1788, "step": 26156 }, { "epoch": 0.49, "learning_rate": 2.674011892092876e-06, "loss": 0.7929, "step": 26157 }, { "epoch": 0.49, "learning_rate": 2.673859496744326e-06, "loss": 0.7861, "step": 26158 }, { "epoch": 0.49, "learning_rate": 2.6737071007465903e-06, "loss": 0.9307, "step": 26159 }, { "epoch": 0.49, "learning_rate": 2.6735547041002376e-06, "loss": 0.7887, "step": 26160 }, { "epoch": 0.49, "learning_rate": 2.6734023068058364e-06, "loss": 1.0093, "step": 26161 }, { "epoch": 0.49, "learning_rate": 2.673249908863956e-06, "loss": 1.0827, "step": 26162 }, { "epoch": 0.49, "learning_rate": 2.673097510275167e-06, "loss": 1.0499, "step": 26163 }, { "epoch": 0.49, "learning_rate": 2.672945111040037e-06, "loss": 0.7294, "step": 26164 }, { "epoch": 0.49, "learning_rate": 2.6727927111591346e-06, "loss": 0.969, "step": 26165 }, { "epoch": 0.49, "learning_rate": 2.67264031063303e-06, "loss": 0.9839, "step": 26166 }, { "epoch": 0.49, "learning_rate": 2.6724879094622914e-06, "loss": 0.7867, "step": 26167 }, { "epoch": 0.49, "learning_rate": 2.6723355076474885e-06, "loss": 0.8547, "step": 26168 }, { "epoch": 0.49, "learning_rate": 2.6721831051891903e-06, "loss": 1.0291, "step": 26169 }, { "epoch": 0.49, "learning_rate": 2.6720307020879654e-06, "loss": 0.8508, "step": 26170 }, { "epoch": 0.49, "learning_rate": 2.671878298344383e-06, "loss": 0.958, "step": 26171 }, { "epoch": 0.49, "learning_rate": 2.671725893959013e-06, "loss": 0.8328, "step": 26172 }, { "epoch": 0.49, "learning_rate": 2.671573488932423e-06, "loss": 0.8867, "step": 26173 }, { "epoch": 0.49, "learning_rate": 2.671421083265182e-06, "loss": 1.016, "step": 26174 }, { "epoch": 0.49, "learning_rate": 2.6712686769578617e-06, "loss": 1.0139, "step": 26175 }, { "epoch": 0.49, "learning_rate": 2.671116270011029e-06, "loss": 0.9385, "step": 26176 }, { "epoch": 0.49, "learning_rate": 2.670963862425253e-06, "loss": 0.7766, "step": 26177 }, { "epoch": 0.49, "learning_rate": 2.670811454201103e-06, "loss": 0.9039, "step": 26178 }, { "epoch": 0.49, "learning_rate": 2.670659045339149e-06, "loss": 0.7979, "step": 26179 }, { "epoch": 0.49, "learning_rate": 2.670506635839959e-06, "loss": 0.9757, "step": 26180 }, { "epoch": 0.49, "learning_rate": 2.6703542257041022e-06, "loss": 1.1042, "step": 26181 }, { "epoch": 0.49, "learning_rate": 2.6702018149321478e-06, "loss": 1.0226, "step": 26182 }, { "epoch": 0.49, "learning_rate": 2.6700494035246654e-06, "loss": 0.9978, "step": 26183 }, { "epoch": 0.49, "learning_rate": 2.669896991482224e-06, "loss": 0.9681, "step": 26184 }, { "epoch": 0.49, "learning_rate": 2.669744578805392e-06, "loss": 0.8165, "step": 26185 }, { "epoch": 0.49, "learning_rate": 2.669592165494739e-06, "loss": 0.993, "step": 26186 }, { "epoch": 0.49, "learning_rate": 2.669439751550834e-06, "loss": 1.0966, "step": 26187 }, { "epoch": 0.49, "learning_rate": 2.669287336974246e-06, "loss": 1.0598, "step": 26188 }, { "epoch": 0.49, "learning_rate": 2.6691349217655453e-06, "loss": 0.7993, "step": 26189 }, { "epoch": 0.49, "learning_rate": 2.6689825059252994e-06, "loss": 0.724, "step": 26190 }, { "epoch": 0.49, "learning_rate": 2.6688300894540774e-06, "loss": 0.8432, "step": 26191 }, { "epoch": 0.49, "learning_rate": 2.66867767235245e-06, "loss": 0.851, "step": 26192 }, { "epoch": 0.49, "learning_rate": 2.668525254620985e-06, "loss": 0.9052, "step": 26193 }, { "epoch": 0.49, "learning_rate": 2.668372836260251e-06, "loss": 0.838, "step": 26194 }, { "epoch": 0.49, "learning_rate": 2.668220417270819e-06, "loss": 1.0746, "step": 26195 }, { "epoch": 0.49, "learning_rate": 2.6680679976532566e-06, "loss": 0.8045, "step": 26196 }, { "epoch": 0.49, "learning_rate": 2.6679155774081335e-06, "loss": 0.8324, "step": 26197 }, { "epoch": 0.49, "learning_rate": 2.6677631565360197e-06, "loss": 0.7728, "step": 26198 }, { "epoch": 0.49, "learning_rate": 2.6676107350374827e-06, "loss": 0.8705, "step": 26199 }, { "epoch": 0.49, "learning_rate": 2.6674583129130916e-06, "loss": 1.1544, "step": 26200 }, { "epoch": 0.49, "learning_rate": 2.667305890163417e-06, "loss": 0.9749, "step": 26201 }, { "epoch": 0.49, "learning_rate": 2.6671534667890277e-06, "loss": 0.8526, "step": 26202 }, { "epoch": 0.49, "learning_rate": 2.667001042790492e-06, "loss": 0.83, "step": 26203 }, { "epoch": 0.49, "learning_rate": 2.66684861816838e-06, "loss": 0.7681, "step": 26204 }, { "epoch": 0.49, "learning_rate": 2.66669619292326e-06, "loss": 0.9806, "step": 26205 }, { "epoch": 0.49, "learning_rate": 2.666543767055701e-06, "loss": 1.1403, "step": 26206 }, { "epoch": 0.49, "learning_rate": 2.666391340566274e-06, "loss": 0.9854, "step": 26207 }, { "epoch": 0.49, "learning_rate": 2.666238913455545e-06, "loss": 0.9601, "step": 26208 }, { "epoch": 0.49, "learning_rate": 2.6660864857240863e-06, "loss": 0.8731, "step": 26209 }, { "epoch": 0.49, "learning_rate": 2.6659340573724657e-06, "loss": 0.8925, "step": 26210 }, { "epoch": 0.49, "learning_rate": 2.665781628401252e-06, "loss": 1.0391, "step": 26211 }, { "epoch": 0.49, "learning_rate": 2.665629198811015e-06, "loss": 1.0903, "step": 26212 }, { "epoch": 0.49, "learning_rate": 2.665476768602324e-06, "loss": 1.0693, "step": 26213 }, { "epoch": 0.49, "learning_rate": 2.6653243377757477e-06, "loss": 0.8242, "step": 26214 }, { "epoch": 0.49, "learning_rate": 2.6651719063318547e-06, "loss": 0.8398, "step": 26215 }, { "epoch": 0.49, "learning_rate": 2.6650194742712153e-06, "loss": 0.9346, "step": 26216 }, { "epoch": 0.49, "learning_rate": 2.6648670415943985e-06, "loss": 0.7612, "step": 26217 }, { "epoch": 0.49, "learning_rate": 2.6647146083019725e-06, "loss": 0.8494, "step": 26218 }, { "epoch": 0.49, "learning_rate": 2.6645621743945082e-06, "loss": 1.0486, "step": 26219 }, { "epoch": 0.49, "learning_rate": 2.6644097398725737e-06, "loss": 0.8326, "step": 26220 }, { "epoch": 0.49, "learning_rate": 2.6642573047367376e-06, "loss": 0.7538, "step": 26221 }, { "epoch": 0.49, "learning_rate": 2.66410486898757e-06, "loss": 0.826, "step": 26222 }, { "epoch": 0.49, "learning_rate": 2.6639524326256393e-06, "loss": 0.8221, "step": 26223 }, { "epoch": 0.49, "learning_rate": 2.663799995651516e-06, "loss": 0.9884, "step": 26224 }, { "epoch": 0.49, "learning_rate": 2.663647558065769e-06, "loss": 1.2712, "step": 26225 }, { "epoch": 0.49, "learning_rate": 2.663495119868966e-06, "loss": 1.0681, "step": 26226 }, { "epoch": 0.49, "learning_rate": 2.663342681061678e-06, "loss": 0.9543, "step": 26227 }, { "epoch": 0.49, "learning_rate": 2.6631902416444733e-06, "loss": 0.6277, "step": 26228 }, { "epoch": 0.49, "learning_rate": 2.6630378016179202e-06, "loss": 0.8088, "step": 26229 }, { "epoch": 0.49, "learning_rate": 2.66288536098259e-06, "loss": 0.967, "step": 26230 }, { "epoch": 0.49, "learning_rate": 2.6627329197390507e-06, "loss": 0.9235, "step": 26231 }, { "epoch": 0.49, "learning_rate": 2.6625804778878717e-06, "loss": 1.0067, "step": 26232 }, { "epoch": 0.49, "learning_rate": 2.6624280354296217e-06, "loss": 0.7491, "step": 26233 }, { "epoch": 0.49, "learning_rate": 2.662275592364871e-06, "loss": 0.9483, "step": 26234 }, { "epoch": 0.49, "learning_rate": 2.6621231486941884e-06, "loss": 0.9139, "step": 26235 }, { "epoch": 0.49, "learning_rate": 2.661970704418142e-06, "loss": 0.8841, "step": 26236 }, { "epoch": 0.5, "learning_rate": 2.6618182595373026e-06, "loss": 0.9461, "step": 26237 }, { "epoch": 0.5, "learning_rate": 2.6616658140522384e-06, "loss": 1.1118, "step": 26238 }, { "epoch": 0.5, "learning_rate": 2.661513367963519e-06, "loss": 1.0565, "step": 26239 }, { "epoch": 0.5, "learning_rate": 2.6613609212717147e-06, "loss": 0.8471, "step": 26240 }, { "epoch": 0.5, "learning_rate": 2.6612084739773923e-06, "loss": 0.8439, "step": 26241 }, { "epoch": 0.5, "learning_rate": 2.661056026081123e-06, "loss": 0.6502, "step": 26242 }, { "epoch": 0.5, "learning_rate": 2.6609035775834756e-06, "loss": 1.0537, "step": 26243 }, { "epoch": 0.5, "learning_rate": 2.6607511284850184e-06, "loss": 1.0561, "step": 26244 }, { "epoch": 0.5, "learning_rate": 2.6605986787863223e-06, "loss": 0.8735, "step": 26245 }, { "epoch": 0.5, "learning_rate": 2.6604462284879557e-06, "loss": 0.7057, "step": 26246 }, { "epoch": 0.5, "learning_rate": 2.6602937775904874e-06, "loss": 0.8639, "step": 26247 }, { "epoch": 0.5, "learning_rate": 2.660141326094487e-06, "loss": 0.8203, "step": 26248 }, { "epoch": 0.5, "learning_rate": 2.6599888740005243e-06, "loss": 1.1447, "step": 26249 }, { "epoch": 0.5, "learning_rate": 2.6598364213091673e-06, "loss": 1.215, "step": 26250 }, { "epoch": 0.5, "learning_rate": 2.6596839680209857e-06, "loss": 1.0632, "step": 26251 }, { "epoch": 0.5, "learning_rate": 2.65953151413655e-06, "loss": 0.9984, "step": 26252 }, { "epoch": 0.5, "learning_rate": 2.6593790596564284e-06, "loss": 0.9629, "step": 26253 }, { "epoch": 0.5, "learning_rate": 2.65922660458119e-06, "loss": 0.7252, "step": 26254 }, { "epoch": 0.5, "learning_rate": 2.659074148911405e-06, "loss": 0.963, "step": 26255 }, { "epoch": 0.5, "learning_rate": 2.6589216926476414e-06, "loss": 1.0414, "step": 26256 }, { "epoch": 0.5, "learning_rate": 2.6587692357904687e-06, "loss": 0.9612, "step": 26257 }, { "epoch": 0.5, "learning_rate": 2.658616778340457e-06, "loss": 1.065, "step": 26258 }, { "epoch": 0.5, "learning_rate": 2.6584643202981753e-06, "loss": 1.0916, "step": 26259 }, { "epoch": 0.5, "learning_rate": 2.658311861664192e-06, "loss": 0.8347, "step": 26260 }, { "epoch": 0.5, "learning_rate": 2.658159402439078e-06, "loss": 0.8438, "step": 26261 }, { "epoch": 0.5, "learning_rate": 2.658006942623401e-06, "loss": 1.1444, "step": 26262 }, { "epoch": 0.5, "learning_rate": 2.657854482217731e-06, "loss": 0.9305, "step": 26263 }, { "epoch": 0.5, "learning_rate": 2.657702021222637e-06, "loss": 0.7773, "step": 26264 }, { "epoch": 0.5, "learning_rate": 2.657549559638689e-06, "loss": 0.8099, "step": 26265 }, { "epoch": 0.5, "learning_rate": 2.6573970974664552e-06, "loss": 1.1354, "step": 26266 }, { "epoch": 0.5, "learning_rate": 2.657244634706506e-06, "loss": 0.8542, "step": 26267 }, { "epoch": 0.5, "learning_rate": 2.65709217135941e-06, "loss": 1.1089, "step": 26268 }, { "epoch": 0.5, "learning_rate": 2.656939707425737e-06, "loss": 1.0536, "step": 26269 }, { "epoch": 0.5, "learning_rate": 2.656787242906056e-06, "loss": 0.8846, "step": 26270 }, { "epoch": 0.5, "learning_rate": 2.656634777800935e-06, "loss": 0.6789, "step": 26271 }, { "epoch": 0.5, "learning_rate": 2.656482312110945e-06, "loss": 1.0541, "step": 26272 }, { "epoch": 0.5, "learning_rate": 2.656329845836656e-06, "loss": 0.7712, "step": 26273 }, { "epoch": 0.5, "learning_rate": 2.6561773789786347e-06, "loss": 1.0569, "step": 26274 }, { "epoch": 0.5, "learning_rate": 2.6560249115374525e-06, "loss": 0.7593, "step": 26275 }, { "epoch": 0.5, "learning_rate": 2.6558724435136784e-06, "loss": 0.9519, "step": 26276 }, { "epoch": 0.5, "learning_rate": 2.655719974907881e-06, "loss": 0.8393, "step": 26277 }, { "epoch": 0.5, "learning_rate": 2.65556750572063e-06, "loss": 0.7868, "step": 26278 }, { "epoch": 0.5, "learning_rate": 2.655415035952495e-06, "loss": 0.797, "step": 26279 }, { "epoch": 0.5, "learning_rate": 2.6552625656040445e-06, "loss": 1.0037, "step": 26280 }, { "epoch": 0.5, "learning_rate": 2.6551100946758486e-06, "loss": 0.9926, "step": 26281 }, { "epoch": 0.5, "learning_rate": 2.6549576231684767e-06, "loss": 0.9866, "step": 26282 }, { "epoch": 0.5, "learning_rate": 2.6548051510824973e-06, "loss": 0.9485, "step": 26283 }, { "epoch": 0.5, "learning_rate": 2.6546526784184803e-06, "loss": 1.0521, "step": 26284 }, { "epoch": 0.5, "learning_rate": 2.6545002051769947e-06, "loss": 0.9241, "step": 26285 }, { "epoch": 0.5, "learning_rate": 2.6543477313586102e-06, "loss": 0.8788, "step": 26286 }, { "epoch": 0.5, "learning_rate": 2.654195256963896e-06, "loss": 1.0814, "step": 26287 }, { "epoch": 0.5, "learning_rate": 2.6540427819934223e-06, "loss": 0.9688, "step": 26288 }, { "epoch": 0.5, "learning_rate": 2.6538903064477568e-06, "loss": 0.7863, "step": 26289 }, { "epoch": 0.5, "learning_rate": 2.653737830327469e-06, "loss": 0.8446, "step": 26290 }, { "epoch": 0.5, "learning_rate": 2.65358535363313e-06, "loss": 0.9615, "step": 26291 }, { "epoch": 0.5, "learning_rate": 2.6534328763653072e-06, "loss": 1.0574, "step": 26292 }, { "epoch": 0.5, "learning_rate": 2.653280398524571e-06, "loss": 1.1596, "step": 26293 }, { "epoch": 0.5, "learning_rate": 2.6531279201114913e-06, "loss": 1.0441, "step": 26294 }, { "epoch": 0.5, "learning_rate": 2.6529754411266357e-06, "loss": 0.8847, "step": 26295 }, { "epoch": 0.5, "learning_rate": 2.6528229615705745e-06, "loss": 1.1036, "step": 26296 }, { "epoch": 0.5, "learning_rate": 2.6526704814438774e-06, "loss": 0.9281, "step": 26297 }, { "epoch": 0.5, "learning_rate": 2.6525180007471136e-06, "loss": 0.8798, "step": 26298 }, { "epoch": 0.5, "learning_rate": 2.652365519480852e-06, "loss": 0.9875, "step": 26299 }, { "epoch": 0.5, "learning_rate": 2.652213037645662e-06, "loss": 1.1975, "step": 26300 }, { "epoch": 0.5, "learning_rate": 2.652060555242113e-06, "loss": 1.096, "step": 26301 }, { "epoch": 0.5, "learning_rate": 2.6519080722707744e-06, "loss": 0.7941, "step": 26302 }, { "epoch": 0.5, "learning_rate": 2.651755588732217e-06, "loss": 1.0444, "step": 26303 }, { "epoch": 0.5, "learning_rate": 2.651603104627008e-06, "loss": 0.8917, "step": 26304 }, { "epoch": 0.5, "learning_rate": 2.651450619955718e-06, "loss": 0.9972, "step": 26305 }, { "epoch": 0.5, "learning_rate": 2.6512981347189155e-06, "loss": 1.0027, "step": 26306 }, { "epoch": 0.5, "learning_rate": 2.65114564891717e-06, "loss": 0.9374, "step": 26307 }, { "epoch": 0.5, "learning_rate": 2.6509931625510526e-06, "loss": 0.7958, "step": 26308 }, { "epoch": 0.5, "learning_rate": 2.650840675621131e-06, "loss": 0.9071, "step": 26309 }, { "epoch": 0.5, "learning_rate": 2.6506881881279738e-06, "loss": 0.8587, "step": 26310 }, { "epoch": 0.5, "learning_rate": 2.6505357000721534e-06, "loss": 0.939, "step": 26311 }, { "epoch": 0.5, "learning_rate": 2.650383211454236e-06, "loss": 1.024, "step": 26312 }, { "epoch": 0.5, "learning_rate": 2.650230722274792e-06, "loss": 0.9063, "step": 26313 }, { "epoch": 0.5, "learning_rate": 2.6500782325343923e-06, "loss": 0.8599, "step": 26314 }, { "epoch": 0.5, "learning_rate": 2.649925742233604e-06, "loss": 0.9223, "step": 26315 }, { "epoch": 0.5, "learning_rate": 2.649773251372998e-06, "loss": 0.8837, "step": 26316 }, { "epoch": 0.5, "learning_rate": 2.6496207599531438e-06, "loss": 0.8282, "step": 26317 }, { "epoch": 0.5, "learning_rate": 2.6494682679746096e-06, "loss": 1.0959, "step": 26318 }, { "epoch": 0.5, "learning_rate": 2.6493157754379655e-06, "loss": 1.048, "step": 26319 }, { "epoch": 0.5, "learning_rate": 2.6491632823437806e-06, "loss": 1.0531, "step": 26320 }, { "epoch": 0.5, "learning_rate": 2.6490107886926253e-06, "loss": 0.79, "step": 26321 }, { "epoch": 0.5, "learning_rate": 2.6488582944850677e-06, "loss": 0.904, "step": 26322 }, { "epoch": 0.5, "learning_rate": 2.6487057997216785e-06, "loss": 0.7391, "step": 26323 }, { "epoch": 0.5, "learning_rate": 2.648553304403026e-06, "loss": 1.028, "step": 26324 }, { "epoch": 0.5, "learning_rate": 2.6484008085296797e-06, "loss": 1.0296, "step": 26325 }, { "epoch": 0.5, "learning_rate": 2.6482483121022096e-06, "loss": 1.0103, "step": 26326 }, { "epoch": 0.5, "learning_rate": 2.648095815121185e-06, "loss": 0.6925, "step": 26327 }, { "epoch": 0.5, "learning_rate": 2.647943317587175e-06, "loss": 1.0323, "step": 26328 }, { "epoch": 0.5, "learning_rate": 2.6477908195007495e-06, "loss": 0.8271, "step": 26329 }, { "epoch": 0.5, "learning_rate": 2.6476383208624773e-06, "loss": 0.9893, "step": 26330 }, { "epoch": 0.5, "learning_rate": 2.647485821672928e-06, "loss": 0.9621, "step": 26331 }, { "epoch": 0.5, "learning_rate": 2.647333321932672e-06, "loss": 1.0244, "step": 26332 }, { "epoch": 0.5, "learning_rate": 2.6471808216422767e-06, "loss": 0.9744, "step": 26333 }, { "epoch": 0.5, "learning_rate": 2.647028320802313e-06, "loss": 1.0287, "step": 26334 }, { "epoch": 0.5, "learning_rate": 2.6468758194133505e-06, "loss": 0.7768, "step": 26335 }, { "epoch": 0.5, "learning_rate": 2.6467233174759578e-06, "loss": 0.7401, "step": 26336 }, { "epoch": 0.5, "learning_rate": 2.646570814990705e-06, "loss": 1.0887, "step": 26337 }, { "epoch": 0.5, "learning_rate": 2.6464183119581614e-06, "loss": 0.9926, "step": 26338 }, { "epoch": 0.5, "learning_rate": 2.646265808378896e-06, "loss": 0.825, "step": 26339 }, { "epoch": 0.5, "learning_rate": 2.6461133042534788e-06, "loss": 1.0006, "step": 26340 }, { "epoch": 0.5, "learning_rate": 2.6459607995824787e-06, "loss": 0.8435, "step": 26341 }, { "epoch": 0.5, "learning_rate": 2.6458082943664654e-06, "loss": 1.0741, "step": 26342 }, { "epoch": 0.5, "learning_rate": 2.6456557886060085e-06, "loss": 1.0504, "step": 26343 }, { "epoch": 0.5, "learning_rate": 2.645503282301678e-06, "loss": 0.9408, "step": 26344 }, { "epoch": 0.5, "learning_rate": 2.645350775454042e-06, "loss": 0.9757, "step": 26345 }, { "epoch": 0.5, "learning_rate": 2.6451982680636712e-06, "loss": 0.9631, "step": 26346 }, { "epoch": 0.5, "learning_rate": 2.6450457601311335e-06, "loss": 0.9057, "step": 26347 }, { "epoch": 0.5, "learning_rate": 2.6448932516570003e-06, "loss": 0.7804, "step": 26348 }, { "epoch": 0.5, "learning_rate": 2.6447407426418397e-06, "loss": 1.0606, "step": 26349 }, { "epoch": 0.5, "learning_rate": 2.644588233086222e-06, "loss": 1.149, "step": 26350 }, { "epoch": 0.5, "learning_rate": 2.6444357229907162e-06, "loss": 1.1114, "step": 26351 }, { "epoch": 0.5, "learning_rate": 2.6442832123558914e-06, "loss": 0.8808, "step": 26352 }, { "epoch": 0.5, "learning_rate": 2.6441307011823184e-06, "loss": 0.9242, "step": 26353 }, { "epoch": 0.5, "learning_rate": 2.6439781894705653e-06, "loss": 0.8102, "step": 26354 }, { "epoch": 0.5, "learning_rate": 2.6438256772212012e-06, "loss": 0.8353, "step": 26355 }, { "epoch": 0.5, "learning_rate": 2.6436731644347975e-06, "loss": 1.02, "step": 26356 }, { "epoch": 0.5, "learning_rate": 2.643520651111922e-06, "loss": 0.9465, "step": 26357 }, { "epoch": 0.5, "learning_rate": 2.643368137253145e-06, "loss": 0.9615, "step": 26358 }, { "epoch": 0.5, "learning_rate": 2.6432156228590368e-06, "loss": 0.9267, "step": 26359 }, { "epoch": 0.5, "learning_rate": 2.6430631079301644e-06, "loss": 0.8972, "step": 26360 }, { "epoch": 0.5, "learning_rate": 2.642910592467099e-06, "loss": 0.8722, "step": 26361 }, { "epoch": 0.5, "learning_rate": 2.6427580764704102e-06, "loss": 1.0259, "step": 26362 }, { "epoch": 0.5, "learning_rate": 2.6426055599406668e-06, "loss": 0.8716, "step": 26363 }, { "epoch": 0.5, "learning_rate": 2.642453042878439e-06, "loss": 0.9655, "step": 26364 }, { "epoch": 0.5, "learning_rate": 2.642300525284296e-06, "loss": 0.9948, "step": 26365 }, { "epoch": 0.5, "learning_rate": 2.6421480071588067e-06, "loss": 0.9576, "step": 26366 }, { "epoch": 0.5, "learning_rate": 2.6419954885025413e-06, "loss": 0.707, "step": 26367 }, { "epoch": 0.5, "learning_rate": 2.6418429693160693e-06, "loss": 1.1015, "step": 26368 }, { "epoch": 0.5, "learning_rate": 2.641690449599959e-06, "loss": 1.068, "step": 26369 }, { "epoch": 0.5, "learning_rate": 2.6415379293547817e-06, "loss": 0.9945, "step": 26370 }, { "epoch": 0.5, "learning_rate": 2.6413854085811068e-06, "loss": 0.9655, "step": 26371 }, { "epoch": 0.5, "learning_rate": 2.6412328872795024e-06, "loss": 0.9748, "step": 26372 }, { "epoch": 0.5, "learning_rate": 2.6410803654505383e-06, "loss": 0.8022, "step": 26373 }, { "epoch": 0.5, "learning_rate": 2.6409278430947854e-06, "loss": 0.886, "step": 26374 }, { "epoch": 0.5, "learning_rate": 2.6407753202128116e-06, "loss": 1.0215, "step": 26375 }, { "epoch": 0.5, "learning_rate": 2.640622796805187e-06, "loss": 0.9971, "step": 26376 }, { "epoch": 0.5, "learning_rate": 2.6404702728724817e-06, "loss": 0.9504, "step": 26377 }, { "epoch": 0.5, "learning_rate": 2.640317748415264e-06, "loss": 0.9242, "step": 26378 }, { "epoch": 0.5, "learning_rate": 2.6401652234341047e-06, "loss": 0.6901, "step": 26379 }, { "epoch": 0.5, "learning_rate": 2.6400126979295733e-06, "loss": 1.1172, "step": 26380 }, { "epoch": 0.5, "learning_rate": 2.6398601719022374e-06, "loss": 1.084, "step": 26381 }, { "epoch": 0.5, "learning_rate": 2.639707645352669e-06, "loss": 1.1649, "step": 26382 }, { "epoch": 0.5, "learning_rate": 2.639555118281436e-06, "loss": 0.8915, "step": 26383 }, { "epoch": 0.5, "learning_rate": 2.6394025906891087e-06, "loss": 0.9161, "step": 26384 }, { "epoch": 0.5, "learning_rate": 2.6392500625762558e-06, "loss": 0.8686, "step": 26385 }, { "epoch": 0.5, "learning_rate": 2.6390975339434487e-06, "loss": 0.8215, "step": 26386 }, { "epoch": 0.5, "learning_rate": 2.6389450047912546e-06, "loss": 1.1538, "step": 26387 }, { "epoch": 0.5, "learning_rate": 2.6387924751202443e-06, "loss": 0.7119, "step": 26388 }, { "epoch": 0.5, "learning_rate": 2.6386399449309875e-06, "loss": 0.7686, "step": 26389 }, { "epoch": 0.5, "learning_rate": 2.638487414224053e-06, "loss": 0.8174, "step": 26390 }, { "epoch": 0.5, "learning_rate": 2.6383348830000104e-06, "loss": 0.9665, "step": 26391 }, { "epoch": 0.5, "learning_rate": 2.6381823512594306e-06, "loss": 1.0568, "step": 26392 }, { "epoch": 0.5, "learning_rate": 2.638029819002882e-06, "loss": 1.1653, "step": 26393 }, { "epoch": 0.5, "learning_rate": 2.637877286230934e-06, "loss": 0.928, "step": 26394 }, { "epoch": 0.5, "learning_rate": 2.6377247529441565e-06, "loss": 0.7705, "step": 26395 }, { "epoch": 0.5, "learning_rate": 2.637572219143118e-06, "loss": 0.7798, "step": 26396 }, { "epoch": 0.5, "learning_rate": 2.63741968482839e-06, "loss": 0.9061, "step": 26397 }, { "epoch": 0.5, "learning_rate": 2.6372671500005415e-06, "loss": 0.7812, "step": 26398 }, { "epoch": 0.5, "learning_rate": 2.637114614660141e-06, "loss": 0.9005, "step": 26399 }, { "epoch": 0.5, "learning_rate": 2.6369620788077588e-06, "loss": 1.0001, "step": 26400 }, { "epoch": 0.5, "learning_rate": 2.636809542443965e-06, "loss": 0.9792, "step": 26401 }, { "epoch": 0.5, "learning_rate": 2.636657005569328e-06, "loss": 1.0646, "step": 26402 }, { "epoch": 0.5, "learning_rate": 2.6365044681844175e-06, "loss": 0.896, "step": 26403 }, { "epoch": 0.5, "learning_rate": 2.6363519302898045e-06, "loss": 0.8787, "step": 26404 }, { "epoch": 0.5, "learning_rate": 2.636199391886057e-06, "loss": 0.85, "step": 26405 }, { "epoch": 0.5, "learning_rate": 2.636046852973745e-06, "loss": 1.0261, "step": 26406 }, { "epoch": 0.5, "learning_rate": 2.6358943135534387e-06, "loss": 0.9145, "step": 26407 }, { "epoch": 0.5, "learning_rate": 2.635741773625707e-06, "loss": 0.9313, "step": 26408 }, { "epoch": 0.5, "learning_rate": 2.63558923319112e-06, "loss": 0.9022, "step": 26409 }, { "epoch": 0.5, "learning_rate": 2.635436692250246e-06, "loss": 0.8943, "step": 26410 }, { "epoch": 0.5, "learning_rate": 2.6352841508036563e-06, "loss": 0.8327, "step": 26411 }, { "epoch": 0.5, "learning_rate": 2.635131608851919e-06, "loss": 1.0839, "step": 26412 }, { "epoch": 0.5, "learning_rate": 2.634979066395606e-06, "loss": 1.0157, "step": 26413 }, { "epoch": 0.5, "learning_rate": 2.634826523435284e-06, "loss": 1.0069, "step": 26414 }, { "epoch": 0.5, "learning_rate": 2.6346739799715245e-06, "loss": 0.8678, "step": 26415 }, { "epoch": 0.5, "learning_rate": 2.634521436004896e-06, "loss": 0.8749, "step": 26416 }, { "epoch": 0.5, "learning_rate": 2.634368891535968e-06, "loss": 0.7388, "step": 26417 }, { "epoch": 0.5, "learning_rate": 2.6342163465653114e-06, "loss": 1.0529, "step": 26418 }, { "epoch": 0.5, "learning_rate": 2.634063801093496e-06, "loss": 0.9071, "step": 26419 }, { "epoch": 0.5, "learning_rate": 2.6339112551210895e-06, "loss": 0.8712, "step": 26420 }, { "epoch": 0.5, "learning_rate": 2.6337587086486627e-06, "loss": 0.7555, "step": 26421 }, { "epoch": 0.5, "learning_rate": 2.633606161676785e-06, "loss": 0.9211, "step": 26422 }, { "epoch": 0.5, "learning_rate": 2.633453614206026e-06, "loss": 0.6824, "step": 26423 }, { "epoch": 0.5, "learning_rate": 2.6333010662369546e-06, "loss": 1.0923, "step": 26424 }, { "epoch": 0.5, "learning_rate": 2.6331485177701414e-06, "loss": 1.2461, "step": 26425 }, { "epoch": 0.5, "learning_rate": 2.6329959688061562e-06, "loss": 0.8987, "step": 26426 }, { "epoch": 0.5, "learning_rate": 2.6328434193455683e-06, "loss": 0.8013, "step": 26427 }, { "epoch": 0.5, "learning_rate": 2.6326908693889465e-06, "loss": 0.8675, "step": 26428 }, { "epoch": 0.5, "learning_rate": 2.6325383189368613e-06, "loss": 0.8932, "step": 26429 }, { "epoch": 0.5, "learning_rate": 2.632385767989882e-06, "loss": 0.8395, "step": 26430 }, { "epoch": 0.5, "learning_rate": 2.632233216548578e-06, "loss": 1.0024, "step": 26431 }, { "epoch": 0.5, "learning_rate": 2.63208066461352e-06, "loss": 1.2436, "step": 26432 }, { "epoch": 0.5, "learning_rate": 2.631928112185277e-06, "loss": 0.7662, "step": 26433 }, { "epoch": 0.5, "learning_rate": 2.6317755592644173e-06, "loss": 0.8434, "step": 26434 }, { "epoch": 0.5, "learning_rate": 2.6316230058515123e-06, "loss": 0.9233, "step": 26435 }, { "epoch": 0.5, "learning_rate": 2.6314704519471317e-06, "loss": 0.938, "step": 26436 }, { "epoch": 0.5, "learning_rate": 2.631317897551844e-06, "loss": 1.1597, "step": 26437 }, { "epoch": 0.5, "learning_rate": 2.6311653426662183e-06, "loss": 1.0251, "step": 26438 }, { "epoch": 0.5, "learning_rate": 2.6310127872908264e-06, "loss": 0.9103, "step": 26439 }, { "epoch": 0.5, "learning_rate": 2.6308602314262362e-06, "loss": 0.7588, "step": 26440 }, { "epoch": 0.5, "learning_rate": 2.630707675073018e-06, "loss": 0.9371, "step": 26441 }, { "epoch": 0.5, "learning_rate": 2.6305551182317417e-06, "loss": 0.696, "step": 26442 }, { "epoch": 0.5, "learning_rate": 2.6304025609029763e-06, "loss": 0.958, "step": 26443 }, { "epoch": 0.5, "learning_rate": 2.630250003087292e-06, "loss": 0.9637, "step": 26444 }, { "epoch": 0.5, "learning_rate": 2.630097444785258e-06, "loss": 0.9688, "step": 26445 }, { "epoch": 0.5, "learning_rate": 2.629944885997444e-06, "loss": 0.8579, "step": 26446 }, { "epoch": 0.5, "learning_rate": 2.6297923267244195e-06, "loss": 0.9276, "step": 26447 }, { "epoch": 0.5, "learning_rate": 2.629639766966756e-06, "loss": 0.8324, "step": 26448 }, { "epoch": 0.5, "learning_rate": 2.62948720672502e-06, "loss": 0.8935, "step": 26449 }, { "epoch": 0.5, "learning_rate": 2.629334645999783e-06, "loss": 1.2215, "step": 26450 }, { "epoch": 0.5, "learning_rate": 2.6291820847916145e-06, "loss": 1.0477, "step": 26451 }, { "epoch": 0.5, "learning_rate": 2.629029523101084e-06, "loss": 0.8745, "step": 26452 }, { "epoch": 0.5, "learning_rate": 2.6288769609287613e-06, "loss": 0.9086, "step": 26453 }, { "epoch": 0.5, "learning_rate": 2.6287243982752164e-06, "loss": 0.9034, "step": 26454 }, { "epoch": 0.5, "learning_rate": 2.6285718351410176e-06, "loss": 0.7356, "step": 26455 }, { "epoch": 0.5, "learning_rate": 2.6284192715267366e-06, "loss": 1.1328, "step": 26456 }, { "epoch": 0.5, "learning_rate": 2.6282667074329413e-06, "loss": 0.8357, "step": 26457 }, { "epoch": 0.5, "learning_rate": 2.6281141428602023e-06, "loss": 0.8609, "step": 26458 }, { "epoch": 0.5, "learning_rate": 2.6279615778090883e-06, "loss": 1.035, "step": 26459 }, { "epoch": 0.5, "learning_rate": 2.6278090122801707e-06, "loss": 0.854, "step": 26460 }, { "epoch": 0.5, "learning_rate": 2.6276564462740177e-06, "loss": 0.9234, "step": 26461 }, { "epoch": 0.5, "learning_rate": 2.6275038797911995e-06, "loss": 1.1448, "step": 26462 }, { "epoch": 0.5, "learning_rate": 2.6273513128322857e-06, "loss": 0.879, "step": 26463 }, { "epoch": 0.5, "learning_rate": 2.6271987453978463e-06, "loss": 1.0238, "step": 26464 }, { "epoch": 0.5, "learning_rate": 2.6270461774884506e-06, "loss": 0.9277, "step": 26465 }, { "epoch": 0.5, "learning_rate": 2.6268936091046677e-06, "loss": 0.9243, "step": 26466 }, { "epoch": 0.5, "learning_rate": 2.6267410402470685e-06, "loss": 0.7453, "step": 26467 }, { "epoch": 0.5, "learning_rate": 2.626588470916222e-06, "loss": 0.9738, "step": 26468 }, { "epoch": 0.5, "learning_rate": 2.6264359011126982e-06, "loss": 1.0509, "step": 26469 }, { "epoch": 0.5, "learning_rate": 2.626283330837067e-06, "loss": 0.8829, "step": 26470 }, { "epoch": 0.5, "learning_rate": 2.626130760089897e-06, "loss": 0.8618, "step": 26471 }, { "epoch": 0.5, "learning_rate": 2.6259781888717583e-06, "loss": 0.9484, "step": 26472 }, { "epoch": 0.5, "learning_rate": 2.625825617183222e-06, "loss": 0.7393, "step": 26473 }, { "epoch": 0.5, "learning_rate": 2.625673045024856e-06, "loss": 0.9554, "step": 26474 }, { "epoch": 0.5, "learning_rate": 2.625520472397231e-06, "loss": 0.9416, "step": 26475 }, { "epoch": 0.5, "learning_rate": 2.625367899300916e-06, "loss": 0.9626, "step": 26476 }, { "epoch": 0.5, "learning_rate": 2.6252153257364815e-06, "loss": 0.7185, "step": 26477 }, { "epoch": 0.5, "learning_rate": 2.6250627517044974e-06, "loss": 0.9028, "step": 26478 }, { "epoch": 0.5, "learning_rate": 2.6249101772055317e-06, "loss": 0.856, "step": 26479 }, { "epoch": 0.5, "learning_rate": 2.624757602240155e-06, "loss": 0.8673, "step": 26480 }, { "epoch": 0.5, "learning_rate": 2.6246050268089385e-06, "loss": 1.1193, "step": 26481 }, { "epoch": 0.5, "learning_rate": 2.62445245091245e-06, "loss": 1.0536, "step": 26482 }, { "epoch": 0.5, "learning_rate": 2.62429987455126e-06, "loss": 0.9156, "step": 26483 }, { "epoch": 0.5, "learning_rate": 2.624147297725938e-06, "loss": 0.9176, "step": 26484 }, { "epoch": 0.5, "learning_rate": 2.6239947204370534e-06, "loss": 0.9188, "step": 26485 }, { "epoch": 0.5, "learning_rate": 2.6238421426851768e-06, "loss": 0.824, "step": 26486 }, { "epoch": 0.5, "learning_rate": 2.6236895644708773e-06, "loss": 1.0537, "step": 26487 }, { "epoch": 0.5, "learning_rate": 2.6235369857947246e-06, "loss": 0.935, "step": 26488 }, { "epoch": 0.5, "learning_rate": 2.623384406657289e-06, "loss": 0.9755, "step": 26489 }, { "epoch": 0.5, "learning_rate": 2.62323182705914e-06, "loss": 0.8299, "step": 26490 }, { "epoch": 0.5, "learning_rate": 2.6230792470008463e-06, "loss": 0.8048, "step": 26491 }, { "epoch": 0.5, "learning_rate": 2.622926666482979e-06, "loss": 0.8449, "step": 26492 }, { "epoch": 0.5, "learning_rate": 2.622774085506107e-06, "loss": 1.114, "step": 26493 }, { "epoch": 0.5, "learning_rate": 2.6226215040708003e-06, "loss": 1.1472, "step": 26494 }, { "epoch": 0.5, "learning_rate": 2.6224689221776287e-06, "loss": 1.0734, "step": 26495 }, { "epoch": 0.5, "learning_rate": 2.6223163398271628e-06, "loss": 0.95, "step": 26496 }, { "epoch": 0.5, "learning_rate": 2.6221637570199703e-06, "loss": 0.775, "step": 26497 }, { "epoch": 0.5, "learning_rate": 2.622011173756622e-06, "loss": 1.1258, "step": 26498 }, { "epoch": 0.5, "learning_rate": 2.6218585900376893e-06, "loss": 0.9359, "step": 26499 }, { "epoch": 0.5, "learning_rate": 2.621706005863739e-06, "loss": 1.0314, "step": 26500 }, { "epoch": 0.5, "learning_rate": 2.6215534212353417e-06, "loss": 0.8748, "step": 26501 }, { "epoch": 0.5, "learning_rate": 2.621400836153069e-06, "loss": 0.8707, "step": 26502 }, { "epoch": 0.5, "learning_rate": 2.6212482506174886e-06, "loss": 0.9763, "step": 26503 }, { "epoch": 0.5, "learning_rate": 2.6210956646291707e-06, "loss": 0.9514, "step": 26504 }, { "epoch": 0.5, "learning_rate": 2.6209430781886863e-06, "loss": 0.838, "step": 26505 }, { "epoch": 0.5, "learning_rate": 2.6207904912966037e-06, "loss": 1.0535, "step": 26506 }, { "epoch": 0.5, "learning_rate": 2.620637903953493e-06, "loss": 0.9258, "step": 26507 }, { "epoch": 0.5, "learning_rate": 2.6204853161599235e-06, "loss": 0.9295, "step": 26508 }, { "epoch": 0.5, "learning_rate": 2.620332727916466e-06, "loss": 1.0173, "step": 26509 }, { "epoch": 0.5, "learning_rate": 2.62018013922369e-06, "loss": 0.7735, "step": 26510 }, { "epoch": 0.5, "learning_rate": 2.620027550082165e-06, "loss": 0.9536, "step": 26511 }, { "epoch": 0.5, "learning_rate": 2.6198749604924606e-06, "loss": 1.1568, "step": 26512 }, { "epoch": 0.5, "learning_rate": 2.6197223704551465e-06, "loss": 0.8108, "step": 26513 }, { "epoch": 0.5, "learning_rate": 2.619569779970793e-06, "loss": 0.889, "step": 26514 }, { "epoch": 0.5, "learning_rate": 2.61941718903997e-06, "loss": 1.0059, "step": 26515 }, { "epoch": 0.5, "learning_rate": 2.6192645976632466e-06, "loss": 1.0817, "step": 26516 }, { "epoch": 0.5, "learning_rate": 2.619112005841193e-06, "loss": 0.8641, "step": 26517 }, { "epoch": 0.5, "learning_rate": 2.6189594135743784e-06, "loss": 1.0027, "step": 26518 }, { "epoch": 0.5, "learning_rate": 2.618806820863373e-06, "loss": 0.8271, "step": 26519 }, { "epoch": 0.5, "learning_rate": 2.6186542277087473e-06, "loss": 0.8919, "step": 26520 }, { "epoch": 0.5, "learning_rate": 2.6185016341110695e-06, "loss": 0.8588, "step": 26521 }, { "epoch": 0.5, "learning_rate": 2.61834904007091e-06, "loss": 0.881, "step": 26522 }, { "epoch": 0.5, "learning_rate": 2.61819644558884e-06, "loss": 0.8815, "step": 26523 }, { "epoch": 0.5, "learning_rate": 2.6180438506654276e-06, "loss": 0.8392, "step": 26524 }, { "epoch": 0.5, "learning_rate": 2.6178912553012427e-06, "loss": 0.8292, "step": 26525 }, { "epoch": 0.5, "learning_rate": 2.617738659496856e-06, "loss": 0.6601, "step": 26526 }, { "epoch": 0.5, "learning_rate": 2.6175860632528365e-06, "loss": 0.8499, "step": 26527 }, { "epoch": 0.5, "learning_rate": 2.6174334665697544e-06, "loss": 0.8356, "step": 26528 }, { "epoch": 0.5, "learning_rate": 2.617280869448179e-06, "loss": 0.7544, "step": 26529 }, { "epoch": 0.5, "learning_rate": 2.6171282718886804e-06, "loss": 0.8885, "step": 26530 }, { "epoch": 0.5, "learning_rate": 2.6169756738918285e-06, "loss": 1.0916, "step": 26531 }, { "epoch": 0.5, "learning_rate": 2.6168230754581936e-06, "loss": 0.8649, "step": 26532 }, { "epoch": 0.5, "learning_rate": 2.6166704765883443e-06, "loss": 0.8425, "step": 26533 }, { "epoch": 0.5, "learning_rate": 2.6165178772828508e-06, "loss": 0.9945, "step": 26534 }, { "epoch": 0.5, "learning_rate": 2.616365277542284e-06, "loss": 0.9699, "step": 26535 }, { "epoch": 0.5, "learning_rate": 2.616212677367212e-06, "loss": 1.077, "step": 26536 }, { "epoch": 0.5, "learning_rate": 2.6160600767582057e-06, "loss": 0.9145, "step": 26537 }, { "epoch": 0.5, "learning_rate": 2.6159074757158347e-06, "loss": 0.8793, "step": 26538 }, { "epoch": 0.5, "learning_rate": 2.615754874240669e-06, "loss": 0.8267, "step": 26539 }, { "epoch": 0.5, "learning_rate": 2.615602272333278e-06, "loss": 0.9312, "step": 26540 }, { "epoch": 0.5, "learning_rate": 2.6154496699942317e-06, "loss": 0.8893, "step": 26541 }, { "epoch": 0.5, "learning_rate": 2.6152970672240997e-06, "loss": 0.9816, "step": 26542 }, { "epoch": 0.5, "learning_rate": 2.615144464023452e-06, "loss": 0.9754, "step": 26543 }, { "epoch": 0.5, "learning_rate": 2.614991860392858e-06, "loss": 0.8871, "step": 26544 }, { "epoch": 0.5, "learning_rate": 2.6148392563328882e-06, "loss": 1.0706, "step": 26545 }, { "epoch": 0.5, "learning_rate": 2.614686651844113e-06, "loss": 0.7478, "step": 26546 }, { "epoch": 0.5, "learning_rate": 2.6145340469271e-06, "loss": 1.1119, "step": 26547 }, { "epoch": 0.5, "learning_rate": 2.614381441582421e-06, "loss": 0.8231, "step": 26548 }, { "epoch": 0.5, "learning_rate": 2.6142288358106457e-06, "loss": 0.9381, "step": 26549 }, { "epoch": 0.5, "learning_rate": 2.6140762296123423e-06, "loss": 1.0813, "step": 26550 }, { "epoch": 0.5, "learning_rate": 2.613923622988082e-06, "loss": 0.921, "step": 26551 }, { "epoch": 0.5, "learning_rate": 2.6137710159384357e-06, "loss": 0.8719, "step": 26552 }, { "epoch": 0.5, "learning_rate": 2.613618408463971e-06, "loss": 0.8264, "step": 26553 }, { "epoch": 0.5, "learning_rate": 2.613465800565258e-06, "loss": 0.8308, "step": 26554 }, { "epoch": 0.5, "learning_rate": 2.6133131922428685e-06, "loss": 0.9623, "step": 26555 }, { "epoch": 0.5, "learning_rate": 2.6131605834973694e-06, "loss": 0.9142, "step": 26556 }, { "epoch": 0.5, "learning_rate": 2.613007974329333e-06, "loss": 0.927, "step": 26557 }, { "epoch": 0.5, "learning_rate": 2.612855364739329e-06, "loss": 0.8608, "step": 26558 }, { "epoch": 0.5, "learning_rate": 2.612702754727926e-06, "loss": 1.0513, "step": 26559 }, { "epoch": 0.5, "learning_rate": 2.612550144295694e-06, "loss": 0.9395, "step": 26560 }, { "epoch": 0.5, "learning_rate": 2.612397533443204e-06, "loss": 1.0507, "step": 26561 }, { "epoch": 0.5, "learning_rate": 2.6122449221710243e-06, "loss": 1.27, "step": 26562 }, { "epoch": 0.5, "learning_rate": 2.612092310479726e-06, "loss": 0.9636, "step": 26563 }, { "epoch": 0.5, "learning_rate": 2.6119396983698774e-06, "loss": 1.0061, "step": 26564 }, { "epoch": 0.5, "learning_rate": 2.61178708584205e-06, "loss": 0.8492, "step": 26565 }, { "epoch": 0.5, "learning_rate": 2.6116344728968133e-06, "loss": 0.8436, "step": 26566 }, { "epoch": 0.5, "learning_rate": 2.6114818595347372e-06, "loss": 0.9352, "step": 26567 }, { "epoch": 0.5, "learning_rate": 2.611329245756391e-06, "loss": 0.9918, "step": 26568 }, { "epoch": 0.5, "learning_rate": 2.6111766315623445e-06, "loss": 1.087, "step": 26569 }, { "epoch": 0.5, "learning_rate": 2.6110240169531682e-06, "loss": 1.0501, "step": 26570 }, { "epoch": 0.5, "learning_rate": 2.6108714019294312e-06, "loss": 0.9091, "step": 26571 }, { "epoch": 0.5, "learning_rate": 2.610718786491704e-06, "loss": 0.7809, "step": 26572 }, { "epoch": 0.5, "learning_rate": 2.6105661706405567e-06, "loss": 0.8884, "step": 26573 }, { "epoch": 0.5, "learning_rate": 2.610413554376558e-06, "loss": 1.1137, "step": 26574 }, { "epoch": 0.5, "learning_rate": 2.6102609377002793e-06, "loss": 1.1186, "step": 26575 }, { "epoch": 0.5, "learning_rate": 2.610108320612289e-06, "loss": 0.8885, "step": 26576 }, { "epoch": 0.5, "learning_rate": 2.609955703113157e-06, "loss": 0.9598, "step": 26577 }, { "epoch": 0.5, "learning_rate": 2.6098030852034544e-06, "loss": 0.923, "step": 26578 }, { "epoch": 0.5, "learning_rate": 2.6096504668837513e-06, "loss": 0.7732, "step": 26579 }, { "epoch": 0.5, "learning_rate": 2.6094978481546157e-06, "loss": 0.9661, "step": 26580 }, { "epoch": 0.5, "learning_rate": 2.609345229016619e-06, "loss": 0.9398, "step": 26581 }, { "epoch": 0.5, "learning_rate": 2.609192609470331e-06, "loss": 0.9774, "step": 26582 }, { "epoch": 0.5, "learning_rate": 2.60903998951632e-06, "loss": 0.8699, "step": 26583 }, { "epoch": 0.5, "learning_rate": 2.6088873691551573e-06, "loss": 1.0715, "step": 26584 }, { "epoch": 0.5, "learning_rate": 2.6087347483874125e-06, "loss": 0.6905, "step": 26585 }, { "epoch": 0.5, "learning_rate": 2.608582127213656e-06, "loss": 0.9307, "step": 26586 }, { "epoch": 0.5, "learning_rate": 2.6084295056344566e-06, "loss": 1.0338, "step": 26587 }, { "epoch": 0.5, "learning_rate": 2.608276883650385e-06, "loss": 0.9478, "step": 26588 }, { "epoch": 0.5, "learning_rate": 2.6081242612620113e-06, "loss": 0.8906, "step": 26589 }, { "epoch": 0.5, "learning_rate": 2.6079716384699043e-06, "loss": 0.804, "step": 26590 }, { "epoch": 0.5, "learning_rate": 2.6078190152746346e-06, "loss": 0.8812, "step": 26591 }, { "epoch": 0.5, "learning_rate": 2.607666391676772e-06, "loss": 0.8493, "step": 26592 }, { "epoch": 0.5, "learning_rate": 2.607513767676886e-06, "loss": 1.0592, "step": 26593 }, { "epoch": 0.5, "learning_rate": 2.607361143275548e-06, "loss": 0.8874, "step": 26594 }, { "epoch": 0.5, "learning_rate": 2.607208518473326e-06, "loss": 1.1476, "step": 26595 }, { "epoch": 0.5, "learning_rate": 2.6070558932707905e-06, "loss": 0.9291, "step": 26596 }, { "epoch": 0.5, "learning_rate": 2.6069032676685124e-06, "loss": 0.9938, "step": 26597 }, { "epoch": 0.5, "learning_rate": 2.60675064166706e-06, "loss": 0.8095, "step": 26598 }, { "epoch": 0.5, "learning_rate": 2.606598015267004e-06, "loss": 1.0016, "step": 26599 }, { "epoch": 0.5, "learning_rate": 2.606445388468915e-06, "loss": 1.0914, "step": 26600 }, { "epoch": 0.5, "learning_rate": 2.606292761273362e-06, "loss": 0.8903, "step": 26601 }, { "epoch": 0.5, "learning_rate": 2.6061401336809142e-06, "loss": 0.8558, "step": 26602 }, { "epoch": 0.5, "learning_rate": 2.6059875056921437e-06, "loss": 0.6751, "step": 26603 }, { "epoch": 0.5, "learning_rate": 2.605834877307618e-06, "loss": 0.7057, "step": 26604 }, { "epoch": 0.5, "learning_rate": 2.605682248527909e-06, "loss": 0.746, "step": 26605 }, { "epoch": 0.5, "learning_rate": 2.6055296193535844e-06, "loss": 1.0582, "step": 26606 }, { "epoch": 0.5, "learning_rate": 2.6053769897852164e-06, "loss": 1.0936, "step": 26607 }, { "epoch": 0.5, "learning_rate": 2.605224359823374e-06, "loss": 1.0023, "step": 26608 }, { "epoch": 0.5, "learning_rate": 2.6050717294686274e-06, "loss": 0.8039, "step": 26609 }, { "epoch": 0.5, "learning_rate": 2.6049190987215457e-06, "loss": 0.7849, "step": 26610 }, { "epoch": 0.5, "learning_rate": 2.604766467582699e-06, "loss": 0.9254, "step": 26611 }, { "epoch": 0.5, "learning_rate": 2.6046138360526573e-06, "loss": 1.123, "step": 26612 }, { "epoch": 0.5, "learning_rate": 2.604461204131991e-06, "loss": 1.1296, "step": 26613 }, { "epoch": 0.5, "learning_rate": 2.60430857182127e-06, "loss": 0.8923, "step": 26614 }, { "epoch": 0.5, "learning_rate": 2.6041559391210647e-06, "loss": 1.0187, "step": 26615 }, { "epoch": 0.5, "learning_rate": 2.6040033060319436e-06, "loss": 0.8559, "step": 26616 }, { "epoch": 0.5, "learning_rate": 2.603850672554477e-06, "loss": 0.98, "step": 26617 }, { "epoch": 0.5, "learning_rate": 2.6036980386892362e-06, "loss": 1.1618, "step": 26618 }, { "epoch": 0.5, "learning_rate": 2.6035454044367887e-06, "loss": 1.0673, "step": 26619 }, { "epoch": 0.5, "learning_rate": 2.6033927697977063e-06, "loss": 0.8156, "step": 26620 }, { "epoch": 0.5, "learning_rate": 2.6032401347725593e-06, "loss": 0.807, "step": 26621 }, { "epoch": 0.5, "learning_rate": 2.6030874993619166e-06, "loss": 0.8599, "step": 26622 }, { "epoch": 0.5, "learning_rate": 2.6029348635663474e-06, "loss": 0.7578, "step": 26623 }, { "epoch": 0.5, "learning_rate": 2.602782227386424e-06, "loss": 1.0942, "step": 26624 }, { "epoch": 0.5, "learning_rate": 2.602629590822714e-06, "loss": 1.0652, "step": 26625 }, { "epoch": 0.5, "learning_rate": 2.602476953875788e-06, "loss": 0.7519, "step": 26626 }, { "epoch": 0.5, "learning_rate": 2.6023243165462166e-06, "loss": 0.7681, "step": 26627 }, { "epoch": 0.5, "learning_rate": 2.602171678834569e-06, "loss": 0.8802, "step": 26628 }, { "epoch": 0.5, "learning_rate": 2.6020190407414154e-06, "loss": 0.8463, "step": 26629 }, { "epoch": 0.5, "learning_rate": 2.601866402267327e-06, "loss": 0.8539, "step": 26630 }, { "epoch": 0.5, "learning_rate": 2.6017137634128715e-06, "loss": 0.9578, "step": 26631 }, { "epoch": 0.5, "learning_rate": 2.60156112417862e-06, "loss": 0.9665, "step": 26632 }, { "epoch": 0.5, "learning_rate": 2.6014084845651426e-06, "loss": 0.9763, "step": 26633 }, { "epoch": 0.5, "learning_rate": 2.6012558445730084e-06, "loss": 0.9212, "step": 26634 }, { "epoch": 0.5, "learning_rate": 2.6011032042027887e-06, "loss": 0.8559, "step": 26635 }, { "epoch": 0.5, "learning_rate": 2.600950563455053e-06, "loss": 0.8116, "step": 26636 }, { "epoch": 0.5, "learning_rate": 2.600797922330371e-06, "loss": 0.9864, "step": 26637 }, { "epoch": 0.5, "learning_rate": 2.600645280829312e-06, "loss": 0.9569, "step": 26638 }, { "epoch": 0.5, "learning_rate": 2.600492638952447e-06, "loss": 0.8762, "step": 26639 }, { "epoch": 0.5, "learning_rate": 2.600339996700345e-06, "loss": 0.9852, "step": 26640 }, { "epoch": 0.5, "learning_rate": 2.600187354073577e-06, "loss": 0.9148, "step": 26641 }, { "epoch": 0.5, "learning_rate": 2.6000347110727126e-06, "loss": 0.673, "step": 26642 }, { "epoch": 0.5, "learning_rate": 2.5998820676983216e-06, "loss": 0.8552, "step": 26643 }, { "epoch": 0.5, "learning_rate": 2.5997294239509736e-06, "loss": 0.8381, "step": 26644 }, { "epoch": 0.5, "learning_rate": 2.59957677983124e-06, "loss": 0.7269, "step": 26645 }, { "epoch": 0.5, "learning_rate": 2.5994241353396886e-06, "loss": 0.9924, "step": 26646 }, { "epoch": 0.5, "learning_rate": 2.5992714904768914e-06, "loss": 0.8053, "step": 26647 }, { "epoch": 0.5, "learning_rate": 2.599118845243417e-06, "loss": 0.9147, "step": 26648 }, { "epoch": 0.5, "learning_rate": 2.598966199639835e-06, "loss": 1.0298, "step": 26649 }, { "epoch": 0.5, "learning_rate": 2.5988135536667174e-06, "loss": 1.1544, "step": 26650 }, { "epoch": 0.5, "learning_rate": 2.5986609073246334e-06, "loss": 0.8447, "step": 26651 }, { "epoch": 0.5, "learning_rate": 2.598508260614152e-06, "loss": 0.9144, "step": 26652 }, { "epoch": 0.5, "learning_rate": 2.5983556135358434e-06, "loss": 0.9212, "step": 26653 }, { "epoch": 0.5, "learning_rate": 2.5982029660902784e-06, "loss": 0.8589, "step": 26654 }, { "epoch": 0.5, "learning_rate": 2.5980503182780264e-06, "loss": 1.0672, "step": 26655 }, { "epoch": 0.5, "learning_rate": 2.5978976700996585e-06, "loss": 1.0198, "step": 26656 }, { "epoch": 0.5, "learning_rate": 2.597745021555742e-06, "loss": 0.9895, "step": 26657 }, { "epoch": 0.5, "learning_rate": 2.597592372646849e-06, "loss": 0.7946, "step": 26658 }, { "epoch": 0.5, "learning_rate": 2.5974397233735505e-06, "loss": 0.8518, "step": 26659 }, { "epoch": 0.5, "learning_rate": 2.5972870737364144e-06, "loss": 0.7968, "step": 26660 }, { "epoch": 0.5, "learning_rate": 2.5971344237360095e-06, "loss": 0.7, "step": 26661 }, { "epoch": 0.5, "learning_rate": 2.5969817733729098e-06, "loss": 1.0295, "step": 26662 }, { "epoch": 0.5, "learning_rate": 2.5968291226476827e-06, "loss": 0.9905, "step": 26663 }, { "epoch": 0.5, "learning_rate": 2.596676471560898e-06, "loss": 0.9431, "step": 26664 }, { "epoch": 0.5, "learning_rate": 2.5965238201131272e-06, "loss": 0.8227, "step": 26665 }, { "epoch": 0.5, "learning_rate": 2.5963711683049385e-06, "loss": 0.9361, "step": 26666 }, { "epoch": 0.5, "learning_rate": 2.5962185161369035e-06, "loss": 0.812, "step": 26667 }, { "epoch": 0.5, "learning_rate": 2.596065863609591e-06, "loss": 1.0524, "step": 26668 }, { "epoch": 0.5, "learning_rate": 2.595913210723572e-06, "loss": 0.9326, "step": 26669 }, { "epoch": 0.5, "learning_rate": 2.5957605574794153e-06, "loss": 0.9351, "step": 26670 }, { "epoch": 0.5, "learning_rate": 2.5956079038776927e-06, "loss": 0.7345, "step": 26671 }, { "epoch": 0.5, "learning_rate": 2.595455249918972e-06, "loss": 0.848, "step": 26672 }, { "epoch": 0.5, "learning_rate": 2.5953025956038245e-06, "loss": 0.7456, "step": 26673 }, { "epoch": 0.5, "learning_rate": 2.5951499409328207e-06, "loss": 1.0372, "step": 26674 }, { "epoch": 0.5, "learning_rate": 2.5949972859065293e-06, "loss": 0.8493, "step": 26675 }, { "epoch": 0.5, "learning_rate": 2.594844630525521e-06, "loss": 0.9878, "step": 26676 }, { "epoch": 0.5, "learning_rate": 2.5946919747903667e-06, "loss": 0.9614, "step": 26677 }, { "epoch": 0.5, "learning_rate": 2.5945393187016342e-06, "loss": 0.9207, "step": 26678 }, { "epoch": 0.5, "learning_rate": 2.5943866622598957e-06, "loss": 0.8416, "step": 26679 }, { "epoch": 0.5, "learning_rate": 2.59423400546572e-06, "loss": 1.1174, "step": 26680 }, { "epoch": 0.5, "learning_rate": 2.5940813483196774e-06, "loss": 0.9194, "step": 26681 }, { "epoch": 0.5, "learning_rate": 2.5939286908223372e-06, "loss": 0.9045, "step": 26682 }, { "epoch": 0.5, "learning_rate": 2.593776032974271e-06, "loss": 0.837, "step": 26683 }, { "epoch": 0.5, "learning_rate": 2.593623374776048e-06, "loss": 0.7322, "step": 26684 }, { "epoch": 0.5, "learning_rate": 2.593470716228238e-06, "loss": 0.902, "step": 26685 }, { "epoch": 0.5, "learning_rate": 2.5933180573314114e-06, "loss": 0.7812, "step": 26686 }, { "epoch": 0.5, "learning_rate": 2.593165398086138e-06, "loss": 0.9573, "step": 26687 }, { "epoch": 0.5, "learning_rate": 2.593012738492988e-06, "loss": 0.8683, "step": 26688 }, { "epoch": 0.5, "learning_rate": 2.5928600785525306e-06, "loss": 0.9885, "step": 26689 }, { "epoch": 0.5, "learning_rate": 2.5927074182653367e-06, "loss": 0.854, "step": 26690 }, { "epoch": 0.5, "learning_rate": 2.592554757631976e-06, "loss": 0.9722, "step": 26691 }, { "epoch": 0.5, "learning_rate": 2.5924020966530196e-06, "loss": 0.9036, "step": 26692 }, { "epoch": 0.5, "learning_rate": 2.5922494353290357e-06, "loss": 1.0656, "step": 26693 }, { "epoch": 0.5, "learning_rate": 2.5920967736605957e-06, "loss": 0.9904, "step": 26694 }, { "epoch": 0.5, "learning_rate": 2.5919441116482683e-06, "loss": 1.0043, "step": 26695 }, { "epoch": 0.5, "learning_rate": 2.5917914492926254e-06, "loss": 0.9167, "step": 26696 }, { "epoch": 0.5, "learning_rate": 2.5916387865942353e-06, "loss": 0.7224, "step": 26697 }, { "epoch": 0.5, "learning_rate": 2.5914861235536705e-06, "loss": 0.8388, "step": 26698 }, { "epoch": 0.5, "learning_rate": 2.5913334601714974e-06, "loss": 0.8453, "step": 26699 }, { "epoch": 0.5, "learning_rate": 2.591180796448289e-06, "loss": 1.194, "step": 26700 }, { "epoch": 0.5, "learning_rate": 2.591028132384614e-06, "loss": 0.9107, "step": 26701 }, { "epoch": 0.5, "learning_rate": 2.590875467981042e-06, "loss": 0.9825, "step": 26702 }, { "epoch": 0.5, "learning_rate": 2.5907228032381444e-06, "loss": 0.9944, "step": 26703 }, { "epoch": 0.5, "learning_rate": 2.590570138156491e-06, "loss": 0.9855, "step": 26704 }, { "epoch": 0.5, "learning_rate": 2.590417472736651e-06, "loss": 1.0091, "step": 26705 }, { "epoch": 0.5, "learning_rate": 2.590264806979195e-06, "loss": 0.9695, "step": 26706 }, { "epoch": 0.5, "learning_rate": 2.5901121408846937e-06, "loss": 0.8711, "step": 26707 }, { "epoch": 0.5, "learning_rate": 2.589959474453716e-06, "loss": 0.8392, "step": 26708 }, { "epoch": 0.5, "learning_rate": 2.5898068076868323e-06, "loss": 1.0432, "step": 26709 }, { "epoch": 0.5, "learning_rate": 2.589654140584612e-06, "loss": 0.965, "step": 26710 }, { "epoch": 0.5, "learning_rate": 2.5895014731476265e-06, "loss": 0.7692, "step": 26711 }, { "epoch": 0.5, "learning_rate": 2.589348805376445e-06, "loss": 0.9219, "step": 26712 }, { "epoch": 0.5, "learning_rate": 2.5891961372716384e-06, "loss": 0.9671, "step": 26713 }, { "epoch": 0.5, "learning_rate": 2.5890434688337763e-06, "loss": 0.9224, "step": 26714 }, { "epoch": 0.5, "learning_rate": 2.588890800063428e-06, "loss": 0.9628, "step": 26715 }, { "epoch": 0.5, "learning_rate": 2.5887381309611638e-06, "loss": 0.9394, "step": 26716 }, { "epoch": 0.5, "learning_rate": 2.5885854615275547e-06, "loss": 0.7356, "step": 26717 }, { "epoch": 0.5, "learning_rate": 2.58843279176317e-06, "loss": 1.0806, "step": 26718 }, { "epoch": 0.5, "learning_rate": 2.5882801216685805e-06, "loss": 0.8947, "step": 26719 }, { "epoch": 0.5, "learning_rate": 2.5881274512443554e-06, "loss": 0.8589, "step": 26720 }, { "epoch": 0.5, "learning_rate": 2.587974780491065e-06, "loss": 0.8498, "step": 26721 }, { "epoch": 0.5, "learning_rate": 2.5878221094092796e-06, "loss": 0.9843, "step": 26722 }, { "epoch": 0.5, "learning_rate": 2.5876694379995686e-06, "loss": 0.9395, "step": 26723 }, { "epoch": 0.5, "learning_rate": 2.587516766262503e-06, "loss": 0.9312, "step": 26724 }, { "epoch": 0.5, "learning_rate": 2.587364094198653e-06, "loss": 1.0031, "step": 26725 }, { "epoch": 0.5, "learning_rate": 2.5872114218085876e-06, "loss": 0.8512, "step": 26726 }, { "epoch": 0.5, "learning_rate": 2.587058749092877e-06, "loss": 0.908, "step": 26727 }, { "epoch": 0.5, "learning_rate": 2.586906076052093e-06, "loss": 0.9744, "step": 26728 }, { "epoch": 0.5, "learning_rate": 2.5867534026868036e-06, "loss": 0.7474, "step": 26729 }, { "epoch": 0.5, "learning_rate": 2.586600728997579e-06, "loss": 1.1042, "step": 26730 }, { "epoch": 0.5, "learning_rate": 2.586448054984991e-06, "loss": 0.9869, "step": 26731 }, { "epoch": 0.5, "learning_rate": 2.5862953806496077e-06, "loss": 0.9458, "step": 26732 }, { "epoch": 0.5, "learning_rate": 2.586142705992001e-06, "loss": 0.9672, "step": 26733 }, { "epoch": 0.5, "learning_rate": 2.58599003101274e-06, "loss": 0.9223, "step": 26734 }, { "epoch": 0.5, "learning_rate": 2.5858373557123945e-06, "loss": 0.7929, "step": 26735 }, { "epoch": 0.5, "learning_rate": 2.5856846800915346e-06, "loss": 0.798, "step": 26736 }, { "epoch": 0.5, "learning_rate": 2.585532004150731e-06, "loss": 1.2078, "step": 26737 }, { "epoch": 0.5, "learning_rate": 2.585379327890554e-06, "loss": 1.0994, "step": 26738 }, { "epoch": 0.5, "learning_rate": 2.5852266513115722e-06, "loss": 0.9973, "step": 26739 }, { "epoch": 0.5, "learning_rate": 2.5850739744143578e-06, "loss": 0.7912, "step": 26740 }, { "epoch": 0.5, "learning_rate": 2.5849212971994793e-06, "loss": 0.9258, "step": 26741 }, { "epoch": 0.5, "learning_rate": 2.584768619667507e-06, "loss": 0.7696, "step": 26742 }, { "epoch": 0.5, "learning_rate": 2.584615941819012e-06, "loss": 1.0201, "step": 26743 }, { "epoch": 0.5, "learning_rate": 2.5844632636545623e-06, "loss": 0.9276, "step": 26744 }, { "epoch": 0.5, "learning_rate": 2.5843105851747308e-06, "loss": 0.8718, "step": 26745 }, { "epoch": 0.5, "learning_rate": 2.584157906380086e-06, "loss": 0.7055, "step": 26746 }, { "epoch": 0.5, "learning_rate": 2.5840052272711973e-06, "loss": 0.7154, "step": 26747 }, { "epoch": 0.5, "learning_rate": 2.5838525478486367e-06, "loss": 0.913, "step": 26748 }, { "epoch": 0.5, "learning_rate": 2.583699868112973e-06, "loss": 0.7194, "step": 26749 }, { "epoch": 0.5, "learning_rate": 2.583547188064776e-06, "loss": 1.1492, "step": 26750 }, { "epoch": 0.5, "learning_rate": 2.5833945077046164e-06, "loss": 0.7085, "step": 26751 }, { "epoch": 0.5, "learning_rate": 2.5832418270330647e-06, "loss": 0.931, "step": 26752 }, { "epoch": 0.5, "learning_rate": 2.5830891460506904e-06, "loss": 0.7652, "step": 26753 }, { "epoch": 0.5, "learning_rate": 2.5829364647580636e-06, "loss": 0.6808, "step": 26754 }, { "epoch": 0.5, "learning_rate": 2.582783783155755e-06, "loss": 0.8931, "step": 26755 }, { "epoch": 0.5, "learning_rate": 2.582631101244334e-06, "loss": 1.1783, "step": 26756 }, { "epoch": 0.5, "learning_rate": 2.582478419024371e-06, "loss": 0.9968, "step": 26757 }, { "epoch": 0.5, "learning_rate": 2.582325736496436e-06, "loss": 0.895, "step": 26758 }, { "epoch": 0.5, "learning_rate": 2.582173053661099e-06, "loss": 1.0027, "step": 26759 }, { "epoch": 0.5, "learning_rate": 2.5820203705189305e-06, "loss": 0.7445, "step": 26760 }, { "epoch": 0.5, "learning_rate": 2.581867687070501e-06, "loss": 1.0096, "step": 26761 }, { "epoch": 0.5, "learning_rate": 2.58171500331638e-06, "loss": 0.9773, "step": 26762 }, { "epoch": 0.5, "learning_rate": 2.581562319257137e-06, "loss": 0.9868, "step": 26763 }, { "epoch": 0.5, "learning_rate": 2.5814096348933436e-06, "loss": 0.8474, "step": 26764 }, { "epoch": 0.5, "learning_rate": 2.5812569502255683e-06, "loss": 0.7553, "step": 26765 }, { "epoch": 0.5, "learning_rate": 2.581104265254383e-06, "loss": 1.044, "step": 26766 }, { "epoch": 0.51, "learning_rate": 2.5809515799803565e-06, "loss": 0.9048, "step": 26767 }, { "epoch": 0.51, "learning_rate": 2.5807988944040592e-06, "loss": 0.944, "step": 26768 }, { "epoch": 0.51, "learning_rate": 2.5806462085260606e-06, "loss": 0.9767, "step": 26769 }, { "epoch": 0.51, "learning_rate": 2.580493522346933e-06, "loss": 0.7391, "step": 26770 }, { "epoch": 0.51, "learning_rate": 2.5803408358672437e-06, "loss": 0.6536, "step": 26771 }, { "epoch": 0.51, "learning_rate": 2.5801881490875646e-06, "loss": 0.8478, "step": 26772 }, { "epoch": 0.51, "learning_rate": 2.5800354620084656e-06, "loss": 0.8904, "step": 26773 }, { "epoch": 0.51, "learning_rate": 2.579882774630516e-06, "loss": 1.0757, "step": 26774 }, { "epoch": 0.51, "learning_rate": 2.5797300869542878e-06, "loss": 1.0944, "step": 26775 }, { "epoch": 0.51, "learning_rate": 2.579577398980349e-06, "loss": 0.7403, "step": 26776 }, { "epoch": 0.51, "learning_rate": 2.5794247107092705e-06, "loss": 0.9089, "step": 26777 }, { "epoch": 0.51, "learning_rate": 2.5792720221416234e-06, "loss": 1.0204, "step": 26778 }, { "epoch": 0.51, "learning_rate": 2.5791193332779765e-06, "loss": 0.7308, "step": 26779 }, { "epoch": 0.51, "learning_rate": 2.5789666441189e-06, "loss": 1.0157, "step": 26780 }, { "epoch": 0.51, "learning_rate": 2.5788139546649655e-06, "loss": 1.1177, "step": 26781 }, { "epoch": 0.51, "learning_rate": 2.5786612649167413e-06, "loss": 0.934, "step": 26782 }, { "epoch": 0.51, "learning_rate": 2.5785085748747986e-06, "loss": 0.8189, "step": 26783 }, { "epoch": 0.51, "learning_rate": 2.5783558845397076e-06, "loss": 1.1484, "step": 26784 }, { "epoch": 0.51, "learning_rate": 2.578203193912038e-06, "loss": 0.8046, "step": 26785 }, { "epoch": 0.51, "learning_rate": 2.5780505029923586e-06, "loss": 0.9345, "step": 26786 }, { "epoch": 0.51, "learning_rate": 2.577897811781243e-06, "loss": 0.9125, "step": 26787 }, { "epoch": 0.51, "learning_rate": 2.577745120279259e-06, "loss": 1.0483, "step": 26788 }, { "epoch": 0.51, "learning_rate": 2.5775924284869763e-06, "loss": 1.0242, "step": 26789 }, { "epoch": 0.51, "learning_rate": 2.5774397364049663e-06, "loss": 1.152, "step": 26790 }, { "epoch": 0.51, "learning_rate": 2.5772870440337986e-06, "loss": 0.7513, "step": 26791 }, { "epoch": 0.51, "learning_rate": 2.577134351374044e-06, "loss": 0.8396, "step": 26792 }, { "epoch": 0.51, "learning_rate": 2.5769816584262713e-06, "loss": 1.0378, "step": 26793 }, { "epoch": 0.51, "learning_rate": 2.5768289651910516e-06, "loss": 1.0383, "step": 26794 }, { "epoch": 0.51, "learning_rate": 2.5766762716689547e-06, "loss": 0.7321, "step": 26795 }, { "epoch": 0.51, "learning_rate": 2.5765235778605517e-06, "loss": 0.9981, "step": 26796 }, { "epoch": 0.51, "learning_rate": 2.576370883766412e-06, "loss": 0.8388, "step": 26797 }, { "epoch": 0.51, "learning_rate": 2.5762181893871053e-06, "loss": 0.7881, "step": 26798 }, { "epoch": 0.51, "learning_rate": 2.5760654947232024e-06, "loss": 1.0279, "step": 26799 }, { "epoch": 0.51, "learning_rate": 2.5759127997752725e-06, "loss": 1.0981, "step": 26800 }, { "epoch": 0.51, "learning_rate": 2.5757601045438876e-06, "loss": 0.7807, "step": 26801 }, { "epoch": 0.51, "learning_rate": 2.575607409029617e-06, "loss": 0.8866, "step": 26802 }, { "epoch": 0.51, "learning_rate": 2.5754547132330295e-06, "loss": 0.8988, "step": 26803 }, { "epoch": 0.51, "learning_rate": 2.575302017154697e-06, "loss": 0.9745, "step": 26804 }, { "epoch": 0.51, "learning_rate": 2.5751493207951893e-06, "loss": 0.9698, "step": 26805 }, { "epoch": 0.51, "learning_rate": 2.574996624155076e-06, "loss": 1.0984, "step": 26806 }, { "epoch": 0.51, "learning_rate": 2.5748439272349272e-06, "loss": 0.9548, "step": 26807 }, { "epoch": 0.51, "learning_rate": 2.5746912300353143e-06, "loss": 0.7708, "step": 26808 }, { "epoch": 0.51, "learning_rate": 2.574538532556806e-06, "loss": 0.9512, "step": 26809 }, { "epoch": 0.51, "learning_rate": 2.5743858347999734e-06, "loss": 1.0047, "step": 26810 }, { "epoch": 0.51, "learning_rate": 2.5742331367653872e-06, "loss": 0.8509, "step": 26811 }, { "epoch": 0.51, "learning_rate": 2.5740804384536154e-06, "loss": 0.9831, "step": 26812 }, { "epoch": 0.51, "learning_rate": 2.57392773986523e-06, "loss": 1.1179, "step": 26813 }, { "epoch": 0.51, "learning_rate": 2.573775041000801e-06, "loss": 0.8389, "step": 26814 }, { "epoch": 0.51, "learning_rate": 2.573622341860898e-06, "loss": 0.8416, "step": 26815 }, { "epoch": 0.51, "learning_rate": 2.573469642446091e-06, "loss": 0.723, "step": 26816 }, { "epoch": 0.51, "learning_rate": 2.5733169427569517e-06, "loss": 0.8949, "step": 26817 }, { "epoch": 0.51, "learning_rate": 2.5731642427940484e-06, "loss": 1.2982, "step": 26818 }, { "epoch": 0.51, "learning_rate": 2.573011542557952e-06, "loss": 0.8752, "step": 26819 }, { "epoch": 0.51, "learning_rate": 2.572858842049233e-06, "loss": 1.0865, "step": 26820 }, { "epoch": 0.51, "learning_rate": 2.572706141268461e-06, "loss": 0.8476, "step": 26821 }, { "epoch": 0.51, "learning_rate": 2.5725534402162067e-06, "loss": 0.8584, "step": 26822 }, { "epoch": 0.51, "learning_rate": 2.5724007388930405e-06, "loss": 1.0649, "step": 26823 }, { "epoch": 0.51, "learning_rate": 2.572248037299532e-06, "loss": 1.0786, "step": 26824 }, { "epoch": 0.51, "learning_rate": 2.572095335436251e-06, "loss": 1.1751, "step": 26825 }, { "epoch": 0.51, "learning_rate": 2.5719426333037687e-06, "loss": 0.7733, "step": 26826 }, { "epoch": 0.51, "learning_rate": 2.5717899309026544e-06, "loss": 0.9041, "step": 26827 }, { "epoch": 0.51, "learning_rate": 2.5716372282334783e-06, "loss": 0.8671, "step": 26828 }, { "epoch": 0.51, "learning_rate": 2.5714845252968126e-06, "loss": 0.801, "step": 26829 }, { "epoch": 0.51, "learning_rate": 2.5713318220932243e-06, "loss": 0.8188, "step": 26830 }, { "epoch": 0.51, "learning_rate": 2.571179118623286e-06, "loss": 0.9969, "step": 26831 }, { "epoch": 0.51, "learning_rate": 2.5710264148875668e-06, "loss": 0.9284, "step": 26832 }, { "epoch": 0.51, "learning_rate": 2.570873710886637e-06, "loss": 0.8477, "step": 26833 }, { "epoch": 0.51, "learning_rate": 2.5707210066210674e-06, "loss": 0.7881, "step": 26834 }, { "epoch": 0.51, "learning_rate": 2.5705683020914275e-06, "loss": 0.9771, "step": 26835 }, { "epoch": 0.51, "learning_rate": 2.5704155972982874e-06, "loss": 0.9098, "step": 26836 }, { "epoch": 0.51, "learning_rate": 2.570262892242218e-06, "loss": 1.0063, "step": 26837 }, { "epoch": 0.51, "learning_rate": 2.5701101869237894e-06, "loss": 0.9796, "step": 26838 }, { "epoch": 0.51, "learning_rate": 2.5699574813435707e-06, "loss": 0.9049, "step": 26839 }, { "epoch": 0.51, "learning_rate": 2.5698047755021334e-06, "loss": 0.8242, "step": 26840 }, { "epoch": 0.51, "learning_rate": 2.569652069400047e-06, "loss": 0.595, "step": 26841 }, { "epoch": 0.51, "learning_rate": 2.569499363037882e-06, "loss": 0.9204, "step": 26842 }, { "epoch": 0.51, "learning_rate": 2.5693466564162082e-06, "loss": 1.1159, "step": 26843 }, { "epoch": 0.51, "learning_rate": 2.569193949535597e-06, "loss": 1.1592, "step": 26844 }, { "epoch": 0.51, "learning_rate": 2.569041242396617e-06, "loss": 1.045, "step": 26845 }, { "epoch": 0.51, "learning_rate": 2.568888534999839e-06, "loss": 0.689, "step": 26846 }, { "epoch": 0.51, "learning_rate": 2.5687358273458348e-06, "loss": 0.7376, "step": 26847 }, { "epoch": 0.51, "learning_rate": 2.5685831194351714e-06, "loss": 0.8014, "step": 26848 }, { "epoch": 0.51, "learning_rate": 2.5684304112684207e-06, "loss": 0.9673, "step": 26849 }, { "epoch": 0.51, "learning_rate": 2.568277702846154e-06, "loss": 1.0425, "step": 26850 }, { "epoch": 0.51, "learning_rate": 2.5681249941689397e-06, "loss": 1.0002, "step": 26851 }, { "epoch": 0.51, "learning_rate": 2.567972285237349e-06, "loss": 0.8032, "step": 26852 }, { "epoch": 0.51, "learning_rate": 2.5678195760519524e-06, "loss": 0.8918, "step": 26853 }, { "epoch": 0.51, "learning_rate": 2.567666866613319e-06, "loss": 0.8537, "step": 26854 }, { "epoch": 0.51, "learning_rate": 2.5675141569220196e-06, "loss": 0.9946, "step": 26855 }, { "epoch": 0.51, "learning_rate": 2.5673614469786245e-06, "loss": 1.0482, "step": 26856 }, { "epoch": 0.51, "learning_rate": 2.5672087367837034e-06, "loss": 0.9402, "step": 26857 }, { "epoch": 0.51, "learning_rate": 2.5670560263378275e-06, "loss": 0.8327, "step": 26858 }, { "epoch": 0.51, "learning_rate": 2.5669033156415667e-06, "loss": 0.9104, "step": 26859 }, { "epoch": 0.51, "learning_rate": 2.5667506046954904e-06, "loss": 0.9426, "step": 26860 }, { "epoch": 0.51, "learning_rate": 2.5665978935001696e-06, "loss": 0.7892, "step": 26861 }, { "epoch": 0.51, "learning_rate": 2.5664451820561743e-06, "loss": 0.9608, "step": 26862 }, { "epoch": 0.51, "learning_rate": 2.566292470364074e-06, "loss": 1.1393, "step": 26863 }, { "epoch": 0.51, "learning_rate": 2.566139758424441e-06, "loss": 0.8337, "step": 26864 }, { "epoch": 0.51, "learning_rate": 2.5659870462378434e-06, "loss": 0.6765, "step": 26865 }, { "epoch": 0.51, "learning_rate": 2.5658343338048524e-06, "loss": 0.9102, "step": 26866 }, { "epoch": 0.51, "learning_rate": 2.5656816211260376e-06, "loss": 0.8237, "step": 26867 }, { "epoch": 0.51, "learning_rate": 2.565528908201971e-06, "loss": 1.0747, "step": 26868 }, { "epoch": 0.51, "learning_rate": 2.5653761950332195e-06, "loss": 0.9833, "step": 26869 }, { "epoch": 0.51, "learning_rate": 2.565223481620356e-06, "loss": 0.9262, "step": 26870 }, { "epoch": 0.51, "learning_rate": 2.5650707679639508e-06, "loss": 0.8311, "step": 26871 }, { "epoch": 0.51, "learning_rate": 2.5649180540645726e-06, "loss": 0.7755, "step": 26872 }, { "epoch": 0.51, "learning_rate": 2.564765339922792e-06, "loss": 1.0161, "step": 26873 }, { "epoch": 0.51, "learning_rate": 2.564612625539181e-06, "loss": 1.0282, "step": 26874 }, { "epoch": 0.51, "learning_rate": 2.5644599109143075e-06, "loss": 1.0554, "step": 26875 }, { "epoch": 0.51, "learning_rate": 2.5643071960487425e-06, "loss": 0.7967, "step": 26876 }, { "epoch": 0.51, "learning_rate": 2.564154480943057e-06, "loss": 0.7971, "step": 26877 }, { "epoch": 0.51, "learning_rate": 2.56400176559782e-06, "loss": 0.8226, "step": 26878 }, { "epoch": 0.51, "learning_rate": 2.5638490500136027e-06, "loss": 0.7032, "step": 26879 }, { "epoch": 0.51, "learning_rate": 2.5636963341909756e-06, "loss": 0.941, "step": 26880 }, { "epoch": 0.51, "learning_rate": 2.563543618130507e-06, "loss": 0.9619, "step": 26881 }, { "epoch": 0.51, "learning_rate": 2.563390901832769e-06, "loss": 1.1929, "step": 26882 }, { "epoch": 0.51, "learning_rate": 2.563238185298332e-06, "loss": 0.7521, "step": 26883 }, { "epoch": 0.51, "learning_rate": 2.5630854685277645e-06, "loss": 0.9927, "step": 26884 }, { "epoch": 0.51, "learning_rate": 2.5629327515216384e-06, "loss": 0.7692, "step": 26885 }, { "epoch": 0.51, "learning_rate": 2.562780034280524e-06, "loss": 0.8218, "step": 26886 }, { "epoch": 0.51, "learning_rate": 2.56262731680499e-06, "loss": 1.1866, "step": 26887 }, { "epoch": 0.51, "learning_rate": 2.5624745990956075e-06, "loss": 1.1895, "step": 26888 }, { "epoch": 0.51, "learning_rate": 2.5623218811529476e-06, "loss": 1.04, "step": 26889 }, { "epoch": 0.51, "learning_rate": 2.5621691629775785e-06, "loss": 0.8951, "step": 26890 }, { "epoch": 0.51, "learning_rate": 2.5620164445700724e-06, "loss": 0.8371, "step": 26891 }, { "epoch": 0.51, "learning_rate": 2.5618637259309985e-06, "loss": 1.1023, "step": 26892 }, { "epoch": 0.51, "learning_rate": 2.5617110070609273e-06, "loss": 1.0865, "step": 26893 }, { "epoch": 0.51, "learning_rate": 2.56155828796043e-06, "loss": 1.1901, "step": 26894 }, { "epoch": 0.51, "learning_rate": 2.561405568630075e-06, "loss": 0.9547, "step": 26895 }, { "epoch": 0.51, "learning_rate": 2.5612528490704336e-06, "loss": 1.0721, "step": 26896 }, { "epoch": 0.51, "learning_rate": 2.561100129282076e-06, "loss": 0.8901, "step": 26897 }, { "epoch": 0.51, "learning_rate": 2.560947409265572e-06, "loss": 0.9192, "step": 26898 }, { "epoch": 0.51, "learning_rate": 2.5607946890214924e-06, "loss": 0.9077, "step": 26899 }, { "epoch": 0.51, "learning_rate": 2.5606419685504082e-06, "loss": 1.1999, "step": 26900 }, { "epoch": 0.51, "learning_rate": 2.560489247852888e-06, "loss": 0.7841, "step": 26901 }, { "epoch": 0.51, "learning_rate": 2.5603365269295026e-06, "loss": 0.7337, "step": 26902 }, { "epoch": 0.51, "learning_rate": 2.560183805780824e-06, "loss": 1.0082, "step": 26903 }, { "epoch": 0.51, "learning_rate": 2.5600310844074183e-06, "loss": 1.0253, "step": 26904 }, { "epoch": 0.51, "learning_rate": 2.55987836280986e-06, "loss": 0.7671, "step": 26905 }, { "epoch": 0.51, "learning_rate": 2.559725640988718e-06, "loss": 0.9874, "step": 26906 }, { "epoch": 0.51, "learning_rate": 2.559572918944562e-06, "loss": 0.8786, "step": 26907 }, { "epoch": 0.51, "learning_rate": 2.5594201966779618e-06, "loss": 0.953, "step": 26908 }, { "epoch": 0.51, "learning_rate": 2.559267474189489e-06, "loss": 0.9161, "step": 26909 }, { "epoch": 0.51, "learning_rate": 2.5591147514797133e-06, "loss": 0.8217, "step": 26910 }, { "epoch": 0.51, "learning_rate": 2.5589620285492046e-06, "loss": 0.843, "step": 26911 }, { "epoch": 0.51, "learning_rate": 2.5588093053985334e-06, "loss": 1.0484, "step": 26912 }, { "epoch": 0.51, "learning_rate": 2.5586565820282706e-06, "loss": 1.139, "step": 26913 }, { "epoch": 0.51, "learning_rate": 2.5585038584389854e-06, "loss": 0.9485, "step": 26914 }, { "epoch": 0.51, "learning_rate": 2.5583511346312495e-06, "loss": 0.8265, "step": 26915 }, { "epoch": 0.51, "learning_rate": 2.558198410605632e-06, "loss": 0.9312, "step": 26916 }, { "epoch": 0.51, "learning_rate": 2.5580456863627023e-06, "loss": 0.9172, "step": 26917 }, { "epoch": 0.51, "learning_rate": 2.5578929619030323e-06, "loss": 1.0448, "step": 26918 }, { "epoch": 0.51, "learning_rate": 2.557740237227192e-06, "loss": 1.1954, "step": 26919 }, { "epoch": 0.51, "learning_rate": 2.5575875123357515e-06, "loss": 0.7873, "step": 26920 }, { "epoch": 0.51, "learning_rate": 2.5574347872292816e-06, "loss": 0.7709, "step": 26921 }, { "epoch": 0.51, "learning_rate": 2.557282061908351e-06, "loss": 0.7825, "step": 26922 }, { "epoch": 0.51, "learning_rate": 2.557129336373531e-06, "loss": 0.8381, "step": 26923 }, { "epoch": 0.51, "learning_rate": 2.5569766106253923e-06, "loss": 1.0294, "step": 26924 }, { "epoch": 0.51, "learning_rate": 2.5568238846645038e-06, "loss": 1.0059, "step": 26925 }, { "epoch": 0.51, "learning_rate": 2.5566711584914373e-06, "loss": 0.7868, "step": 26926 }, { "epoch": 0.51, "learning_rate": 2.5565184321067634e-06, "loss": 0.8803, "step": 26927 }, { "epoch": 0.51, "learning_rate": 2.5563657055110495e-06, "loss": 0.9603, "step": 26928 }, { "epoch": 0.51, "learning_rate": 2.556212978704869e-06, "loss": 0.819, "step": 26929 }, { "epoch": 0.51, "learning_rate": 2.556060251688791e-06, "loss": 0.9547, "step": 26930 }, { "epoch": 0.51, "learning_rate": 2.555907524463385e-06, "loss": 0.9652, "step": 26931 }, { "epoch": 0.51, "learning_rate": 2.555754797029222e-06, "loss": 0.8673, "step": 26932 }, { "epoch": 0.51, "learning_rate": 2.5556020693868733e-06, "loss": 0.8762, "step": 26933 }, { "epoch": 0.51, "learning_rate": 2.5554493415369074e-06, "loss": 0.9105, "step": 26934 }, { "epoch": 0.51, "learning_rate": 2.5552966134798956e-06, "loss": 0.9059, "step": 26935 }, { "epoch": 0.51, "learning_rate": 2.5551438852164078e-06, "loss": 1.0032, "step": 26936 }, { "epoch": 0.51, "learning_rate": 2.5549911567470147e-06, "loss": 1.0439, "step": 26937 }, { "epoch": 0.51, "learning_rate": 2.554838428072286e-06, "loss": 0.9838, "step": 26938 }, { "epoch": 0.51, "learning_rate": 2.554685699192792e-06, "loss": 0.7736, "step": 26939 }, { "epoch": 0.51, "learning_rate": 2.5545329701091036e-06, "loss": 1.0671, "step": 26940 }, { "epoch": 0.51, "learning_rate": 2.554380240821791e-06, "loss": 0.8638, "step": 26941 }, { "epoch": 0.51, "learning_rate": 2.5542275113314245e-06, "loss": 0.9375, "step": 26942 }, { "epoch": 0.51, "learning_rate": 2.5540747816385736e-06, "loss": 1.2426, "step": 26943 }, { "epoch": 0.51, "learning_rate": 2.553922051743809e-06, "loss": 0.9352, "step": 26944 }, { "epoch": 0.51, "learning_rate": 2.5537693216477024e-06, "loss": 1.0319, "step": 26945 }, { "epoch": 0.51, "learning_rate": 2.553616591350821e-06, "loss": 0.7516, "step": 26946 }, { "epoch": 0.51, "learning_rate": 2.553463860853737e-06, "loss": 0.7006, "step": 26947 }, { "epoch": 0.51, "learning_rate": 2.553311130157022e-06, "loss": 0.7634, "step": 26948 }, { "epoch": 0.51, "learning_rate": 2.553158399261244e-06, "loss": 0.769, "step": 26949 }, { "epoch": 0.51, "learning_rate": 2.553005668166974e-06, "loss": 1.1499, "step": 26950 }, { "epoch": 0.51, "learning_rate": 2.5528529368747835e-06, "loss": 0.9824, "step": 26951 }, { "epoch": 0.51, "learning_rate": 2.5527002053852407e-06, "loss": 1.1136, "step": 26952 }, { "epoch": 0.51, "learning_rate": 2.552547473698917e-06, "loss": 0.9457, "step": 26953 }, { "epoch": 0.51, "learning_rate": 2.552394741816383e-06, "loss": 0.9725, "step": 26954 }, { "epoch": 0.51, "learning_rate": 2.5522420097382084e-06, "loss": 0.8843, "step": 26955 }, { "epoch": 0.51, "learning_rate": 2.5520892774649635e-06, "loss": 0.9438, "step": 26956 }, { "epoch": 0.51, "learning_rate": 2.55193654499722e-06, "loss": 1.0502, "step": 26957 }, { "epoch": 0.51, "learning_rate": 2.5517838123355458e-06, "loss": 0.8886, "step": 26958 }, { "epoch": 0.51, "learning_rate": 2.5516310794805125e-06, "loss": 0.9328, "step": 26959 }, { "epoch": 0.51, "learning_rate": 2.5514783464326908e-06, "loss": 0.867, "step": 26960 }, { "epoch": 0.51, "learning_rate": 2.5513256131926505e-06, "loss": 0.9583, "step": 26961 }, { "epoch": 0.51, "learning_rate": 2.551172879760962e-06, "loss": 1.0037, "step": 26962 }, { "epoch": 0.51, "learning_rate": 2.551020146138196e-06, "loss": 1.055, "step": 26963 }, { "epoch": 0.51, "learning_rate": 2.550867412324921e-06, "loss": 0.9187, "step": 26964 }, { "epoch": 0.51, "learning_rate": 2.5507146783217095e-06, "loss": 0.9281, "step": 26965 }, { "epoch": 0.51, "learning_rate": 2.5505619441291312e-06, "loss": 0.8278, "step": 26966 }, { "epoch": 0.51, "learning_rate": 2.550409209747755e-06, "loss": 0.8694, "step": 26967 }, { "epoch": 0.51, "learning_rate": 2.550256475178153e-06, "loss": 1.1421, "step": 26968 }, { "epoch": 0.51, "learning_rate": 2.5501037404208957e-06, "loss": 0.952, "step": 26969 }, { "epoch": 0.51, "learning_rate": 2.549951005476552e-06, "loss": 0.8999, "step": 26970 }, { "epoch": 0.51, "learning_rate": 2.5497982703456924e-06, "loss": 0.7341, "step": 26971 }, { "epoch": 0.51, "learning_rate": 2.5496455350288883e-06, "loss": 0.7747, "step": 26972 }, { "epoch": 0.51, "learning_rate": 2.549492799526709e-06, "loss": 0.9445, "step": 26973 }, { "epoch": 0.51, "learning_rate": 2.5493400638397244e-06, "loss": 1.0915, "step": 26974 }, { "epoch": 0.51, "learning_rate": 2.549187327968506e-06, "loss": 1.1088, "step": 26975 }, { "epoch": 0.51, "learning_rate": 2.549034591913623e-06, "loss": 1.0127, "step": 26976 }, { "epoch": 0.51, "learning_rate": 2.5488818556756475e-06, "loss": 1.0685, "step": 26977 }, { "epoch": 0.51, "learning_rate": 2.5487291192551485e-06, "loss": 1.0044, "step": 26978 }, { "epoch": 0.51, "learning_rate": 2.548576382652696e-06, "loss": 0.8022, "step": 26979 }, { "epoch": 0.51, "learning_rate": 2.548423645868861e-06, "loss": 0.7695, "step": 26980 }, { "epoch": 0.51, "learning_rate": 2.5482709089042133e-06, "loss": 1.22, "step": 26981 }, { "epoch": 0.51, "learning_rate": 2.5481181717593233e-06, "loss": 0.9029, "step": 26982 }, { "epoch": 0.51, "learning_rate": 2.547965434434762e-06, "loss": 0.8617, "step": 26983 }, { "epoch": 0.51, "learning_rate": 2.5478126969310996e-06, "loss": 0.8791, "step": 26984 }, { "epoch": 0.51, "learning_rate": 2.5476599592489056e-06, "loss": 0.9258, "step": 26985 }, { "epoch": 0.51, "learning_rate": 2.5475072213887504e-06, "loss": 0.775, "step": 26986 }, { "epoch": 0.51, "learning_rate": 2.5473544833512054e-06, "loss": 0.9649, "step": 26987 }, { "epoch": 0.51, "learning_rate": 2.5472017451368397e-06, "loss": 1.0974, "step": 26988 }, { "epoch": 0.51, "learning_rate": 2.5470490067462238e-06, "loss": 0.844, "step": 26989 }, { "epoch": 0.51, "learning_rate": 2.54689626817993e-06, "loss": 0.9924, "step": 26990 }, { "epoch": 0.51, "learning_rate": 2.546743529438525e-06, "loss": 0.9915, "step": 26991 }, { "epoch": 0.51, "learning_rate": 2.5465907905225822e-06, "loss": 1.0069, "step": 26992 }, { "epoch": 0.51, "learning_rate": 2.5464380514326707e-06, "loss": 0.8373, "step": 26993 }, { "epoch": 0.51, "learning_rate": 2.546285312169361e-06, "loss": 0.9933, "step": 26994 }, { "epoch": 0.51, "learning_rate": 2.5461325727332227e-06, "loss": 1.131, "step": 26995 }, { "epoch": 0.51, "learning_rate": 2.5459798331248275e-06, "loss": 0.8625, "step": 26996 }, { "epoch": 0.51, "learning_rate": 2.5458270933447443e-06, "loss": 0.9259, "step": 26997 }, { "epoch": 0.51, "learning_rate": 2.5456743533935447e-06, "loss": 0.7959, "step": 26998 }, { "epoch": 0.51, "learning_rate": 2.5455216132717984e-06, "loss": 0.7983, "step": 26999 }, { "epoch": 0.51, "learning_rate": 2.5453688729800755e-06, "loss": 1.1191, "step": 27000 }, { "epoch": 0.51, "learning_rate": 2.5452161325189473e-06, "loss": 1.085, "step": 27001 }, { "epoch": 0.51, "learning_rate": 2.545063391888983e-06, "loss": 0.86, "step": 27002 }, { "epoch": 0.51, "learning_rate": 2.544910651090753e-06, "loss": 0.8072, "step": 27003 }, { "epoch": 0.51, "learning_rate": 2.5447579101248283e-06, "loss": 1.046, "step": 27004 }, { "epoch": 0.51, "learning_rate": 2.5446051689917793e-06, "loss": 1.0642, "step": 27005 }, { "epoch": 0.51, "learning_rate": 2.544452427692176e-06, "loss": 1.171, "step": 27006 }, { "epoch": 0.51, "learning_rate": 2.544299686226589e-06, "loss": 0.9577, "step": 27007 }, { "epoch": 0.51, "learning_rate": 2.544146944595587e-06, "loss": 0.689, "step": 27008 }, { "epoch": 0.51, "learning_rate": 2.5439942027997423e-06, "loss": 0.9077, "step": 27009 }, { "epoch": 0.51, "learning_rate": 2.543841460839625e-06, "loss": 0.728, "step": 27010 }, { "epoch": 0.51, "learning_rate": 2.5436887187158045e-06, "loss": 0.8893, "step": 27011 }, { "epoch": 0.51, "learning_rate": 2.543535976428852e-06, "loss": 1.0004, "step": 27012 }, { "epoch": 0.51, "learning_rate": 2.5433832339793375e-06, "loss": 0.9849, "step": 27013 }, { "epoch": 0.51, "learning_rate": 2.5432304913678315e-06, "loss": 0.8816, "step": 27014 }, { "epoch": 0.51, "learning_rate": 2.543077748594904e-06, "loss": 0.938, "step": 27015 }, { "epoch": 0.51, "learning_rate": 2.5429250056611247e-06, "loss": 1.016, "step": 27016 }, { "epoch": 0.51, "learning_rate": 2.5427722625670653e-06, "loss": 0.9378, "step": 27017 }, { "epoch": 0.51, "learning_rate": 2.5426195193132957e-06, "loss": 0.9649, "step": 27018 }, { "epoch": 0.51, "learning_rate": 2.5424667759003868e-06, "loss": 0.8556, "step": 27019 }, { "epoch": 0.51, "learning_rate": 2.5423140323289074e-06, "loss": 0.9841, "step": 27020 }, { "epoch": 0.51, "learning_rate": 2.5421612885994284e-06, "loss": 0.8063, "step": 27021 }, { "epoch": 0.51, "learning_rate": 2.5420085447125208e-06, "loss": 0.8685, "step": 27022 }, { "epoch": 0.51, "learning_rate": 2.541855800668755e-06, "loss": 0.635, "step": 27023 }, { "epoch": 0.51, "learning_rate": 2.541703056468701e-06, "loss": 1.0945, "step": 27024 }, { "epoch": 0.51, "learning_rate": 2.5415503121129287e-06, "loss": 1.1152, "step": 27025 }, { "epoch": 0.51, "learning_rate": 2.5413975676020084e-06, "loss": 0.9341, "step": 27026 }, { "epoch": 0.51, "learning_rate": 2.5412448229365115e-06, "loss": 1.0718, "step": 27027 }, { "epoch": 0.51, "learning_rate": 2.541092078117008e-06, "loss": 0.8672, "step": 27028 }, { "epoch": 0.51, "learning_rate": 2.5409393331440667e-06, "loss": 0.9802, "step": 27029 }, { "epoch": 0.51, "learning_rate": 2.54078658801826e-06, "loss": 0.7401, "step": 27030 }, { "epoch": 0.51, "learning_rate": 2.5406338427401573e-06, "loss": 0.8447, "step": 27031 }, { "epoch": 0.51, "learning_rate": 2.5404810973103287e-06, "loss": 1.1646, "step": 27032 }, { "epoch": 0.51, "learning_rate": 2.540328351729346e-06, "loss": 0.8312, "step": 27033 }, { "epoch": 0.51, "learning_rate": 2.540175605997778e-06, "loss": 0.7979, "step": 27034 }, { "epoch": 0.51, "learning_rate": 2.5400228601161953e-06, "loss": 0.9972, "step": 27035 }, { "epoch": 0.51, "learning_rate": 2.5398701140851686e-06, "loss": 0.9703, "step": 27036 }, { "epoch": 0.51, "learning_rate": 2.5397173679052673e-06, "loss": 1.1245, "step": 27037 }, { "epoch": 0.51, "learning_rate": 2.5395646215770637e-06, "loss": 1.0652, "step": 27038 }, { "epoch": 0.51, "learning_rate": 2.539411875101126e-06, "loss": 0.8669, "step": 27039 }, { "epoch": 0.51, "learning_rate": 2.5392591284780264e-06, "loss": 1.0525, "step": 27040 }, { "epoch": 0.51, "learning_rate": 2.5391063817083344e-06, "loss": 0.9211, "step": 27041 }, { "epoch": 0.51, "learning_rate": 2.5389536347926203e-06, "loss": 0.9769, "step": 27042 }, { "epoch": 0.51, "learning_rate": 2.538800887731454e-06, "loss": 1.146, "step": 27043 }, { "epoch": 0.51, "learning_rate": 2.5386481405254063e-06, "loss": 1.076, "step": 27044 }, { "epoch": 0.51, "learning_rate": 2.5384953931750483e-06, "loss": 0.9204, "step": 27045 }, { "epoch": 0.51, "learning_rate": 2.53834264568095e-06, "loss": 0.9304, "step": 27046 }, { "epoch": 0.51, "learning_rate": 2.5381898980436807e-06, "loss": 0.7709, "step": 27047 }, { "epoch": 0.51, "learning_rate": 2.5380371502638113e-06, "loss": 0.8206, "step": 27048 }, { "epoch": 0.51, "learning_rate": 2.5378844023419136e-06, "loss": 0.97, "step": 27049 }, { "epoch": 0.51, "learning_rate": 2.5377316542785554e-06, "loss": 0.9401, "step": 27050 }, { "epoch": 0.51, "learning_rate": 2.5375789060743085e-06, "loss": 1.0356, "step": 27051 }, { "epoch": 0.51, "learning_rate": 2.537426157729744e-06, "loss": 0.8474, "step": 27052 }, { "epoch": 0.51, "learning_rate": 2.5372734092454306e-06, "loss": 0.721, "step": 27053 }, { "epoch": 0.51, "learning_rate": 2.537120660621939e-06, "loss": 0.6783, "step": 27054 }, { "epoch": 0.51, "learning_rate": 2.536967911859841e-06, "loss": 0.9035, "step": 27055 }, { "epoch": 0.51, "learning_rate": 2.5368151629597054e-06, "loss": 1.0538, "step": 27056 }, { "epoch": 0.51, "learning_rate": 2.5366624139221035e-06, "loss": 0.9056, "step": 27057 }, { "epoch": 0.51, "learning_rate": 2.5365096647476045e-06, "loss": 0.8471, "step": 27058 }, { "epoch": 0.51, "learning_rate": 2.5363569154367802e-06, "loss": 0.9427, "step": 27059 }, { "epoch": 0.51, "learning_rate": 2.5362041659902e-06, "loss": 0.8914, "step": 27060 }, { "epoch": 0.51, "learning_rate": 2.5360514164084356e-06, "loss": 1.0664, "step": 27061 }, { "epoch": 0.51, "learning_rate": 2.535898666692055e-06, "loss": 1.1337, "step": 27062 }, { "epoch": 0.51, "learning_rate": 2.5357459168416304e-06, "loss": 0.8551, "step": 27063 }, { "epoch": 0.51, "learning_rate": 2.535593166857731e-06, "loss": 0.8608, "step": 27064 }, { "epoch": 0.51, "learning_rate": 2.5354404167409285e-06, "loss": 0.8224, "step": 27065 }, { "epoch": 0.51, "learning_rate": 2.5352876664917925e-06, "loss": 0.8314, "step": 27066 }, { "epoch": 0.51, "learning_rate": 2.5351349161108937e-06, "loss": 0.8237, "step": 27067 }, { "epoch": 0.51, "learning_rate": 2.5349821655988018e-06, "loss": 0.9958, "step": 27068 }, { "epoch": 0.51, "learning_rate": 2.5348294149560876e-06, "loss": 1.2001, "step": 27069 }, { "epoch": 0.51, "learning_rate": 2.5346766641833213e-06, "loss": 0.9718, "step": 27070 }, { "epoch": 0.51, "learning_rate": 2.5345239132810733e-06, "loss": 1.0229, "step": 27071 }, { "epoch": 0.51, "learning_rate": 2.534371162249914e-06, "loss": 0.8312, "step": 27072 }, { "epoch": 0.51, "learning_rate": 2.534218411090415e-06, "loss": 0.7866, "step": 27073 }, { "epoch": 0.51, "learning_rate": 2.5340656598031444e-06, "loss": 1.0595, "step": 27074 }, { "epoch": 0.51, "learning_rate": 2.5339129083886736e-06, "loss": 1.1854, "step": 27075 }, { "epoch": 0.51, "learning_rate": 2.533760156847574e-06, "loss": 0.9611, "step": 27076 }, { "epoch": 0.51, "learning_rate": 2.5336074051804145e-06, "loss": 0.8485, "step": 27077 }, { "epoch": 0.51, "learning_rate": 2.533454653387765e-06, "loss": 0.8753, "step": 27078 }, { "epoch": 0.51, "learning_rate": 2.533301901470198e-06, "loss": 0.789, "step": 27079 }, { "epoch": 0.51, "learning_rate": 2.533149149428282e-06, "loss": 0.7899, "step": 27080 }, { "epoch": 0.51, "learning_rate": 2.5329963972625888e-06, "loss": 1.1303, "step": 27081 }, { "epoch": 0.51, "learning_rate": 2.532843644973688e-06, "loss": 0.7954, "step": 27082 }, { "epoch": 0.51, "learning_rate": 2.5326908925621503e-06, "loss": 0.8453, "step": 27083 }, { "epoch": 0.51, "learning_rate": 2.5325381400285448e-06, "loss": 0.8165, "step": 27084 }, { "epoch": 0.51, "learning_rate": 2.5323853873734434e-06, "loss": 0.8463, "step": 27085 }, { "epoch": 0.51, "learning_rate": 2.532232634597416e-06, "loss": 1.0729, "step": 27086 }, { "epoch": 0.51, "learning_rate": 2.532079881701033e-06, "loss": 0.893, "step": 27087 }, { "epoch": 0.51, "learning_rate": 2.5319271286848647e-06, "loss": 1.072, "step": 27088 }, { "epoch": 0.51, "learning_rate": 2.5317743755494812e-06, "loss": 1.047, "step": 27089 }, { "epoch": 0.51, "learning_rate": 2.531621622295453e-06, "loss": 1.0521, "step": 27090 }, { "epoch": 0.51, "learning_rate": 2.531468868923352e-06, "loss": 0.9509, "step": 27091 }, { "epoch": 0.51, "learning_rate": 2.531316115433745e-06, "loss": 1.0012, "step": 27092 }, { "epoch": 0.51, "learning_rate": 2.5311633618272056e-06, "loss": 0.9952, "step": 27093 }, { "epoch": 0.51, "learning_rate": 2.531010608104304e-06, "loss": 1.1296, "step": 27094 }, { "epoch": 0.51, "learning_rate": 2.530857854265609e-06, "loss": 0.8316, "step": 27095 }, { "epoch": 0.51, "learning_rate": 2.5307051003116917e-06, "loss": 0.9345, "step": 27096 }, { "epoch": 0.51, "learning_rate": 2.530552346243123e-06, "loss": 0.9575, "step": 27097 }, { "epoch": 0.51, "learning_rate": 2.5303995920604724e-06, "loss": 0.9646, "step": 27098 }, { "epoch": 0.51, "learning_rate": 2.5302468377643103e-06, "loss": 1.0979, "step": 27099 }, { "epoch": 0.51, "learning_rate": 2.530094083355208e-06, "loss": 1.1074, "step": 27100 }, { "epoch": 0.51, "learning_rate": 2.529941328833735e-06, "loss": 0.9178, "step": 27101 }, { "epoch": 0.51, "learning_rate": 2.529788574200462e-06, "loss": 0.962, "step": 27102 }, { "epoch": 0.51, "learning_rate": 2.5296358194559594e-06, "loss": 0.7012, "step": 27103 }, { "epoch": 0.51, "learning_rate": 2.529483064600798e-06, "loss": 0.7977, "step": 27104 }, { "epoch": 0.51, "learning_rate": 2.529330309635547e-06, "loss": 0.8616, "step": 27105 }, { "epoch": 0.51, "learning_rate": 2.5291775545607777e-06, "loss": 1.1473, "step": 27106 }, { "epoch": 0.51, "learning_rate": 2.5290247993770606e-06, "loss": 0.7587, "step": 27107 }, { "epoch": 0.51, "learning_rate": 2.5288720440849653e-06, "loss": 0.9811, "step": 27108 }, { "epoch": 0.51, "learning_rate": 2.528719288685064e-06, "loss": 0.8605, "step": 27109 }, { "epoch": 0.51, "learning_rate": 2.528566533177924e-06, "loss": 1.095, "step": 27110 }, { "epoch": 0.51, "learning_rate": 2.528413777564118e-06, "loss": 0.6643, "step": 27111 }, { "epoch": 0.51, "learning_rate": 2.5282610218442165e-06, "loss": 0.9669, "step": 27112 }, { "epoch": 0.51, "learning_rate": 2.528108266018788e-06, "loss": 1.0022, "step": 27113 }, { "epoch": 0.51, "learning_rate": 2.527955510088405e-06, "loss": 0.8612, "step": 27114 }, { "epoch": 0.51, "learning_rate": 2.5278027540536377e-06, "loss": 1.0758, "step": 27115 }, { "epoch": 0.51, "learning_rate": 2.527649997915055e-06, "loss": 0.9594, "step": 27116 }, { "epoch": 0.51, "learning_rate": 2.5274972416732273e-06, "loss": 0.843, "step": 27117 }, { "epoch": 0.51, "learning_rate": 2.527344485328727e-06, "loss": 1.1466, "step": 27118 }, { "epoch": 0.51, "learning_rate": 2.5271917288821223e-06, "loss": 1.147, "step": 27119 }, { "epoch": 0.51, "learning_rate": 2.527038972333985e-06, "loss": 1.0098, "step": 27120 }, { "epoch": 0.51, "learning_rate": 2.5268862156848846e-06, "loss": 0.7589, "step": 27121 }, { "epoch": 0.51, "learning_rate": 2.526733458935392e-06, "loss": 0.9266, "step": 27122 }, { "epoch": 0.51, "learning_rate": 2.526580702086078e-06, "loss": 0.8924, "step": 27123 }, { "epoch": 0.51, "learning_rate": 2.5264279451375125e-06, "loss": 0.9333, "step": 27124 }, { "epoch": 0.51, "learning_rate": 2.5262751880902654e-06, "loss": 0.9842, "step": 27125 }, { "epoch": 0.51, "learning_rate": 2.5261224309449073e-06, "loss": 0.9256, "step": 27126 }, { "epoch": 0.51, "learning_rate": 2.525969673702009e-06, "loss": 0.8438, "step": 27127 }, { "epoch": 0.51, "learning_rate": 2.525816916362141e-06, "loss": 0.9669, "step": 27128 }, { "epoch": 0.51, "learning_rate": 2.5256641589258735e-06, "loss": 0.7949, "step": 27129 }, { "epoch": 0.51, "learning_rate": 2.5255114013937767e-06, "loss": 1.1503, "step": 27130 }, { "epoch": 0.51, "learning_rate": 2.525358643766421e-06, "loss": 1.1149, "step": 27131 }, { "epoch": 0.51, "learning_rate": 2.5252058860443773e-06, "loss": 0.9242, "step": 27132 }, { "epoch": 0.51, "learning_rate": 2.5250531282282152e-06, "loss": 0.9511, "step": 27133 }, { "epoch": 0.51, "learning_rate": 2.5249003703185047e-06, "loss": 0.7194, "step": 27134 }, { "epoch": 0.51, "learning_rate": 2.524747612315819e-06, "loss": 0.7061, "step": 27135 }, { "epoch": 0.51, "learning_rate": 2.524594854220725e-06, "loss": 0.758, "step": 27136 }, { "epoch": 0.51, "learning_rate": 2.5244420960337947e-06, "loss": 0.9718, "step": 27137 }, { "epoch": 0.51, "learning_rate": 2.524289337755599e-06, "loss": 0.7837, "step": 27138 }, { "epoch": 0.51, "learning_rate": 2.524136579386707e-06, "loss": 0.5675, "step": 27139 }, { "epoch": 0.51, "learning_rate": 2.5239838209276896e-06, "loss": 1.0261, "step": 27140 }, { "epoch": 0.51, "learning_rate": 2.523831062379118e-06, "loss": 0.9451, "step": 27141 }, { "epoch": 0.51, "learning_rate": 2.5236783037415615e-06, "loss": 0.8022, "step": 27142 }, { "epoch": 0.51, "learning_rate": 2.5235255450155904e-06, "loss": 0.8314, "step": 27143 }, { "epoch": 0.51, "learning_rate": 2.5233727862017772e-06, "loss": 1.0737, "step": 27144 }, { "epoch": 0.51, "learning_rate": 2.5232200273006897e-06, "loss": 0.8963, "step": 27145 }, { "epoch": 0.51, "learning_rate": 2.5230672683128994e-06, "loss": 0.7712, "step": 27146 }, { "epoch": 0.51, "learning_rate": 2.522914509238976e-06, "loss": 0.8385, "step": 27147 }, { "epoch": 0.51, "learning_rate": 2.5227617500794917e-06, "loss": 0.8411, "step": 27148 }, { "epoch": 0.51, "learning_rate": 2.522608990835015e-06, "loss": 0.7938, "step": 27149 }, { "epoch": 0.51, "learning_rate": 2.522456231506118e-06, "loss": 1.1499, "step": 27150 }, { "epoch": 0.51, "learning_rate": 2.522303472093369e-06, "loss": 1.0768, "step": 27151 }, { "epoch": 0.51, "learning_rate": 2.52215071259734e-06, "loss": 0.7801, "step": 27152 }, { "epoch": 0.51, "learning_rate": 2.521997953018601e-06, "loss": 0.9065, "step": 27153 }, { "epoch": 0.51, "learning_rate": 2.521845193357722e-06, "loss": 0.9538, "step": 27154 }, { "epoch": 0.51, "learning_rate": 2.521692433615273e-06, "loss": 0.9664, "step": 27155 }, { "epoch": 0.51, "learning_rate": 2.521539673791827e-06, "loss": 1.2446, "step": 27156 }, { "epoch": 0.51, "learning_rate": 2.521386913887951e-06, "loss": 0.9667, "step": 27157 }, { "epoch": 0.51, "learning_rate": 2.521234153904217e-06, "loss": 1.1225, "step": 27158 }, { "epoch": 0.51, "learning_rate": 2.5210813938411965e-06, "loss": 0.6759, "step": 27159 }, { "epoch": 0.51, "learning_rate": 2.520928633699458e-06, "loss": 1.0029, "step": 27160 }, { "epoch": 0.51, "learning_rate": 2.5207758734795724e-06, "loss": 0.7886, "step": 27161 }, { "epoch": 0.51, "learning_rate": 2.5206231131821108e-06, "loss": 1.1649, "step": 27162 }, { "epoch": 0.51, "learning_rate": 2.5204703528076424e-06, "loss": 0.9419, "step": 27163 }, { "epoch": 0.51, "learning_rate": 2.5203175923567386e-06, "loss": 0.98, "step": 27164 }, { "epoch": 0.51, "learning_rate": 2.5201648318299704e-06, "loss": 0.9402, "step": 27165 }, { "epoch": 0.51, "learning_rate": 2.5200120712279064e-06, "loss": 0.9456, "step": 27166 }, { "epoch": 0.51, "learning_rate": 2.5198593105511184e-06, "loss": 0.9033, "step": 27167 }, { "epoch": 0.51, "learning_rate": 2.5197065498001756e-06, "loss": 0.8989, "step": 27168 }, { "epoch": 0.51, "learning_rate": 2.51955378897565e-06, "loss": 1.0866, "step": 27169 }, { "epoch": 0.51, "learning_rate": 2.5194010280781107e-06, "loss": 0.9034, "step": 27170 }, { "epoch": 0.51, "learning_rate": 2.5192482671081286e-06, "loss": 0.7975, "step": 27171 }, { "epoch": 0.51, "learning_rate": 2.519095506066274e-06, "loss": 0.8191, "step": 27172 }, { "epoch": 0.51, "learning_rate": 2.5189427449531177e-06, "loss": 1.0488, "step": 27173 }, { "epoch": 0.51, "learning_rate": 2.5187899837692297e-06, "loss": 0.9351, "step": 27174 }, { "epoch": 0.51, "learning_rate": 2.5186372225151807e-06, "loss": 1.0692, "step": 27175 }, { "epoch": 0.51, "learning_rate": 2.51848446119154e-06, "loss": 0.8942, "step": 27176 }, { "epoch": 0.51, "learning_rate": 2.5183316997988795e-06, "loss": 0.8669, "step": 27177 }, { "epoch": 0.51, "learning_rate": 2.518178938337769e-06, "loss": 1.0976, "step": 27178 }, { "epoch": 0.51, "learning_rate": 2.5180261768087788e-06, "loss": 0.9608, "step": 27179 }, { "epoch": 0.51, "learning_rate": 2.5178734152124794e-06, "loss": 1.0036, "step": 27180 }, { "epoch": 0.51, "learning_rate": 2.5177206535494414e-06, "loss": 1.1719, "step": 27181 }, { "epoch": 0.51, "learning_rate": 2.5175678918202353e-06, "loss": 1.0989, "step": 27182 }, { "epoch": 0.51, "learning_rate": 2.5174151300254303e-06, "loss": 0.9131, "step": 27183 }, { "epoch": 0.51, "learning_rate": 2.5172623681655982e-06, "loss": 0.9494, "step": 27184 }, { "epoch": 0.51, "learning_rate": 2.5171096062413086e-06, "loss": 0.795, "step": 27185 }, { "epoch": 0.51, "learning_rate": 2.516956844253133e-06, "loss": 1.0525, "step": 27186 }, { "epoch": 0.51, "learning_rate": 2.516804082201641e-06, "loss": 1.0828, "step": 27187 }, { "epoch": 0.51, "learning_rate": 2.5166513200874028e-06, "loss": 1.2284, "step": 27188 }, { "epoch": 0.51, "learning_rate": 2.5164985579109887e-06, "loss": 0.9371, "step": 27189 }, { "epoch": 0.51, "learning_rate": 2.51634579567297e-06, "loss": 0.9915, "step": 27190 }, { "epoch": 0.51, "learning_rate": 2.516193033373916e-06, "loss": 0.9493, "step": 27191 }, { "epoch": 0.51, "learning_rate": 2.516040271014399e-06, "loss": 1.0095, "step": 27192 }, { "epoch": 0.51, "learning_rate": 2.5158875085949868e-06, "loss": 1.3544, "step": 27193 }, { "epoch": 0.51, "learning_rate": 2.5157347461162514e-06, "loss": 1.0517, "step": 27194 }, { "epoch": 0.51, "learning_rate": 2.5155819835787637e-06, "loss": 0.969, "step": 27195 }, { "epoch": 0.51, "learning_rate": 2.515429220983093e-06, "loss": 0.9759, "step": 27196 }, { "epoch": 0.51, "learning_rate": 2.515276458329809e-06, "loss": 1.0768, "step": 27197 }, { "epoch": 0.51, "learning_rate": 2.5151236956194843e-06, "loss": 0.9522, "step": 27198 }, { "epoch": 0.51, "learning_rate": 2.514970932852688e-06, "loss": 1.0735, "step": 27199 }, { "epoch": 0.51, "learning_rate": 2.5148181700299906e-06, "loss": 1.1523, "step": 27200 }, { "epoch": 0.51, "learning_rate": 2.5146654071519626e-06, "loss": 1.0253, "step": 27201 }, { "epoch": 0.51, "learning_rate": 2.514512644219175e-06, "loss": 0.9719, "step": 27202 }, { "epoch": 0.51, "learning_rate": 2.5143598812321968e-06, "loss": 0.9389, "step": 27203 }, { "epoch": 0.51, "learning_rate": 2.514207118191599e-06, "loss": 0.8371, "step": 27204 }, { "epoch": 0.51, "learning_rate": 2.514054355097953e-06, "loss": 0.819, "step": 27205 }, { "epoch": 0.51, "learning_rate": 2.513901591951828e-06, "loss": 1.0526, "step": 27206 }, { "epoch": 0.51, "learning_rate": 2.5137488287537952e-06, "loss": 0.9211, "step": 27207 }, { "epoch": 0.51, "learning_rate": 2.513596065504425e-06, "loss": 1.0984, "step": 27208 }, { "epoch": 0.51, "learning_rate": 2.513443302204287e-06, "loss": 0.9481, "step": 27209 }, { "epoch": 0.51, "learning_rate": 2.513290538853952e-06, "loss": 0.8274, "step": 27210 }, { "epoch": 0.51, "learning_rate": 2.5131377754539902e-06, "loss": 0.9588, "step": 27211 }, { "epoch": 0.51, "learning_rate": 2.512985012004973e-06, "loss": 1.0201, "step": 27212 }, { "epoch": 0.51, "learning_rate": 2.5128322485074706e-06, "loss": 1.1328, "step": 27213 }, { "epoch": 0.51, "learning_rate": 2.512679484962053e-06, "loss": 0.9224, "step": 27214 }, { "epoch": 0.51, "learning_rate": 2.5125267213692893e-06, "loss": 0.7306, "step": 27215 }, { "epoch": 0.51, "learning_rate": 2.512373957729753e-06, "loss": 0.8033, "step": 27216 }, { "epoch": 0.51, "learning_rate": 2.5122211940440113e-06, "loss": 0.9546, "step": 27217 }, { "epoch": 0.51, "learning_rate": 2.5120684303126357e-06, "loss": 0.9597, "step": 27218 }, { "epoch": 0.51, "learning_rate": 2.511915666536198e-06, "loss": 1.1666, "step": 27219 }, { "epoch": 0.51, "learning_rate": 2.5117629027152674e-06, "loss": 0.9246, "step": 27220 }, { "epoch": 0.51, "learning_rate": 2.5116101388504142e-06, "loss": 0.8877, "step": 27221 }, { "epoch": 0.51, "learning_rate": 2.5114573749422096e-06, "loss": 0.9571, "step": 27222 }, { "epoch": 0.51, "learning_rate": 2.511304610991223e-06, "loss": 1.0651, "step": 27223 }, { "epoch": 0.51, "learning_rate": 2.5111518469980257e-06, "loss": 1.2056, "step": 27224 }, { "epoch": 0.51, "learning_rate": 2.510999082963187e-06, "loss": 0.9725, "step": 27225 }, { "epoch": 0.51, "learning_rate": 2.5108463188872783e-06, "loss": 0.9996, "step": 27226 }, { "epoch": 0.51, "learning_rate": 2.51069355477087e-06, "loss": 0.9537, "step": 27227 }, { "epoch": 0.51, "learning_rate": 2.510540790614533e-06, "loss": 1.018, "step": 27228 }, { "epoch": 0.51, "learning_rate": 2.5103880264188363e-06, "loss": 0.9121, "step": 27229 }, { "epoch": 0.51, "learning_rate": 2.510235262184351e-06, "loss": 0.7449, "step": 27230 }, { "epoch": 0.51, "learning_rate": 2.5100824979116474e-06, "loss": 1.0649, "step": 27231 }, { "epoch": 0.51, "learning_rate": 2.509929733601296e-06, "loss": 0.806, "step": 27232 }, { "epoch": 0.51, "learning_rate": 2.5097769692538675e-06, "loss": 0.8681, "step": 27233 }, { "epoch": 0.51, "learning_rate": 2.5096242048699327e-06, "loss": 0.9892, "step": 27234 }, { "epoch": 0.51, "learning_rate": 2.509471440450061e-06, "loss": 0.83, "step": 27235 }, { "epoch": 0.51, "learning_rate": 2.5093186759948228e-06, "loss": 1.0451, "step": 27236 }, { "epoch": 0.51, "learning_rate": 2.50916591150479e-06, "loss": 1.217, "step": 27237 }, { "epoch": 0.51, "learning_rate": 2.5090131469805313e-06, "loss": 1.1614, "step": 27238 }, { "epoch": 0.51, "learning_rate": 2.5088603824226172e-06, "loss": 0.8997, "step": 27239 }, { "epoch": 0.51, "learning_rate": 2.5087076178316193e-06, "loss": 0.728, "step": 27240 }, { "epoch": 0.51, "learning_rate": 2.508554853208107e-06, "loss": 0.9904, "step": 27241 }, { "epoch": 0.51, "learning_rate": 2.508402088552652e-06, "loss": 0.7411, "step": 27242 }, { "epoch": 0.51, "learning_rate": 2.5082493238658234e-06, "loss": 1.0751, "step": 27243 }, { "epoch": 0.51, "learning_rate": 2.508096559148192e-06, "loss": 1.1766, "step": 27244 }, { "epoch": 0.51, "learning_rate": 2.507943794400328e-06, "loss": 0.8559, "step": 27245 }, { "epoch": 0.51, "learning_rate": 2.5077910296228025e-06, "loss": 0.8201, "step": 27246 }, { "epoch": 0.51, "learning_rate": 2.507638264816185e-06, "loss": 0.8184, "step": 27247 }, { "epoch": 0.51, "learning_rate": 2.5074854999810477e-06, "loss": 0.6392, "step": 27248 }, { "epoch": 0.51, "learning_rate": 2.5073327351179586e-06, "loss": 0.8317, "step": 27249 }, { "epoch": 0.51, "learning_rate": 2.5071799702274896e-06, "loss": 1.0263, "step": 27250 }, { "epoch": 0.51, "learning_rate": 2.507027205310211e-06, "loss": 0.9214, "step": 27251 }, { "epoch": 0.51, "learning_rate": 2.506874440366693e-06, "loss": 0.9246, "step": 27252 }, { "epoch": 0.51, "learning_rate": 2.5067216753975054e-06, "loss": 1.0813, "step": 27253 }, { "epoch": 0.51, "learning_rate": 2.5065689104032202e-06, "loss": 0.8808, "step": 27254 }, { "epoch": 0.51, "learning_rate": 2.5064161453844067e-06, "loss": 1.245, "step": 27255 }, { "epoch": 0.51, "learning_rate": 2.5062633803416353e-06, "loss": 0.9815, "step": 27256 }, { "epoch": 0.51, "learning_rate": 2.5061106152754772e-06, "loss": 1.0628, "step": 27257 }, { "epoch": 0.51, "learning_rate": 2.505957850186502e-06, "loss": 0.9235, "step": 27258 }, { "epoch": 0.51, "learning_rate": 2.5058050850752796e-06, "loss": 0.7757, "step": 27259 }, { "epoch": 0.51, "learning_rate": 2.5056523199423817e-06, "loss": 0.9138, "step": 27260 }, { "epoch": 0.51, "learning_rate": 2.5054995547883775e-06, "loss": 0.885, "step": 27261 }, { "epoch": 0.51, "learning_rate": 2.505346789613839e-06, "loss": 0.9314, "step": 27262 }, { "epoch": 0.51, "learning_rate": 2.505194024419336e-06, "loss": 0.982, "step": 27263 }, { "epoch": 0.51, "learning_rate": 2.5050412592054385e-06, "loss": 1.0388, "step": 27264 }, { "epoch": 0.51, "learning_rate": 2.5048884939727166e-06, "loss": 0.7671, "step": 27265 }, { "epoch": 0.51, "learning_rate": 2.504735728721741e-06, "loss": 0.7457, "step": 27266 }, { "epoch": 0.51, "learning_rate": 2.504582963453083e-06, "loss": 0.9948, "step": 27267 }, { "epoch": 0.51, "learning_rate": 2.504430198167312e-06, "loss": 1.2568, "step": 27268 }, { "epoch": 0.51, "learning_rate": 2.5042774328649996e-06, "loss": 1.1147, "step": 27269 }, { "epoch": 0.51, "learning_rate": 2.5041246675467146e-06, "loss": 1.0276, "step": 27270 }, { "epoch": 0.51, "learning_rate": 2.5039719022130284e-06, "loss": 0.9158, "step": 27271 }, { "epoch": 0.51, "learning_rate": 2.503819136864511e-06, "loss": 0.9326, "step": 27272 }, { "epoch": 0.51, "learning_rate": 2.5036663715017327e-06, "loss": 0.9091, "step": 27273 }, { "epoch": 0.51, "learning_rate": 2.5035136061252646e-06, "loss": 1.0921, "step": 27274 }, { "epoch": 0.51, "learning_rate": 2.5033608407356776e-06, "loss": 0.9877, "step": 27275 }, { "epoch": 0.51, "learning_rate": 2.503208075333541e-06, "loss": 0.8737, "step": 27276 }, { "epoch": 0.51, "learning_rate": 2.503055309919425e-06, "loss": 0.8725, "step": 27277 }, { "epoch": 0.51, "learning_rate": 2.502902544493901e-06, "loss": 0.7011, "step": 27278 }, { "epoch": 0.51, "learning_rate": 2.502749779057539e-06, "loss": 1.0424, "step": 27279 }, { "epoch": 0.51, "learning_rate": 2.502597013610909e-06, "loss": 0.894, "step": 27280 }, { "epoch": 0.51, "learning_rate": 2.5024442481545818e-06, "loss": 1.038, "step": 27281 }, { "epoch": 0.51, "learning_rate": 2.502291482689128e-06, "loss": 0.9465, "step": 27282 }, { "epoch": 0.51, "learning_rate": 2.502138717215118e-06, "loss": 0.8697, "step": 27283 }, { "epoch": 0.51, "learning_rate": 2.501985951733123e-06, "loss": 0.9755, "step": 27284 }, { "epoch": 0.51, "learning_rate": 2.501833186243711e-06, "loss": 0.832, "step": 27285 }, { "epoch": 0.51, "learning_rate": 2.5016804207474547e-06, "loss": 0.9473, "step": 27286 }, { "epoch": 0.51, "learning_rate": 2.5015276552449235e-06, "loss": 1.0031, "step": 27287 }, { "epoch": 0.51, "learning_rate": 2.501374889736688e-06, "loss": 1.0167, "step": 27288 }, { "epoch": 0.51, "learning_rate": 2.5012221242233186e-06, "loss": 0.9171, "step": 27289 }, { "epoch": 0.51, "learning_rate": 2.501069358705387e-06, "loss": 0.7287, "step": 27290 }, { "epoch": 0.51, "learning_rate": 2.500916593183461e-06, "loss": 0.7532, "step": 27291 }, { "epoch": 0.51, "learning_rate": 2.5007638276581133e-06, "loss": 0.7165, "step": 27292 }, { "epoch": 0.51, "learning_rate": 2.5006110621299136e-06, "loss": 0.8427, "step": 27293 }, { "epoch": 0.51, "learning_rate": 2.500458296599431e-06, "loss": 1.0098, "step": 27294 }, { "epoch": 0.51, "learning_rate": 2.500305531067238e-06, "loss": 1.0227, "step": 27295 }, { "epoch": 0.51, "learning_rate": 2.5001527655339046e-06, "loss": 0.9814, "step": 27296 }, { "epoch": 0.52, "learning_rate": 2.5e-06, "loss": 0.7562, "step": 27297 }, { "epoch": 0.52, "learning_rate": 2.4998472344660966e-06, "loss": 0.7417, "step": 27298 }, { "epoch": 0.52, "learning_rate": 2.4996944689327622e-06, "loss": 1.0273, "step": 27299 }, { "epoch": 0.52, "learning_rate": 2.4995417034005696e-06, "loss": 1.0764, "step": 27300 }, { "epoch": 0.52, "learning_rate": 2.4993889378700876e-06, "loss": 0.9924, "step": 27301 }, { "epoch": 0.52, "learning_rate": 2.4992361723418867e-06, "loss": 1.0543, "step": 27302 }, { "epoch": 0.52, "learning_rate": 2.4990834068165394e-06, "loss": 0.914, "step": 27303 }, { "epoch": 0.52, "learning_rate": 2.498930641294614e-06, "loss": 0.9233, "step": 27304 }, { "epoch": 0.52, "learning_rate": 2.4987778757766814e-06, "loss": 0.926, "step": 27305 }, { "epoch": 0.52, "learning_rate": 2.498625110263313e-06, "loss": 1.0021, "step": 27306 }, { "epoch": 0.52, "learning_rate": 2.4984723447550773e-06, "loss": 0.903, "step": 27307 }, { "epoch": 0.52, "learning_rate": 2.498319579252546e-06, "loss": 0.823, "step": 27308 }, { "epoch": 0.52, "learning_rate": 2.4981668137562893e-06, "loss": 0.9984, "step": 27309 }, { "epoch": 0.52, "learning_rate": 2.4980140482668787e-06, "loss": 0.8886, "step": 27310 }, { "epoch": 0.52, "learning_rate": 2.497861282784882e-06, "loss": 1.0038, "step": 27311 }, { "epoch": 0.52, "learning_rate": 2.4977085173108726e-06, "loss": 1.3054, "step": 27312 }, { "epoch": 0.52, "learning_rate": 2.4975557518454195e-06, "loss": 0.695, "step": 27313 }, { "epoch": 0.52, "learning_rate": 2.497402986389092e-06, "loss": 0.6546, "step": 27314 }, { "epoch": 0.52, "learning_rate": 2.497250220942462e-06, "loss": 0.8719, "step": 27315 }, { "epoch": 0.52, "learning_rate": 2.4970974555061e-06, "loss": 0.8511, "step": 27316 }, { "epoch": 0.52, "learning_rate": 2.496944690080575e-06, "loss": 1.0442, "step": 27317 }, { "epoch": 0.52, "learning_rate": 2.4967919246664602e-06, "loss": 1.0492, "step": 27318 }, { "epoch": 0.52, "learning_rate": 2.4966391592643236e-06, "loss": 1.1123, "step": 27319 }, { "epoch": 0.52, "learning_rate": 2.4964863938747354e-06, "loss": 0.9315, "step": 27320 }, { "epoch": 0.52, "learning_rate": 2.4963336284982677e-06, "loss": 0.8463, "step": 27321 }, { "epoch": 0.52, "learning_rate": 2.49618086313549e-06, "loss": 0.9243, "step": 27322 }, { "epoch": 0.52, "learning_rate": 2.496028097786972e-06, "loss": 1.0041, "step": 27323 }, { "epoch": 0.52, "learning_rate": 2.4958753324532863e-06, "loss": 0.9825, "step": 27324 }, { "epoch": 0.52, "learning_rate": 2.4957225671350017e-06, "loss": 1.1432, "step": 27325 }, { "epoch": 0.52, "learning_rate": 2.4955698018326884e-06, "loss": 0.8878, "step": 27326 }, { "epoch": 0.52, "learning_rate": 2.4954170365469176e-06, "loss": 0.7712, "step": 27327 }, { "epoch": 0.52, "learning_rate": 2.49526427127826e-06, "loss": 0.9632, "step": 27328 }, { "epoch": 0.52, "learning_rate": 2.4951115060272843e-06, "loss": 0.9088, "step": 27329 }, { "epoch": 0.52, "learning_rate": 2.4949587407945623e-06, "loss": 1.0044, "step": 27330 }, { "epoch": 0.52, "learning_rate": 2.4948059755806652e-06, "loss": 1.1123, "step": 27331 }, { "epoch": 0.52, "learning_rate": 2.4946532103861614e-06, "loss": 0.8697, "step": 27332 }, { "epoch": 0.52, "learning_rate": 2.494500445211623e-06, "loss": 0.7849, "step": 27333 }, { "epoch": 0.52, "learning_rate": 2.4943476800576196e-06, "loss": 0.92, "step": 27334 }, { "epoch": 0.52, "learning_rate": 2.4941949149247213e-06, "loss": 0.9875, "step": 27335 }, { "epoch": 0.52, "learning_rate": 2.4940421498134994e-06, "loss": 0.8584, "step": 27336 }, { "epoch": 0.52, "learning_rate": 2.493889384724524e-06, "loss": 1.1568, "step": 27337 }, { "epoch": 0.52, "learning_rate": 2.4937366196583647e-06, "loss": 0.861, "step": 27338 }, { "epoch": 0.52, "learning_rate": 2.493583854615594e-06, "loss": 0.8376, "step": 27339 }, { "epoch": 0.52, "learning_rate": 2.493431089596781e-06, "loss": 1.022, "step": 27340 }, { "epoch": 0.52, "learning_rate": 2.4932783246024946e-06, "loss": 0.7667, "step": 27341 }, { "epoch": 0.52, "learning_rate": 2.493125559633308e-06, "loss": 0.965, "step": 27342 }, { "epoch": 0.52, "learning_rate": 2.4929727946897896e-06, "loss": 1.1373, "step": 27343 }, { "epoch": 0.52, "learning_rate": 2.4928200297725104e-06, "loss": 0.886, "step": 27344 }, { "epoch": 0.52, "learning_rate": 2.492667264882042e-06, "loss": 0.9761, "step": 27345 }, { "epoch": 0.52, "learning_rate": 2.492514500018954e-06, "loss": 0.81, "step": 27346 }, { "epoch": 0.52, "learning_rate": 2.492361735183815e-06, "loss": 1.0206, "step": 27347 }, { "epoch": 0.52, "learning_rate": 2.4922089703771984e-06, "loss": 0.8302, "step": 27348 }, { "epoch": 0.52, "learning_rate": 2.4920562055996727e-06, "loss": 0.89, "step": 27349 }, { "epoch": 0.52, "learning_rate": 2.491903440851809e-06, "loss": 1.0241, "step": 27350 }, { "epoch": 0.52, "learning_rate": 2.4917506761341775e-06, "loss": 0.8793, "step": 27351 }, { "epoch": 0.52, "learning_rate": 2.491597911447349e-06, "loss": 1.1966, "step": 27352 }, { "epoch": 0.52, "learning_rate": 2.491445146791893e-06, "loss": 0.8129, "step": 27353 }, { "epoch": 0.52, "learning_rate": 2.4912923821683815e-06, "loss": 0.994, "step": 27354 }, { "epoch": 0.52, "learning_rate": 2.491139617577384e-06, "loss": 1.045, "step": 27355 }, { "epoch": 0.52, "learning_rate": 2.49098685301947e-06, "loss": 1.068, "step": 27356 }, { "epoch": 0.52, "learning_rate": 2.490834088495211e-06, "loss": 1.0961, "step": 27357 }, { "epoch": 0.52, "learning_rate": 2.4906813240051776e-06, "loss": 0.9831, "step": 27358 }, { "epoch": 0.52, "learning_rate": 2.490528559549939e-06, "loss": 0.9636, "step": 27359 }, { "epoch": 0.52, "learning_rate": 2.4903757951300677e-06, "loss": 0.7356, "step": 27360 }, { "epoch": 0.52, "learning_rate": 2.490223030746133e-06, "loss": 0.8976, "step": 27361 }, { "epoch": 0.52, "learning_rate": 2.490070266398704e-06, "loss": 1.2596, "step": 27362 }, { "epoch": 0.52, "learning_rate": 2.489917502088353e-06, "loss": 1.0148, "step": 27363 }, { "epoch": 0.52, "learning_rate": 2.4897647378156497e-06, "loss": 0.8363, "step": 27364 }, { "epoch": 0.52, "learning_rate": 2.4896119735811637e-06, "loss": 0.8764, "step": 27365 }, { "epoch": 0.52, "learning_rate": 2.489459209385468e-06, "loss": 0.7122, "step": 27366 }, { "epoch": 0.52, "learning_rate": 2.4893064452291305e-06, "loss": 0.9478, "step": 27367 }, { "epoch": 0.52, "learning_rate": 2.4891536811127213e-06, "loss": 0.8792, "step": 27368 }, { "epoch": 0.52, "learning_rate": 2.489000917036814e-06, "loss": 1.1439, "step": 27369 }, { "epoch": 0.52, "learning_rate": 2.488848153001975e-06, "loss": 0.7997, "step": 27370 }, { "epoch": 0.52, "learning_rate": 2.488695389008778e-06, "loss": 0.7983, "step": 27371 }, { "epoch": 0.52, "learning_rate": 2.4885426250577913e-06, "loss": 1.0129, "step": 27372 }, { "epoch": 0.52, "learning_rate": 2.4883898611495866e-06, "loss": 0.7374, "step": 27373 }, { "epoch": 0.52, "learning_rate": 2.4882370972847326e-06, "loss": 1.0205, "step": 27374 }, { "epoch": 0.52, "learning_rate": 2.4880843334638024e-06, "loss": 1.0787, "step": 27375 }, { "epoch": 0.52, "learning_rate": 2.4879315696873647e-06, "loss": 0.9589, "step": 27376 }, { "epoch": 0.52, "learning_rate": 2.4877788059559896e-06, "loss": 0.9377, "step": 27377 }, { "epoch": 0.52, "learning_rate": 2.487626042270248e-06, "loss": 0.8411, "step": 27378 }, { "epoch": 0.52, "learning_rate": 2.487473278630711e-06, "loss": 0.8069, "step": 27379 }, { "epoch": 0.52, "learning_rate": 2.4873205150379474e-06, "loss": 0.9528, "step": 27380 }, { "epoch": 0.52, "learning_rate": 2.48716775149253e-06, "loss": 1.0865, "step": 27381 }, { "epoch": 0.52, "learning_rate": 2.4870149879950277e-06, "loss": 1.0865, "step": 27382 }, { "epoch": 0.52, "learning_rate": 2.4868622245460093e-06, "loss": 0.8138, "step": 27383 }, { "epoch": 0.52, "learning_rate": 2.486709461146049e-06, "loss": 0.8779, "step": 27384 }, { "epoch": 0.52, "learning_rate": 2.486556697795714e-06, "loss": 0.9509, "step": 27385 }, { "epoch": 0.52, "learning_rate": 2.4864039344955754e-06, "loss": 0.9787, "step": 27386 }, { "epoch": 0.52, "learning_rate": 2.486251171246205e-06, "loss": 1.1364, "step": 27387 }, { "epoch": 0.52, "learning_rate": 2.486098408048173e-06, "loss": 1.0154, "step": 27388 }, { "epoch": 0.52, "learning_rate": 2.4859456449020475e-06, "loss": 0.8553, "step": 27389 }, { "epoch": 0.52, "learning_rate": 2.4857928818084014e-06, "loss": 0.8608, "step": 27390 }, { "epoch": 0.52, "learning_rate": 2.485640118767804e-06, "loss": 1.0385, "step": 27391 }, { "epoch": 0.52, "learning_rate": 2.485487355780826e-06, "loss": 0.8595, "step": 27392 }, { "epoch": 0.52, "learning_rate": 2.485334592848038e-06, "loss": 0.9839, "step": 27393 }, { "epoch": 0.52, "learning_rate": 2.4851818299700103e-06, "loss": 1.0824, "step": 27394 }, { "epoch": 0.52, "learning_rate": 2.485029067147312e-06, "loss": 0.9132, "step": 27395 }, { "epoch": 0.52, "learning_rate": 2.484876304380516e-06, "loss": 0.8128, "step": 27396 }, { "epoch": 0.52, "learning_rate": 2.484723541670192e-06, "loss": 0.9525, "step": 27397 }, { "epoch": 0.52, "learning_rate": 2.484570779016908e-06, "loss": 0.6576, "step": 27398 }, { "epoch": 0.52, "learning_rate": 2.484418016421237e-06, "loss": 0.9712, "step": 27399 }, { "epoch": 0.52, "learning_rate": 2.484265253883749e-06, "loss": 1.0659, "step": 27400 }, { "epoch": 0.52, "learning_rate": 2.484112491405013e-06, "loss": 0.7829, "step": 27401 }, { "epoch": 0.52, "learning_rate": 2.483959728985602e-06, "loss": 0.7936, "step": 27402 }, { "epoch": 0.52, "learning_rate": 2.4838069666260847e-06, "loss": 0.9893, "step": 27403 }, { "epoch": 0.52, "learning_rate": 2.4836542043270305e-06, "loss": 0.9669, "step": 27404 }, { "epoch": 0.52, "learning_rate": 2.483501442089012e-06, "loss": 0.9423, "step": 27405 }, { "epoch": 0.52, "learning_rate": 2.4833486799125985e-06, "loss": 1.1158, "step": 27406 }, { "epoch": 0.52, "learning_rate": 2.4831959177983596e-06, "loss": 1.1249, "step": 27407 }, { "epoch": 0.52, "learning_rate": 2.4830431557468676e-06, "loss": 0.9266, "step": 27408 }, { "epoch": 0.52, "learning_rate": 2.4828903937586922e-06, "loss": 1.0542, "step": 27409 }, { "epoch": 0.52, "learning_rate": 2.482737631834402e-06, "loss": 0.835, "step": 27410 }, { "epoch": 0.52, "learning_rate": 2.4825848699745705e-06, "loss": 0.9244, "step": 27411 }, { "epoch": 0.52, "learning_rate": 2.482432108179766e-06, "loss": 1.0046, "step": 27412 }, { "epoch": 0.52, "learning_rate": 2.4822793464505595e-06, "loss": 1.1847, "step": 27413 }, { "epoch": 0.52, "learning_rate": 2.482126584787521e-06, "loss": 0.8264, "step": 27414 }, { "epoch": 0.52, "learning_rate": 2.481973823191222e-06, "loss": 1.0288, "step": 27415 }, { "epoch": 0.52, "learning_rate": 2.4818210616622325e-06, "loss": 0.8979, "step": 27416 }, { "epoch": 0.52, "learning_rate": 2.481668300201121e-06, "loss": 0.8238, "step": 27417 }, { "epoch": 0.52, "learning_rate": 2.481515538808461e-06, "loss": 1.1312, "step": 27418 }, { "epoch": 0.52, "learning_rate": 2.4813627774848205e-06, "loss": 1.2092, "step": 27419 }, { "epoch": 0.52, "learning_rate": 2.4812100162307707e-06, "loss": 1.0041, "step": 27420 }, { "epoch": 0.52, "learning_rate": 2.481057255046883e-06, "loss": 0.8216, "step": 27421 }, { "epoch": 0.52, "learning_rate": 2.480904493933727e-06, "loss": 1.0174, "step": 27422 }, { "epoch": 0.52, "learning_rate": 2.4807517328918718e-06, "loss": 0.7902, "step": 27423 }, { "epoch": 0.52, "learning_rate": 2.4805989719218905e-06, "loss": 1.1071, "step": 27424 }, { "epoch": 0.52, "learning_rate": 2.480446211024351e-06, "loss": 0.8908, "step": 27425 }, { "epoch": 0.52, "learning_rate": 2.4802934501998248e-06, "loss": 1.0769, "step": 27426 }, { "epoch": 0.52, "learning_rate": 2.4801406894488824e-06, "loss": 1.0383, "step": 27427 }, { "epoch": 0.52, "learning_rate": 2.479987928772095e-06, "loss": 0.9742, "step": 27428 }, { "epoch": 0.52, "learning_rate": 2.4798351681700305e-06, "loss": 0.8959, "step": 27429 }, { "epoch": 0.52, "learning_rate": 2.4796824076432618e-06, "loss": 0.9061, "step": 27430 }, { "epoch": 0.52, "learning_rate": 2.479529647192359e-06, "loss": 1.1492, "step": 27431 }, { "epoch": 0.52, "learning_rate": 2.47937688681789e-06, "loss": 1.0897, "step": 27432 }, { "epoch": 0.52, "learning_rate": 2.479224126520428e-06, "loss": 0.8265, "step": 27433 }, { "epoch": 0.52, "learning_rate": 2.479071366300543e-06, "loss": 0.7558, "step": 27434 }, { "epoch": 0.52, "learning_rate": 2.478918606158804e-06, "loss": 0.6792, "step": 27435 }, { "epoch": 0.52, "learning_rate": 2.478765846095783e-06, "loss": 0.9326, "step": 27436 }, { "epoch": 0.52, "learning_rate": 2.47861308611205e-06, "loss": 1.0892, "step": 27437 }, { "epoch": 0.52, "learning_rate": 2.478460326208174e-06, "loss": 0.8832, "step": 27438 }, { "epoch": 0.52, "learning_rate": 2.478307566384727e-06, "loss": 0.7744, "step": 27439 }, { "epoch": 0.52, "learning_rate": 2.4781548066422793e-06, "loss": 0.8128, "step": 27440 }, { "epoch": 0.52, "learning_rate": 2.4780020469813993e-06, "loss": 0.8803, "step": 27441 }, { "epoch": 0.52, "learning_rate": 2.477849287402661e-06, "loss": 0.8655, "step": 27442 }, { "epoch": 0.52, "learning_rate": 2.477696527906632e-06, "loss": 0.9219, "step": 27443 }, { "epoch": 0.52, "learning_rate": 2.477543768493883e-06, "loss": 0.9124, "step": 27444 }, { "epoch": 0.52, "learning_rate": 2.477391009164986e-06, "loss": 1.0258, "step": 27445 }, { "epoch": 0.52, "learning_rate": 2.477238249920509e-06, "loss": 0.9186, "step": 27446 }, { "epoch": 0.52, "learning_rate": 2.4770854907610244e-06, "loss": 0.7645, "step": 27447 }, { "epoch": 0.52, "learning_rate": 2.4769327316871015e-06, "loss": 0.9323, "step": 27448 }, { "epoch": 0.52, "learning_rate": 2.4767799726993116e-06, "loss": 1.0038, "step": 27449 }, { "epoch": 0.52, "learning_rate": 2.4766272137982236e-06, "loss": 0.9482, "step": 27450 }, { "epoch": 0.52, "learning_rate": 2.47647445498441e-06, "loss": 1.033, "step": 27451 }, { "epoch": 0.52, "learning_rate": 2.4763216962584398e-06, "loss": 0.91, "step": 27452 }, { "epoch": 0.52, "learning_rate": 2.476168937620883e-06, "loss": 0.8918, "step": 27453 }, { "epoch": 0.52, "learning_rate": 2.4760161790723112e-06, "loss": 0.7767, "step": 27454 }, { "epoch": 0.52, "learning_rate": 2.4758634206132944e-06, "loss": 1.0406, "step": 27455 }, { "epoch": 0.52, "learning_rate": 2.475710662244402e-06, "loss": 1.0224, "step": 27456 }, { "epoch": 0.52, "learning_rate": 2.475557903966206e-06, "loss": 0.9702, "step": 27457 }, { "epoch": 0.52, "learning_rate": 2.4754051457792766e-06, "loss": 1.0299, "step": 27458 }, { "epoch": 0.52, "learning_rate": 2.475252387684182e-06, "loss": 1.0417, "step": 27459 }, { "epoch": 0.52, "learning_rate": 2.4750996296814957e-06, "loss": 1.0548, "step": 27460 }, { "epoch": 0.52, "learning_rate": 2.474946871771786e-06, "loss": 0.8187, "step": 27461 }, { "epoch": 0.52, "learning_rate": 2.4747941139556236e-06, "loss": 0.9995, "step": 27462 }, { "epoch": 0.52, "learning_rate": 2.4746413562335796e-06, "loss": 0.9647, "step": 27463 }, { "epoch": 0.52, "learning_rate": 2.4744885986062246e-06, "loss": 0.8992, "step": 27464 }, { "epoch": 0.52, "learning_rate": 2.474335841074127e-06, "loss": 0.9838, "step": 27465 }, { "epoch": 0.52, "learning_rate": 2.47418308363786e-06, "loss": 0.8129, "step": 27466 }, { "epoch": 0.52, "learning_rate": 2.4740303262979917e-06, "loss": 0.8824, "step": 27467 }, { "epoch": 0.52, "learning_rate": 2.4738775690550936e-06, "loss": 0.9727, "step": 27468 }, { "epoch": 0.52, "learning_rate": 2.473724811909736e-06, "loss": 0.8174, "step": 27469 }, { "epoch": 0.52, "learning_rate": 2.4735720548624887e-06, "loss": 0.9749, "step": 27470 }, { "epoch": 0.52, "learning_rate": 2.473419297913922e-06, "loss": 0.8428, "step": 27471 }, { "epoch": 0.52, "learning_rate": 2.4732665410646085e-06, "loss": 0.8222, "step": 27472 }, { "epoch": 0.52, "learning_rate": 2.4731137843151167e-06, "loss": 0.9258, "step": 27473 }, { "epoch": 0.52, "learning_rate": 2.4729610276660157e-06, "loss": 1.1948, "step": 27474 }, { "epoch": 0.52, "learning_rate": 2.4728082711178785e-06, "loss": 1.0358, "step": 27475 }, { "epoch": 0.52, "learning_rate": 2.4726555146712743e-06, "loss": 0.8996, "step": 27476 }, { "epoch": 0.52, "learning_rate": 2.4725027583267727e-06, "loss": 0.893, "step": 27477 }, { "epoch": 0.52, "learning_rate": 2.4723500020849463e-06, "loss": 1.0799, "step": 27478 }, { "epoch": 0.52, "learning_rate": 2.472197245946364e-06, "loss": 0.7402, "step": 27479 }, { "epoch": 0.52, "learning_rate": 2.472044489911595e-06, "loss": 0.8208, "step": 27480 }, { "epoch": 0.52, "learning_rate": 2.4718917339812123e-06, "loss": 1.2294, "step": 27481 }, { "epoch": 0.52, "learning_rate": 2.4717389781557843e-06, "loss": 1.0283, "step": 27482 }, { "epoch": 0.52, "learning_rate": 2.471586222435882e-06, "loss": 0.7453, "step": 27483 }, { "epoch": 0.52, "learning_rate": 2.4714334668220766e-06, "loss": 1.0464, "step": 27484 }, { "epoch": 0.52, "learning_rate": 2.471280711314938e-06, "loss": 0.8381, "step": 27485 }, { "epoch": 0.52, "learning_rate": 2.4711279559150347e-06, "loss": 0.9652, "step": 27486 }, { "epoch": 0.52, "learning_rate": 2.47097520062294e-06, "loss": 1.1309, "step": 27487 }, { "epoch": 0.52, "learning_rate": 2.470822445439223e-06, "loss": 0.9719, "step": 27488 }, { "epoch": 0.52, "learning_rate": 2.470669690364454e-06, "loss": 0.6372, "step": 27489 }, { "epoch": 0.52, "learning_rate": 2.4705169353992033e-06, "loss": 1.0678, "step": 27490 }, { "epoch": 0.52, "learning_rate": 2.470364180544042e-06, "loss": 1.0201, "step": 27491 }, { "epoch": 0.52, "learning_rate": 2.4702114257995385e-06, "loss": 0.8456, "step": 27492 }, { "epoch": 0.52, "learning_rate": 2.470058671166266e-06, "loss": 0.8919, "step": 27493 }, { "epoch": 0.52, "learning_rate": 2.4699059166447934e-06, "loss": 1.1365, "step": 27494 }, { "epoch": 0.52, "learning_rate": 2.46975316223569e-06, "loss": 0.8221, "step": 27495 }, { "epoch": 0.52, "learning_rate": 2.4696004079395284e-06, "loss": 1.0023, "step": 27496 }, { "epoch": 0.52, "learning_rate": 2.469447653756878e-06, "loss": 0.8271, "step": 27497 }, { "epoch": 0.52, "learning_rate": 2.4692948996883083e-06, "loss": 0.9254, "step": 27498 }, { "epoch": 0.52, "learning_rate": 2.4691421457343916e-06, "loss": 1.0512, "step": 27499 }, { "epoch": 0.52, "learning_rate": 2.4689893918956973e-06, "loss": 0.8993, "step": 27500 }, { "epoch": 0.52, "learning_rate": 2.4688366381727944e-06, "loss": 0.7712, "step": 27501 }, { "epoch": 0.52, "learning_rate": 2.4686838845662557e-06, "loss": 0.8516, "step": 27502 }, { "epoch": 0.52, "learning_rate": 2.46853113107665e-06, "loss": 0.9839, "step": 27503 }, { "epoch": 0.52, "learning_rate": 2.468378377704547e-06, "loss": 0.796, "step": 27504 }, { "epoch": 0.52, "learning_rate": 2.4682256244505196e-06, "loss": 1.1692, "step": 27505 }, { "epoch": 0.52, "learning_rate": 2.4680728713151366e-06, "loss": 0.9792, "step": 27506 }, { "epoch": 0.52, "learning_rate": 2.4679201182989675e-06, "loss": 0.8673, "step": 27507 }, { "epoch": 0.52, "learning_rate": 2.467767365402585e-06, "loss": 0.7457, "step": 27508 }, { "epoch": 0.52, "learning_rate": 2.4676146126265574e-06, "loss": 0.79, "step": 27509 }, { "epoch": 0.52, "learning_rate": 2.467461859971456e-06, "loss": 0.9645, "step": 27510 }, { "epoch": 0.52, "learning_rate": 2.467309107437851e-06, "loss": 0.9991, "step": 27511 }, { "epoch": 0.52, "learning_rate": 2.467156355026313e-06, "loss": 1.0441, "step": 27512 }, { "epoch": 0.52, "learning_rate": 2.467003602737411e-06, "loss": 1.0658, "step": 27513 }, { "epoch": 0.52, "learning_rate": 2.4668508505717183e-06, "loss": 0.8521, "step": 27514 }, { "epoch": 0.52, "learning_rate": 2.4666980985298036e-06, "loss": 0.9479, "step": 27515 }, { "epoch": 0.52, "learning_rate": 2.4665453466122354e-06, "loss": 0.8356, "step": 27516 }, { "epoch": 0.52, "learning_rate": 2.4663925948195868e-06, "loss": 0.9822, "step": 27517 }, { "epoch": 0.52, "learning_rate": 2.4662398431524274e-06, "loss": 1.0698, "step": 27518 }, { "epoch": 0.52, "learning_rate": 2.4660870916113264e-06, "loss": 1.0304, "step": 27519 }, { "epoch": 0.52, "learning_rate": 2.4659343401968564e-06, "loss": 0.9592, "step": 27520 }, { "epoch": 0.52, "learning_rate": 2.4657815889095866e-06, "loss": 0.8032, "step": 27521 }, { "epoch": 0.52, "learning_rate": 2.4656288377500863e-06, "loss": 1.1885, "step": 27522 }, { "epoch": 0.52, "learning_rate": 2.4654760867189275e-06, "loss": 0.8779, "step": 27523 }, { "epoch": 0.52, "learning_rate": 2.46532333581668e-06, "loss": 0.9605, "step": 27524 }, { "epoch": 0.52, "learning_rate": 2.4651705850439128e-06, "loss": 1.0632, "step": 27525 }, { "epoch": 0.52, "learning_rate": 2.465017834401199e-06, "loss": 0.8759, "step": 27526 }, { "epoch": 0.52, "learning_rate": 2.4648650838891076e-06, "loss": 0.8021, "step": 27527 }, { "epoch": 0.52, "learning_rate": 2.464712333508208e-06, "loss": 0.8116, "step": 27528 }, { "epoch": 0.52, "learning_rate": 2.4645595832590723e-06, "loss": 0.9421, "step": 27529 }, { "epoch": 0.52, "learning_rate": 2.4644068331422695e-06, "loss": 0.9601, "step": 27530 }, { "epoch": 0.52, "learning_rate": 2.4642540831583704e-06, "loss": 1.0329, "step": 27531 }, { "epoch": 0.52, "learning_rate": 2.464101333307946e-06, "loss": 0.9826, "step": 27532 }, { "epoch": 0.52, "learning_rate": 2.463948583591566e-06, "loss": 0.9034, "step": 27533 }, { "epoch": 0.52, "learning_rate": 2.4637958340098e-06, "loss": 0.7767, "step": 27534 }, { "epoch": 0.52, "learning_rate": 2.4636430845632206e-06, "loss": 0.8474, "step": 27535 }, { "epoch": 0.52, "learning_rate": 2.4634903352523963e-06, "loss": 0.9298, "step": 27536 }, { "epoch": 0.52, "learning_rate": 2.4633375860778973e-06, "loss": 0.92, "step": 27537 }, { "epoch": 0.52, "learning_rate": 2.463184837040295e-06, "loss": 1.0245, "step": 27538 }, { "epoch": 0.52, "learning_rate": 2.46303208814016e-06, "loss": 0.8008, "step": 27539 }, { "epoch": 0.52, "learning_rate": 2.462879339378061e-06, "loss": 0.8394, "step": 27540 }, { "epoch": 0.52, "learning_rate": 2.4627265907545707e-06, "loss": 1.0182, "step": 27541 }, { "epoch": 0.52, "learning_rate": 2.462573842270258e-06, "loss": 0.8322, "step": 27542 }, { "epoch": 0.52, "learning_rate": 2.462421093925692e-06, "loss": 1.064, "step": 27543 }, { "epoch": 0.52, "learning_rate": 2.462268345721446e-06, "loss": 1.0886, "step": 27544 }, { "epoch": 0.52, "learning_rate": 2.462115597658088e-06, "loss": 0.8558, "step": 27545 }, { "epoch": 0.52, "learning_rate": 2.4619628497361886e-06, "loss": 0.9677, "step": 27546 }, { "epoch": 0.52, "learning_rate": 2.46181010195632e-06, "loss": 0.9767, "step": 27547 }, { "epoch": 0.52, "learning_rate": 2.4616573543190512e-06, "loss": 0.9959, "step": 27548 }, { "epoch": 0.52, "learning_rate": 2.4615046068249517e-06, "loss": 0.8544, "step": 27549 }, { "epoch": 0.52, "learning_rate": 2.461351859474594e-06, "loss": 1.124, "step": 27550 }, { "epoch": 0.52, "learning_rate": 2.4611991122685467e-06, "loss": 1.0303, "step": 27551 }, { "epoch": 0.52, "learning_rate": 2.4610463652073805e-06, "loss": 0.7751, "step": 27552 }, { "epoch": 0.52, "learning_rate": 2.4608936182916664e-06, "loss": 0.9094, "step": 27553 }, { "epoch": 0.52, "learning_rate": 2.4607408715219745e-06, "loss": 0.8298, "step": 27554 }, { "epoch": 0.52, "learning_rate": 2.460588124898874e-06, "loss": 0.9464, "step": 27555 }, { "epoch": 0.52, "learning_rate": 2.4604353784229375e-06, "loss": 1.1176, "step": 27556 }, { "epoch": 0.52, "learning_rate": 2.460282632094734e-06, "loss": 1.0533, "step": 27557 }, { "epoch": 0.52, "learning_rate": 2.4601298859148327e-06, "loss": 0.9736, "step": 27558 }, { "epoch": 0.52, "learning_rate": 2.4599771398838055e-06, "loss": 0.7446, "step": 27559 }, { "epoch": 0.52, "learning_rate": 2.4598243940022234e-06, "loss": 0.7786, "step": 27560 }, { "epoch": 0.52, "learning_rate": 2.4596716482706546e-06, "loss": 0.874, "step": 27561 }, { "epoch": 0.52, "learning_rate": 2.4595189026896717e-06, "loss": 1.1658, "step": 27562 }, { "epoch": 0.52, "learning_rate": 2.459366157259844e-06, "loss": 0.9408, "step": 27563 }, { "epoch": 0.52, "learning_rate": 2.4592134119817406e-06, "loss": 0.9935, "step": 27564 }, { "epoch": 0.52, "learning_rate": 2.459060666855934e-06, "loss": 1.0945, "step": 27565 }, { "epoch": 0.52, "learning_rate": 2.4589079218829934e-06, "loss": 0.8942, "step": 27566 }, { "epoch": 0.52, "learning_rate": 2.458755177063489e-06, "loss": 0.7622, "step": 27567 }, { "epoch": 0.52, "learning_rate": 2.458602432397992e-06, "loss": 1.0726, "step": 27568 }, { "epoch": 0.52, "learning_rate": 2.4584496878870726e-06, "loss": 0.7694, "step": 27569 }, { "epoch": 0.52, "learning_rate": 2.4582969435312996e-06, "loss": 0.9886, "step": 27570 }, { "epoch": 0.52, "learning_rate": 2.458144199331246e-06, "loss": 0.9462, "step": 27571 }, { "epoch": 0.52, "learning_rate": 2.4579914552874796e-06, "loss": 0.8015, "step": 27572 }, { "epoch": 0.52, "learning_rate": 2.457838711400572e-06, "loss": 0.9252, "step": 27573 }, { "epoch": 0.52, "learning_rate": 2.4576859676710934e-06, "loss": 0.7905, "step": 27574 }, { "epoch": 0.52, "learning_rate": 2.457533224099615e-06, "loss": 1.0967, "step": 27575 }, { "epoch": 0.52, "learning_rate": 2.4573804806867043e-06, "loss": 0.6665, "step": 27576 }, { "epoch": 0.52, "learning_rate": 2.457227737432935e-06, "loss": 1.1179, "step": 27577 }, { "epoch": 0.52, "learning_rate": 2.457074994338876e-06, "loss": 0.9259, "step": 27578 }, { "epoch": 0.52, "learning_rate": 2.4569222514050974e-06, "loss": 0.8304, "step": 27579 }, { "epoch": 0.52, "learning_rate": 2.4567695086321693e-06, "loss": 0.7797, "step": 27580 }, { "epoch": 0.52, "learning_rate": 2.4566167660206637e-06, "loss": 0.9233, "step": 27581 }, { "epoch": 0.52, "learning_rate": 2.4564640235711485e-06, "loss": 1.0236, "step": 27582 }, { "epoch": 0.52, "learning_rate": 2.456311281284196e-06, "loss": 0.919, "step": 27583 }, { "epoch": 0.52, "learning_rate": 2.4561585391603763e-06, "loss": 1.0112, "step": 27584 }, { "epoch": 0.52, "learning_rate": 2.456005797200258e-06, "loss": 0.8095, "step": 27585 }, { "epoch": 0.52, "learning_rate": 2.455853055404414e-06, "loss": 0.9504, "step": 27586 }, { "epoch": 0.52, "learning_rate": 2.4557003137734125e-06, "loss": 1.2245, "step": 27587 }, { "epoch": 0.52, "learning_rate": 2.4555475723078243e-06, "loss": 1.1424, "step": 27588 }, { "epoch": 0.52, "learning_rate": 2.455394831008221e-06, "loss": 0.8799, "step": 27589 }, { "epoch": 0.52, "learning_rate": 2.455242089875172e-06, "loss": 0.9192, "step": 27590 }, { "epoch": 0.52, "learning_rate": 2.455089348909247e-06, "loss": 0.8668, "step": 27591 }, { "epoch": 0.52, "learning_rate": 2.454936608111018e-06, "loss": 0.8455, "step": 27592 }, { "epoch": 0.52, "learning_rate": 2.4547838674810535e-06, "loss": 1.0894, "step": 27593 }, { "epoch": 0.52, "learning_rate": 2.454631127019925e-06, "loss": 1.1332, "step": 27594 }, { "epoch": 0.52, "learning_rate": 2.454478386728202e-06, "loss": 0.9565, "step": 27595 }, { "epoch": 0.52, "learning_rate": 2.454325646606456e-06, "loss": 0.873, "step": 27596 }, { "epoch": 0.52, "learning_rate": 2.4541729066552557e-06, "loss": 0.8539, "step": 27597 }, { "epoch": 0.52, "learning_rate": 2.4540201668751733e-06, "loss": 0.8256, "step": 27598 }, { "epoch": 0.52, "learning_rate": 2.4538674272667786e-06, "loss": 0.9661, "step": 27599 }, { "epoch": 0.52, "learning_rate": 2.45371468783064e-06, "loss": 1.1083, "step": 27600 }, { "epoch": 0.52, "learning_rate": 2.4535619485673297e-06, "loss": 0.8086, "step": 27601 }, { "epoch": 0.52, "learning_rate": 2.4534092094774186e-06, "loss": 0.9738, "step": 27602 }, { "epoch": 0.52, "learning_rate": 2.453256470561475e-06, "loss": 1.0184, "step": 27603 }, { "epoch": 0.52, "learning_rate": 2.4531037318200714e-06, "loss": 0.8621, "step": 27604 }, { "epoch": 0.52, "learning_rate": 2.4529509932537766e-06, "loss": 0.7852, "step": 27605 }, { "epoch": 0.52, "learning_rate": 2.4527982548631607e-06, "loss": 1.0783, "step": 27606 }, { "epoch": 0.52, "learning_rate": 2.452645516648795e-06, "loss": 0.7359, "step": 27607 }, { "epoch": 0.52, "learning_rate": 2.45249277861125e-06, "loss": 0.8904, "step": 27608 }, { "epoch": 0.52, "learning_rate": 2.452340040751095e-06, "loss": 0.8985, "step": 27609 }, { "epoch": 0.52, "learning_rate": 2.4521873030689013e-06, "loss": 0.6585, "step": 27610 }, { "epoch": 0.52, "learning_rate": 2.4520345655652385e-06, "loss": 1.0307, "step": 27611 }, { "epoch": 0.52, "learning_rate": 2.4518818282406767e-06, "loss": 1.0931, "step": 27612 }, { "epoch": 0.52, "learning_rate": 2.4517290910957875e-06, "loss": 1.0735, "step": 27613 }, { "epoch": 0.52, "learning_rate": 2.45157635413114e-06, "loss": 1.038, "step": 27614 }, { "epoch": 0.52, "learning_rate": 2.4514236173473042e-06, "loss": 0.8603, "step": 27615 }, { "epoch": 0.52, "learning_rate": 2.451270880744852e-06, "loss": 0.8896, "step": 27616 }, { "epoch": 0.52, "learning_rate": 2.4511181443243534e-06, "loss": 0.7357, "step": 27617 }, { "epoch": 0.52, "learning_rate": 2.4509654080863764e-06, "loss": 1.0687, "step": 27618 }, { "epoch": 0.52, "learning_rate": 2.450812672031495e-06, "loss": 0.9721, "step": 27619 }, { "epoch": 0.52, "learning_rate": 2.450659936160276e-06, "loss": 0.6895, "step": 27620 }, { "epoch": 0.52, "learning_rate": 2.4505072004732923e-06, "loss": 0.7878, "step": 27621 }, { "epoch": 0.52, "learning_rate": 2.4503544649711125e-06, "loss": 0.73, "step": 27622 }, { "epoch": 0.52, "learning_rate": 2.4502017296543085e-06, "loss": 0.92, "step": 27623 }, { "epoch": 0.52, "learning_rate": 2.4500489945234485e-06, "loss": 0.7792, "step": 27624 }, { "epoch": 0.52, "learning_rate": 2.449896259579105e-06, "loss": 1.1509, "step": 27625 }, { "epoch": 0.52, "learning_rate": 2.449743524821847e-06, "loss": 0.9351, "step": 27626 }, { "epoch": 0.52, "learning_rate": 2.4495907902522448e-06, "loss": 0.8252, "step": 27627 }, { "epoch": 0.52, "learning_rate": 2.4494380558708696e-06, "loss": 0.8875, "step": 27628 }, { "epoch": 0.52, "learning_rate": 2.4492853216782913e-06, "loss": 0.7562, "step": 27629 }, { "epoch": 0.52, "learning_rate": 2.4491325876750786e-06, "loss": 1.1256, "step": 27630 }, { "epoch": 0.52, "learning_rate": 2.448979853861805e-06, "loss": 1.2184, "step": 27631 }, { "epoch": 0.52, "learning_rate": 2.448827120239039e-06, "loss": 0.8213, "step": 27632 }, { "epoch": 0.52, "learning_rate": 2.4486743868073495e-06, "loss": 0.8062, "step": 27633 }, { "epoch": 0.52, "learning_rate": 2.4485216535673097e-06, "loss": 0.8471, "step": 27634 }, { "epoch": 0.52, "learning_rate": 2.448368920519488e-06, "loss": 0.7204, "step": 27635 }, { "epoch": 0.52, "learning_rate": 2.4482161876644542e-06, "loss": 0.8248, "step": 27636 }, { "epoch": 0.52, "learning_rate": 2.448063455002781e-06, "loss": 1.0648, "step": 27637 }, { "epoch": 0.52, "learning_rate": 2.4479107225350373e-06, "loss": 1.119, "step": 27638 }, { "epoch": 0.52, "learning_rate": 2.4477579902617916e-06, "loss": 0.8277, "step": 27639 }, { "epoch": 0.52, "learning_rate": 2.4476052581836176e-06, "loss": 0.8315, "step": 27640 }, { "epoch": 0.52, "learning_rate": 2.4474525263010836e-06, "loss": 1.0187, "step": 27641 }, { "epoch": 0.52, "learning_rate": 2.44729979461476e-06, "loss": 0.7882, "step": 27642 }, { "epoch": 0.52, "learning_rate": 2.4471470631252173e-06, "loss": 1.0288, "step": 27643 }, { "epoch": 0.52, "learning_rate": 2.4469943318330267e-06, "loss": 1.0737, "step": 27644 }, { "epoch": 0.52, "learning_rate": 2.4468416007387565e-06, "loss": 1.0681, "step": 27645 }, { "epoch": 0.52, "learning_rate": 2.4466888698429786e-06, "loss": 0.9259, "step": 27646 }, { "epoch": 0.52, "learning_rate": 2.4465361391462632e-06, "loss": 0.9384, "step": 27647 }, { "epoch": 0.52, "learning_rate": 2.44638340864918e-06, "loss": 0.8936, "step": 27648 }, { "epoch": 0.52, "learning_rate": 2.446230678352299e-06, "loss": 0.7921, "step": 27649 }, { "epoch": 0.52, "learning_rate": 2.4460779482561913e-06, "loss": 1.0328, "step": 27650 }, { "epoch": 0.52, "learning_rate": 2.4459252183614276e-06, "loss": 0.9626, "step": 27651 }, { "epoch": 0.52, "learning_rate": 2.445772488668576e-06, "loss": 0.6753, "step": 27652 }, { "epoch": 0.52, "learning_rate": 2.4456197591782095e-06, "loss": 0.8802, "step": 27653 }, { "epoch": 0.52, "learning_rate": 2.445467029890897e-06, "loss": 0.8321, "step": 27654 }, { "epoch": 0.52, "learning_rate": 2.4453143008072083e-06, "loss": 0.8553, "step": 27655 }, { "epoch": 0.52, "learning_rate": 2.445161571927715e-06, "loss": 0.9781, "step": 27656 }, { "epoch": 0.52, "learning_rate": 2.4450088432529866e-06, "loss": 0.7667, "step": 27657 }, { "epoch": 0.52, "learning_rate": 2.4448561147835926e-06, "loss": 0.8393, "step": 27658 }, { "epoch": 0.52, "learning_rate": 2.444703386520105e-06, "loss": 0.8054, "step": 27659 }, { "epoch": 0.52, "learning_rate": 2.444550658463094e-06, "loss": 0.803, "step": 27660 }, { "epoch": 0.52, "learning_rate": 2.4443979306131275e-06, "loss": 0.9811, "step": 27661 }, { "epoch": 0.52, "learning_rate": 2.4442452029707782e-06, "loss": 1.1117, "step": 27662 }, { "epoch": 0.52, "learning_rate": 2.444092475536616e-06, "loss": 1.164, "step": 27663 }, { "epoch": 0.52, "learning_rate": 2.44393974831121e-06, "loss": 1.0129, "step": 27664 }, { "epoch": 0.52, "learning_rate": 2.4437870212951317e-06, "loss": 1.1095, "step": 27665 }, { "epoch": 0.52, "learning_rate": 2.4436342944889518e-06, "loss": 1.0203, "step": 27666 }, { "epoch": 0.52, "learning_rate": 2.443481567893238e-06, "loss": 0.8762, "step": 27667 }, { "epoch": 0.52, "learning_rate": 2.443328841508563e-06, "loss": 0.784, "step": 27668 }, { "epoch": 0.52, "learning_rate": 2.4431761153354967e-06, "loss": 1.1102, "step": 27669 }, { "epoch": 0.52, "learning_rate": 2.443023389374608e-06, "loss": 0.8604, "step": 27670 }, { "epoch": 0.52, "learning_rate": 2.4428706636264697e-06, "loss": 0.9209, "step": 27671 }, { "epoch": 0.52, "learning_rate": 2.4427179380916502e-06, "loss": 0.7231, "step": 27672 }, { "epoch": 0.52, "learning_rate": 2.4425652127707192e-06, "loss": 0.8763, "step": 27673 }, { "epoch": 0.52, "learning_rate": 2.442412487664249e-06, "loss": 0.8428, "step": 27674 }, { "epoch": 0.52, "learning_rate": 2.4422597627728086e-06, "loss": 1.0812, "step": 27675 }, { "epoch": 0.52, "learning_rate": 2.442107038096968e-06, "loss": 1.0097, "step": 27676 }, { "epoch": 0.52, "learning_rate": 2.441954313637298e-06, "loss": 0.686, "step": 27677 }, { "epoch": 0.52, "learning_rate": 2.44180158939437e-06, "loss": 0.8996, "step": 27678 }, { "epoch": 0.52, "learning_rate": 2.4416488653687513e-06, "loss": 0.8827, "step": 27679 }, { "epoch": 0.52, "learning_rate": 2.441496141561015e-06, "loss": 1.2681, "step": 27680 }, { "epoch": 0.52, "learning_rate": 2.4413434179717307e-06, "loss": 0.9514, "step": 27681 }, { "epoch": 0.52, "learning_rate": 2.441190694601467e-06, "loss": 0.9264, "step": 27682 }, { "epoch": 0.52, "learning_rate": 2.441037971450796e-06, "loss": 0.9695, "step": 27683 }, { "epoch": 0.52, "learning_rate": 2.440885248520288e-06, "loss": 1.1667, "step": 27684 }, { "epoch": 0.52, "learning_rate": 2.4407325258105113e-06, "loss": 0.9398, "step": 27685 }, { "epoch": 0.52, "learning_rate": 2.440579803322039e-06, "loss": 1.0195, "step": 27686 }, { "epoch": 0.52, "learning_rate": 2.44042708105544e-06, "loss": 1.1058, "step": 27687 }, { "epoch": 0.52, "learning_rate": 2.440274359011283e-06, "loss": 0.9212, "step": 27688 }, { "epoch": 0.52, "learning_rate": 2.440121637190141e-06, "loss": 0.9299, "step": 27689 }, { "epoch": 0.52, "learning_rate": 2.439968915592582e-06, "loss": 0.8851, "step": 27690 }, { "epoch": 0.52, "learning_rate": 2.4398161942191774e-06, "loss": 0.9617, "step": 27691 }, { "epoch": 0.52, "learning_rate": 2.4396634730704978e-06, "loss": 1.0092, "step": 27692 }, { "epoch": 0.52, "learning_rate": 2.4395107521471133e-06, "loss": 0.9746, "step": 27693 }, { "epoch": 0.52, "learning_rate": 2.439358031449592e-06, "loss": 1.0798, "step": 27694 }, { "epoch": 0.52, "learning_rate": 2.439205310978508e-06, "loss": 1.0468, "step": 27695 }, { "epoch": 0.52, "learning_rate": 2.4390525907344286e-06, "loss": 0.9309, "step": 27696 }, { "epoch": 0.52, "learning_rate": 2.438899870717925e-06, "loss": 1.0266, "step": 27697 }, { "epoch": 0.52, "learning_rate": 2.438747150929567e-06, "loss": 1.0082, "step": 27698 }, { "epoch": 0.52, "learning_rate": 2.4385944313699265e-06, "loss": 0.729, "step": 27699 }, { "epoch": 0.52, "learning_rate": 2.4384417120395708e-06, "loss": 1.0457, "step": 27700 }, { "epoch": 0.52, "learning_rate": 2.438288992939073e-06, "loss": 0.8269, "step": 27701 }, { "epoch": 0.52, "learning_rate": 2.4381362740690028e-06, "loss": 0.8816, "step": 27702 }, { "epoch": 0.52, "learning_rate": 2.4379835554299285e-06, "loss": 0.8513, "step": 27703 }, { "epoch": 0.52, "learning_rate": 2.437830837022422e-06, "loss": 0.8171, "step": 27704 }, { "epoch": 0.52, "learning_rate": 2.4376781188470537e-06, "loss": 0.6881, "step": 27705 }, { "epoch": 0.52, "learning_rate": 2.437525400904393e-06, "loss": 0.9898, "step": 27706 }, { "epoch": 0.52, "learning_rate": 2.437372683195011e-06, "loss": 1.019, "step": 27707 }, { "epoch": 0.52, "learning_rate": 2.4372199657194774e-06, "loss": 0.8066, "step": 27708 }, { "epoch": 0.52, "learning_rate": 2.4370672484783616e-06, "loss": 0.9583, "step": 27709 }, { "epoch": 0.52, "learning_rate": 2.436914531472236e-06, "loss": 0.9438, "step": 27710 }, { "epoch": 0.52, "learning_rate": 2.436761814701669e-06, "loss": 0.8478, "step": 27711 }, { "epoch": 0.52, "learning_rate": 2.436609098167231e-06, "loss": 1.191, "step": 27712 }, { "epoch": 0.52, "learning_rate": 2.4364563818694937e-06, "loss": 0.9257, "step": 27713 }, { "epoch": 0.52, "learning_rate": 2.436303665809026e-06, "loss": 0.9689, "step": 27714 }, { "epoch": 0.52, "learning_rate": 2.4361509499863977e-06, "loss": 1.1831, "step": 27715 }, { "epoch": 0.52, "learning_rate": 2.4359982344021808e-06, "loss": 0.9095, "step": 27716 }, { "epoch": 0.52, "learning_rate": 2.435845519056944e-06, "loss": 0.8837, "step": 27717 }, { "epoch": 0.52, "learning_rate": 2.4356928039512583e-06, "loss": 0.8906, "step": 27718 }, { "epoch": 0.52, "learning_rate": 2.4355400890856933e-06, "loss": 1.1465, "step": 27719 }, { "epoch": 0.52, "learning_rate": 2.4353873744608204e-06, "loss": 0.8169, "step": 27720 }, { "epoch": 0.52, "learning_rate": 2.435234660077208e-06, "loss": 0.8275, "step": 27721 }, { "epoch": 0.52, "learning_rate": 2.4350819459354283e-06, "loss": 0.9274, "step": 27722 }, { "epoch": 0.52, "learning_rate": 2.4349292320360505e-06, "loss": 0.8436, "step": 27723 }, { "epoch": 0.52, "learning_rate": 2.434776518379644e-06, "loss": 0.9125, "step": 27724 }, { "epoch": 0.52, "learning_rate": 2.434623804966781e-06, "loss": 1.0434, "step": 27725 }, { "epoch": 0.52, "learning_rate": 2.434471091798031e-06, "loss": 0.8672, "step": 27726 }, { "epoch": 0.52, "learning_rate": 2.4343183788739623e-06, "loss": 0.6696, "step": 27727 }, { "epoch": 0.52, "learning_rate": 2.4341656661951484e-06, "loss": 0.9275, "step": 27728 }, { "epoch": 0.52, "learning_rate": 2.434012953762158e-06, "loss": 0.7314, "step": 27729 }, { "epoch": 0.52, "learning_rate": 2.4338602415755595e-06, "loss": 1.0092, "step": 27730 }, { "epoch": 0.52, "learning_rate": 2.4337075296359263e-06, "loss": 1.0404, "step": 27731 }, { "epoch": 0.52, "learning_rate": 2.4335548179438266e-06, "loss": 1.0663, "step": 27732 }, { "epoch": 0.52, "learning_rate": 2.433402106499831e-06, "loss": 0.7958, "step": 27733 }, { "epoch": 0.52, "learning_rate": 2.4332493953045104e-06, "loss": 0.9515, "step": 27734 }, { "epoch": 0.52, "learning_rate": 2.4330966843584346e-06, "loss": 0.7338, "step": 27735 }, { "epoch": 0.52, "learning_rate": 2.432943973662173e-06, "loss": 0.8606, "step": 27736 }, { "epoch": 0.52, "learning_rate": 2.4327912632162975e-06, "loss": 1.2308, "step": 27737 }, { "epoch": 0.52, "learning_rate": 2.4326385530213764e-06, "loss": 1.0814, "step": 27738 }, { "epoch": 0.52, "learning_rate": 2.4324858430779812e-06, "loss": 0.9066, "step": 27739 }, { "epoch": 0.52, "learning_rate": 2.4323331333866818e-06, "loss": 0.7879, "step": 27740 }, { "epoch": 0.52, "learning_rate": 2.432180423948049e-06, "loss": 0.8546, "step": 27741 }, { "epoch": 0.52, "learning_rate": 2.4320277147626512e-06, "loss": 1.1829, "step": 27742 }, { "epoch": 0.52, "learning_rate": 2.4318750058310607e-06, "loss": 1.285, "step": 27743 }, { "epoch": 0.52, "learning_rate": 2.4317222971538473e-06, "loss": 0.9703, "step": 27744 }, { "epoch": 0.52, "learning_rate": 2.4315695887315798e-06, "loss": 0.9223, "step": 27745 }, { "epoch": 0.52, "learning_rate": 2.431416880564829e-06, "loss": 0.8379, "step": 27746 }, { "epoch": 0.52, "learning_rate": 2.431264172654167e-06, "loss": 0.823, "step": 27747 }, { "epoch": 0.52, "learning_rate": 2.431111465000161e-06, "loss": 0.7131, "step": 27748 }, { "epoch": 0.52, "learning_rate": 2.4309587576033834e-06, "loss": 0.8872, "step": 27749 }, { "epoch": 0.52, "learning_rate": 2.4308060504644042e-06, "loss": 1.291, "step": 27750 }, { "epoch": 0.52, "learning_rate": 2.4306533435837918e-06, "loss": 1.0126, "step": 27751 }, { "epoch": 0.52, "learning_rate": 2.4305006369621185e-06, "loss": 1.1294, "step": 27752 }, { "epoch": 0.52, "learning_rate": 2.4303479305999537e-06, "loss": 0.7722, "step": 27753 }, { "epoch": 0.52, "learning_rate": 2.430195224497867e-06, "loss": 0.7256, "step": 27754 }, { "epoch": 0.52, "learning_rate": 2.43004251865643e-06, "loss": 0.9439, "step": 27755 }, { "epoch": 0.52, "learning_rate": 2.429889813076212e-06, "loss": 1.0856, "step": 27756 }, { "epoch": 0.52, "learning_rate": 2.4297371077577826e-06, "loss": 0.8242, "step": 27757 }, { "epoch": 0.52, "learning_rate": 2.4295844027017134e-06, "loss": 0.8873, "step": 27758 }, { "epoch": 0.52, "learning_rate": 2.4294316979085734e-06, "loss": 0.8533, "step": 27759 }, { "epoch": 0.52, "learning_rate": 2.429278993378933e-06, "loss": 0.9405, "step": 27760 }, { "epoch": 0.52, "learning_rate": 2.4291262891133632e-06, "loss": 0.9374, "step": 27761 }, { "epoch": 0.52, "learning_rate": 2.428973585112434e-06, "loss": 1.1442, "step": 27762 }, { "epoch": 0.52, "learning_rate": 2.4288208813767143e-06, "loss": 1.0555, "step": 27763 }, { "epoch": 0.52, "learning_rate": 2.428668177906776e-06, "loss": 0.7679, "step": 27764 }, { "epoch": 0.52, "learning_rate": 2.4285154747031887e-06, "loss": 0.9868, "step": 27765 }, { "epoch": 0.52, "learning_rate": 2.4283627717665217e-06, "loss": 0.7477, "step": 27766 }, { "epoch": 0.52, "learning_rate": 2.428210069097346e-06, "loss": 0.9557, "step": 27767 }, { "epoch": 0.52, "learning_rate": 2.4280573666962325e-06, "loss": 1.0189, "step": 27768 }, { "epoch": 0.52, "learning_rate": 2.4279046645637496e-06, "loss": 1.0496, "step": 27769 }, { "epoch": 0.52, "learning_rate": 2.427751962700469e-06, "loss": 0.7229, "step": 27770 }, { "epoch": 0.52, "learning_rate": 2.427599261106961e-06, "loss": 0.7938, "step": 27771 }, { "epoch": 0.52, "learning_rate": 2.4274465597837937e-06, "loss": 0.8332, "step": 27772 }, { "epoch": 0.52, "learning_rate": 2.4272938587315396e-06, "loss": 0.6554, "step": 27773 }, { "epoch": 0.52, "learning_rate": 2.427141157950768e-06, "loss": 0.8411, "step": 27774 }, { "epoch": 0.52, "learning_rate": 2.4269884574420485e-06, "loss": 0.8445, "step": 27775 }, { "epoch": 0.52, "learning_rate": 2.4268357572059525e-06, "loss": 0.8363, "step": 27776 }, { "epoch": 0.52, "learning_rate": 2.4266830572430496e-06, "loss": 0.8784, "step": 27777 }, { "epoch": 0.52, "learning_rate": 2.426530357553909e-06, "loss": 1.1583, "step": 27778 }, { "epoch": 0.52, "learning_rate": 2.426377658139103e-06, "loss": 0.8739, "step": 27779 }, { "epoch": 0.52, "learning_rate": 2.4262249589991997e-06, "loss": 0.8284, "step": 27780 }, { "epoch": 0.52, "learning_rate": 2.4260722601347707e-06, "loss": 0.9879, "step": 27781 }, { "epoch": 0.52, "learning_rate": 2.425919561546385e-06, "loss": 0.9321, "step": 27782 }, { "epoch": 0.52, "learning_rate": 2.4257668632346145e-06, "loss": 0.9202, "step": 27783 }, { "epoch": 0.52, "learning_rate": 2.4256141652000266e-06, "loss": 0.9531, "step": 27784 }, { "epoch": 0.52, "learning_rate": 2.4254614674431943e-06, "loss": 0.9525, "step": 27785 }, { "epoch": 0.52, "learning_rate": 2.425308769964687e-06, "loss": 0.9389, "step": 27786 }, { "epoch": 0.52, "learning_rate": 2.425156072765073e-06, "loss": 0.9986, "step": 27787 }, { "epoch": 0.52, "learning_rate": 2.4250033758449244e-06, "loss": 1.1533, "step": 27788 }, { "epoch": 0.52, "learning_rate": 2.424850679204812e-06, "loss": 0.7847, "step": 27789 }, { "epoch": 0.52, "learning_rate": 2.4246979828453032e-06, "loss": 0.8058, "step": 27790 }, { "epoch": 0.52, "learning_rate": 2.424545286766971e-06, "loss": 0.9178, "step": 27791 }, { "epoch": 0.52, "learning_rate": 2.4243925909703847e-06, "loss": 0.6742, "step": 27792 }, { "epoch": 0.52, "learning_rate": 2.424239895456113e-06, "loss": 0.9471, "step": 27793 }, { "epoch": 0.52, "learning_rate": 2.424087200224728e-06, "loss": 0.9989, "step": 27794 }, { "epoch": 0.52, "learning_rate": 2.423934505276799e-06, "loss": 1.0538, "step": 27795 }, { "epoch": 0.52, "learning_rate": 2.423781810612895e-06, "loss": 0.884, "step": 27796 }, { "epoch": 0.52, "learning_rate": 2.423629116233589e-06, "loss": 0.7517, "step": 27797 }, { "epoch": 0.52, "learning_rate": 2.4234764221394496e-06, "loss": 0.6756, "step": 27798 }, { "epoch": 0.52, "learning_rate": 2.4233237283310453e-06, "loss": 1.0745, "step": 27799 }, { "epoch": 0.52, "learning_rate": 2.423171034808949e-06, "loss": 1.0452, "step": 27800 }, { "epoch": 0.52, "learning_rate": 2.4230183415737296e-06, "loss": 0.9772, "step": 27801 }, { "epoch": 0.52, "learning_rate": 2.4228656486259574e-06, "loss": 0.8711, "step": 27802 }, { "epoch": 0.52, "learning_rate": 2.422712955966202e-06, "loss": 0.8649, "step": 27803 }, { "epoch": 0.52, "learning_rate": 2.4225602635950346e-06, "loss": 0.8907, "step": 27804 }, { "epoch": 0.52, "learning_rate": 2.422407571513024e-06, "loss": 0.7525, "step": 27805 }, { "epoch": 0.52, "learning_rate": 2.4222548797207424e-06, "loss": 0.989, "step": 27806 }, { "epoch": 0.52, "learning_rate": 2.4221021882187585e-06, "loss": 0.9919, "step": 27807 }, { "epoch": 0.52, "learning_rate": 2.4219494970076414e-06, "loss": 0.8899, "step": 27808 }, { "epoch": 0.52, "learning_rate": 2.421796806087963e-06, "loss": 0.8191, "step": 27809 }, { "epoch": 0.52, "learning_rate": 2.4216441154602937e-06, "loss": 0.8942, "step": 27810 }, { "epoch": 0.52, "learning_rate": 2.4214914251252018e-06, "loss": 0.9971, "step": 27811 }, { "epoch": 0.52, "learning_rate": 2.4213387350832595e-06, "loss": 1.0469, "step": 27812 }, { "epoch": 0.52, "learning_rate": 2.4211860453350357e-06, "loss": 1.1987, "step": 27813 }, { "epoch": 0.52, "learning_rate": 2.4210333558811e-06, "loss": 0.7605, "step": 27814 }, { "epoch": 0.52, "learning_rate": 2.4208806667220244e-06, "loss": 0.7719, "step": 27815 }, { "epoch": 0.52, "learning_rate": 2.4207279778583774e-06, "loss": 0.8915, "step": 27816 }, { "epoch": 0.52, "learning_rate": 2.420575289290729e-06, "loss": 0.8839, "step": 27817 }, { "epoch": 0.52, "learning_rate": 2.4204226010196515e-06, "loss": 1.1035, "step": 27818 }, { "epoch": 0.52, "learning_rate": 2.4202699130457135e-06, "loss": 1.0546, "step": 27819 }, { "epoch": 0.52, "learning_rate": 2.420117225369484e-06, "loss": 1.1102, "step": 27820 }, { "epoch": 0.52, "learning_rate": 2.419964537991535e-06, "loss": 0.7923, "step": 27821 }, { "epoch": 0.52, "learning_rate": 2.419811850912436e-06, "loss": 0.9436, "step": 27822 }, { "epoch": 0.52, "learning_rate": 2.4196591641327567e-06, "loss": 0.9469, "step": 27823 }, { "epoch": 0.52, "learning_rate": 2.419506477653068e-06, "loss": 0.9686, "step": 27824 }, { "epoch": 0.52, "learning_rate": 2.41935379147394e-06, "loss": 1.0583, "step": 27825 }, { "epoch": 0.52, "learning_rate": 2.419201105595941e-06, "loss": 1.0181, "step": 27826 }, { "epoch": 0.53, "learning_rate": 2.4190484200196443e-06, "loss": 0.818, "step": 27827 }, { "epoch": 0.53, "learning_rate": 2.4188957347456184e-06, "loss": 0.889, "step": 27828 }, { "epoch": 0.53, "learning_rate": 2.4187430497744316e-06, "loss": 0.8936, "step": 27829 }, { "epoch": 0.53, "learning_rate": 2.418590365106657e-06, "loss": 0.9752, "step": 27830 }, { "epoch": 0.53, "learning_rate": 2.4184376807428635e-06, "loss": 0.9528, "step": 27831 }, { "epoch": 0.53, "learning_rate": 2.4182849966836204e-06, "loss": 1.0307, "step": 27832 }, { "epoch": 0.53, "learning_rate": 2.4181323129294993e-06, "loss": 1.074, "step": 27833 }, { "epoch": 0.53, "learning_rate": 2.41797962948107e-06, "loss": 0.8304, "step": 27834 }, { "epoch": 0.53, "learning_rate": 2.417826946338901e-06, "loss": 0.8231, "step": 27835 }, { "epoch": 0.53, "learning_rate": 2.417674263503565e-06, "loss": 0.897, "step": 27836 }, { "epoch": 0.53, "learning_rate": 2.4175215809756296e-06, "loss": 1.1456, "step": 27837 }, { "epoch": 0.53, "learning_rate": 2.417368898755666e-06, "loss": 1.0186, "step": 27838 }, { "epoch": 0.53, "learning_rate": 2.4172162168442457e-06, "loss": 0.9755, "step": 27839 }, { "epoch": 0.53, "learning_rate": 2.4170635352419373e-06, "loss": 0.8404, "step": 27840 }, { "epoch": 0.53, "learning_rate": 2.41691085394931e-06, "loss": 0.9445, "step": 27841 }, { "epoch": 0.53, "learning_rate": 2.416758172966936e-06, "loss": 0.896, "step": 27842 }, { "epoch": 0.53, "learning_rate": 2.416605492295384e-06, "loss": 1.1656, "step": 27843 }, { "epoch": 0.53, "learning_rate": 2.4164528119352244e-06, "loss": 0.9852, "step": 27844 }, { "epoch": 0.53, "learning_rate": 2.4163001318870275e-06, "loss": 0.8309, "step": 27845 }, { "epoch": 0.53, "learning_rate": 2.4161474521513646e-06, "loss": 1.0374, "step": 27846 }, { "epoch": 0.53, "learning_rate": 2.4159947727288023e-06, "loss": 0.8904, "step": 27847 }, { "epoch": 0.53, "learning_rate": 2.415842093619915e-06, "loss": 0.8784, "step": 27848 }, { "epoch": 0.53, "learning_rate": 2.41568941482527e-06, "loss": 1.2165, "step": 27849 }, { "epoch": 0.53, "learning_rate": 2.4155367363454372e-06, "loss": 0.9445, "step": 27850 }, { "epoch": 0.53, "learning_rate": 2.4153840581809887e-06, "loss": 1.0865, "step": 27851 }, { "epoch": 0.53, "learning_rate": 2.4152313803324936e-06, "loss": 0.8475, "step": 27852 }, { "epoch": 0.53, "learning_rate": 2.415078702800521e-06, "loss": 1.1181, "step": 27853 }, { "epoch": 0.53, "learning_rate": 2.414926025585643e-06, "loss": 0.8519, "step": 27854 }, { "epoch": 0.53, "learning_rate": 2.414773348688428e-06, "loss": 0.8917, "step": 27855 }, { "epoch": 0.53, "learning_rate": 2.4146206721094466e-06, "loss": 1.2377, "step": 27856 }, { "epoch": 0.53, "learning_rate": 2.41446799584927e-06, "loss": 0.7151, "step": 27857 }, { "epoch": 0.53, "learning_rate": 2.4143153199084662e-06, "loss": 0.8539, "step": 27858 }, { "epoch": 0.53, "learning_rate": 2.414162644287606e-06, "loss": 0.7223, "step": 27859 }, { "epoch": 0.53, "learning_rate": 2.4140099689872608e-06, "loss": 0.8431, "step": 27860 }, { "epoch": 0.53, "learning_rate": 2.413857294008e-06, "loss": 0.7764, "step": 27861 }, { "epoch": 0.53, "learning_rate": 2.4137046193503923e-06, "loss": 1.1292, "step": 27862 }, { "epoch": 0.53, "learning_rate": 2.41355194501501e-06, "loss": 0.9879, "step": 27863 }, { "epoch": 0.53, "learning_rate": 2.4133992710024213e-06, "loss": 0.8154, "step": 27864 }, { "epoch": 0.53, "learning_rate": 2.413246597313197e-06, "loss": 1.0948, "step": 27865 }, { "epoch": 0.53, "learning_rate": 2.4130939239479077e-06, "loss": 0.8898, "step": 27866 }, { "epoch": 0.53, "learning_rate": 2.4129412509071233e-06, "loss": 1.05, "step": 27867 }, { "epoch": 0.53, "learning_rate": 2.412788578191413e-06, "loss": 1.2632, "step": 27868 }, { "epoch": 0.53, "learning_rate": 2.412635905801348e-06, "loss": 0.9377, "step": 27869 }, { "epoch": 0.53, "learning_rate": 2.412483233737498e-06, "loss": 0.9359, "step": 27870 }, { "epoch": 0.53, "learning_rate": 2.412330562000432e-06, "loss": 0.8064, "step": 27871 }, { "epoch": 0.53, "learning_rate": 2.412177890590721e-06, "loss": 0.9874, "step": 27872 }, { "epoch": 0.53, "learning_rate": 2.412025219508936e-06, "loss": 1.0194, "step": 27873 }, { "epoch": 0.53, "learning_rate": 2.411872548755645e-06, "loss": 1.0982, "step": 27874 }, { "epoch": 0.53, "learning_rate": 2.4117198783314203e-06, "loss": 1.0166, "step": 27875 }, { "epoch": 0.53, "learning_rate": 2.411567208236831e-06, "loss": 0.7442, "step": 27876 }, { "epoch": 0.53, "learning_rate": 2.4114145384724457e-06, "loss": 0.7928, "step": 27877 }, { "epoch": 0.53, "learning_rate": 2.4112618690388366e-06, "loss": 0.8841, "step": 27878 }, { "epoch": 0.53, "learning_rate": 2.411109199936573e-06, "loss": 0.9349, "step": 27879 }, { "epoch": 0.53, "learning_rate": 2.410956531166224e-06, "loss": 0.9932, "step": 27880 }, { "epoch": 0.53, "learning_rate": 2.410803862728362e-06, "loss": 1.1183, "step": 27881 }, { "epoch": 0.53, "learning_rate": 2.4106511946235554e-06, "loss": 1.0284, "step": 27882 }, { "epoch": 0.53, "learning_rate": 2.4104985268523748e-06, "loss": 0.9051, "step": 27883 }, { "epoch": 0.53, "learning_rate": 2.410345859415389e-06, "loss": 0.8845, "step": 27884 }, { "epoch": 0.53, "learning_rate": 2.410193192313169e-06, "loss": 0.692, "step": 27885 }, { "epoch": 0.53, "learning_rate": 2.4100405255462856e-06, "loss": 0.7906, "step": 27886 }, { "epoch": 0.53, "learning_rate": 2.4098878591153067e-06, "loss": 1.063, "step": 27887 }, { "epoch": 0.53, "learning_rate": 2.4097351930208053e-06, "loss": 1.0156, "step": 27888 }, { "epoch": 0.53, "learning_rate": 2.4095825272633498e-06, "loss": 0.9124, "step": 27889 }, { "epoch": 0.53, "learning_rate": 2.4094298618435097e-06, "loss": 0.8245, "step": 27890 }, { "epoch": 0.53, "learning_rate": 2.4092771967618564e-06, "loss": 0.8066, "step": 27891 }, { "epoch": 0.53, "learning_rate": 2.4091245320189587e-06, "loss": 0.8436, "step": 27892 }, { "epoch": 0.53, "learning_rate": 2.4089718676153866e-06, "loss": 1.3629, "step": 27893 }, { "epoch": 0.53, "learning_rate": 2.408819203551712e-06, "loss": 1.1489, "step": 27894 }, { "epoch": 0.53, "learning_rate": 2.4086665398285034e-06, "loss": 1.0506, "step": 27895 }, { "epoch": 0.53, "learning_rate": 2.4085138764463307e-06, "loss": 0.8282, "step": 27896 }, { "epoch": 0.53, "learning_rate": 2.408361213405765e-06, "loss": 1.041, "step": 27897 }, { "epoch": 0.53, "learning_rate": 2.4082085507073754e-06, "loss": 0.9547, "step": 27898 }, { "epoch": 0.53, "learning_rate": 2.408055888351732e-06, "loss": 0.9856, "step": 27899 }, { "epoch": 0.53, "learning_rate": 2.407903226339405e-06, "loss": 0.8702, "step": 27900 }, { "epoch": 0.53, "learning_rate": 2.407750564670965e-06, "loss": 0.9203, "step": 27901 }, { "epoch": 0.53, "learning_rate": 2.4075979033469813e-06, "loss": 0.9346, "step": 27902 }, { "epoch": 0.53, "learning_rate": 2.407445242368025e-06, "loss": 0.8305, "step": 27903 }, { "epoch": 0.53, "learning_rate": 2.407292581734665e-06, "loss": 0.7935, "step": 27904 }, { "epoch": 0.53, "learning_rate": 2.4071399214474702e-06, "loss": 1.0073, "step": 27905 }, { "epoch": 0.53, "learning_rate": 2.4069872615070134e-06, "loss": 0.9031, "step": 27906 }, { "epoch": 0.53, "learning_rate": 2.4068346019138635e-06, "loss": 1.027, "step": 27907 }, { "epoch": 0.53, "learning_rate": 2.406681942668589e-06, "loss": 0.844, "step": 27908 }, { "epoch": 0.53, "learning_rate": 2.406529283771763e-06, "loss": 0.9232, "step": 27909 }, { "epoch": 0.53, "learning_rate": 2.406376625223953e-06, "loss": 0.7346, "step": 27910 }, { "epoch": 0.53, "learning_rate": 2.406223967025729e-06, "loss": 0.9479, "step": 27911 }, { "epoch": 0.53, "learning_rate": 2.406071309177663e-06, "loss": 1.0697, "step": 27912 }, { "epoch": 0.53, "learning_rate": 2.405918651680324e-06, "loss": 0.968, "step": 27913 }, { "epoch": 0.53, "learning_rate": 2.4057659945342804e-06, "loss": 0.7433, "step": 27914 }, { "epoch": 0.53, "learning_rate": 2.405613337740105e-06, "loss": 1.0315, "step": 27915 }, { "epoch": 0.53, "learning_rate": 2.4054606812983666e-06, "loss": 0.8433, "step": 27916 }, { "epoch": 0.53, "learning_rate": 2.405308025209634e-06, "loss": 1.0094, "step": 27917 }, { "epoch": 0.53, "learning_rate": 2.4051553694744795e-06, "loss": 1.1813, "step": 27918 }, { "epoch": 0.53, "learning_rate": 2.405002714093471e-06, "loss": 1.1553, "step": 27919 }, { "epoch": 0.53, "learning_rate": 2.40485005906718e-06, "loss": 0.8887, "step": 27920 }, { "epoch": 0.53, "learning_rate": 2.404697404396176e-06, "loss": 0.7611, "step": 27921 }, { "epoch": 0.53, "learning_rate": 2.404544750081029e-06, "loss": 0.843, "step": 27922 }, { "epoch": 0.53, "learning_rate": 2.404392096122308e-06, "loss": 0.9399, "step": 27923 }, { "epoch": 0.53, "learning_rate": 2.4042394425205855e-06, "loss": 0.9583, "step": 27924 }, { "epoch": 0.53, "learning_rate": 2.40408678927643e-06, "loss": 1.0068, "step": 27925 }, { "epoch": 0.53, "learning_rate": 2.40393413639041e-06, "loss": 0.8036, "step": 27926 }, { "epoch": 0.53, "learning_rate": 2.4037814838630974e-06, "loss": 0.8972, "step": 27927 }, { "epoch": 0.53, "learning_rate": 2.4036288316950628e-06, "loss": 1.223, "step": 27928 }, { "epoch": 0.53, "learning_rate": 2.4034761798868736e-06, "loss": 0.7704, "step": 27929 }, { "epoch": 0.53, "learning_rate": 2.4033235284391025e-06, "loss": 0.9249, "step": 27930 }, { "epoch": 0.53, "learning_rate": 2.403170877352319e-06, "loss": 1.0389, "step": 27931 }, { "epoch": 0.53, "learning_rate": 2.4030182266270906e-06, "loss": 0.967, "step": 27932 }, { "epoch": 0.53, "learning_rate": 2.402865576263991e-06, "loss": 0.8978, "step": 27933 }, { "epoch": 0.53, "learning_rate": 2.4027129262635873e-06, "loss": 0.925, "step": 27934 }, { "epoch": 0.53, "learning_rate": 2.4025602766264503e-06, "loss": 0.8916, "step": 27935 }, { "epoch": 0.53, "learning_rate": 2.4024076273531512e-06, "loss": 0.9823, "step": 27936 }, { "epoch": 0.53, "learning_rate": 2.402254978444259e-06, "loss": 0.9165, "step": 27937 }, { "epoch": 0.53, "learning_rate": 2.402102329900343e-06, "loss": 0.8914, "step": 27938 }, { "epoch": 0.53, "learning_rate": 2.4019496817219744e-06, "loss": 0.8886, "step": 27939 }, { "epoch": 0.53, "learning_rate": 2.401797033909722e-06, "loss": 0.9009, "step": 27940 }, { "epoch": 0.53, "learning_rate": 2.401644386464157e-06, "loss": 0.7141, "step": 27941 }, { "epoch": 0.53, "learning_rate": 2.401491739385849e-06, "loss": 1.1795, "step": 27942 }, { "epoch": 0.53, "learning_rate": 2.401339092675368e-06, "loss": 0.9857, "step": 27943 }, { "epoch": 0.53, "learning_rate": 2.4011864463332826e-06, "loss": 0.8351, "step": 27944 }, { "epoch": 0.53, "learning_rate": 2.4010338003601654e-06, "loss": 0.9586, "step": 27945 }, { "epoch": 0.53, "learning_rate": 2.400881154756585e-06, "loss": 0.8146, "step": 27946 }, { "epoch": 0.53, "learning_rate": 2.40072850952311e-06, "loss": 1.0279, "step": 27947 }, { "epoch": 0.53, "learning_rate": 2.4005758646603118e-06, "loss": 0.7788, "step": 27948 }, { "epoch": 0.53, "learning_rate": 2.4004232201687614e-06, "loss": 1.0948, "step": 27949 }, { "epoch": 0.53, "learning_rate": 2.400270576049027e-06, "loss": 1.049, "step": 27950 }, { "epoch": 0.53, "learning_rate": 2.400117932301679e-06, "loss": 0.956, "step": 27951 }, { "epoch": 0.53, "learning_rate": 2.3999652889272887e-06, "loss": 1.0854, "step": 27952 }, { "epoch": 0.53, "learning_rate": 2.3998126459264236e-06, "loss": 1.0757, "step": 27953 }, { "epoch": 0.53, "learning_rate": 2.399660003299656e-06, "loss": 0.9243, "step": 27954 }, { "epoch": 0.53, "learning_rate": 2.399507361047554e-06, "loss": 0.8682, "step": 27955 }, { "epoch": 0.53, "learning_rate": 2.3993547191706886e-06, "loss": 1.306, "step": 27956 }, { "epoch": 0.53, "learning_rate": 2.39920207766963e-06, "loss": 0.8844, "step": 27957 }, { "epoch": 0.53, "learning_rate": 2.399049436544948e-06, "loss": 0.8203, "step": 27958 }, { "epoch": 0.53, "learning_rate": 2.3988967957972117e-06, "loss": 0.8995, "step": 27959 }, { "epoch": 0.53, "learning_rate": 2.398744155426992e-06, "loss": 0.9257, "step": 27960 }, { "epoch": 0.53, "learning_rate": 2.3985915154348583e-06, "loss": 0.749, "step": 27961 }, { "epoch": 0.53, "learning_rate": 2.3984388758213804e-06, "loss": 1.0901, "step": 27962 }, { "epoch": 0.53, "learning_rate": 2.3982862365871294e-06, "loss": 1.0176, "step": 27963 }, { "epoch": 0.53, "learning_rate": 2.3981335977326744e-06, "loss": 0.9776, "step": 27964 }, { "epoch": 0.53, "learning_rate": 2.3979809592585846e-06, "loss": 1.0364, "step": 27965 }, { "epoch": 0.53, "learning_rate": 2.3978283211654318e-06, "loss": 1.0205, "step": 27966 }, { "epoch": 0.53, "learning_rate": 2.3976756834537847e-06, "loss": 0.8279, "step": 27967 }, { "epoch": 0.53, "learning_rate": 2.3975230461242126e-06, "loss": 1.0938, "step": 27968 }, { "epoch": 0.53, "learning_rate": 2.397370409177287e-06, "loss": 1.0233, "step": 27969 }, { "epoch": 0.53, "learning_rate": 2.3972177726135777e-06, "loss": 0.8873, "step": 27970 }, { "epoch": 0.53, "learning_rate": 2.3970651364336525e-06, "loss": 1.0491, "step": 27971 }, { "epoch": 0.53, "learning_rate": 2.3969125006380846e-06, "loss": 0.9542, "step": 27972 }, { "epoch": 0.53, "learning_rate": 2.396759865227442e-06, "loss": 1.0478, "step": 27973 }, { "epoch": 0.53, "learning_rate": 2.3966072302022937e-06, "loss": 1.0587, "step": 27974 }, { "epoch": 0.53, "learning_rate": 2.396454595563212e-06, "loss": 1.0278, "step": 27975 }, { "epoch": 0.53, "learning_rate": 2.396301961310765e-06, "loss": 1.0107, "step": 27976 }, { "epoch": 0.53, "learning_rate": 2.396149327445523e-06, "loss": 1.0558, "step": 27977 }, { "epoch": 0.53, "learning_rate": 2.395996693968057e-06, "loss": 0.6675, "step": 27978 }, { "epoch": 0.53, "learning_rate": 2.3958440608789366e-06, "loss": 1.0013, "step": 27979 }, { "epoch": 0.53, "learning_rate": 2.39569142817873e-06, "loss": 0.8188, "step": 27980 }, { "epoch": 0.53, "learning_rate": 2.3955387958680093e-06, "loss": 0.9912, "step": 27981 }, { "epoch": 0.53, "learning_rate": 2.395386163947343e-06, "loss": 1.026, "step": 27982 }, { "epoch": 0.53, "learning_rate": 2.3952335324173023e-06, "loss": 0.895, "step": 27983 }, { "epoch": 0.53, "learning_rate": 2.3950809012784555e-06, "loss": 0.7252, "step": 27984 }, { "epoch": 0.53, "learning_rate": 2.3949282705313743e-06, "loss": 1.048, "step": 27985 }, { "epoch": 0.53, "learning_rate": 2.3947756401766263e-06, "loss": 0.734, "step": 27986 }, { "epoch": 0.53, "learning_rate": 2.3946230102147844e-06, "loss": 1.0925, "step": 27987 }, { "epoch": 0.53, "learning_rate": 2.3944703806464164e-06, "loss": 0.9453, "step": 27988 }, { "epoch": 0.53, "learning_rate": 2.3943177514720923e-06, "loss": 0.9299, "step": 27989 }, { "epoch": 0.53, "learning_rate": 2.3941651226923827e-06, "loss": 0.8988, "step": 27990 }, { "epoch": 0.53, "learning_rate": 2.3940124943078576e-06, "loss": 1.0415, "step": 27991 }, { "epoch": 0.53, "learning_rate": 2.393859866319086e-06, "loss": 0.7458, "step": 27992 }, { "epoch": 0.53, "learning_rate": 2.3937072387266393e-06, "loss": 1.179, "step": 27993 }, { "epoch": 0.53, "learning_rate": 2.3935546115310863e-06, "loss": 1.0766, "step": 27994 }, { "epoch": 0.53, "learning_rate": 2.3934019847329963e-06, "loss": 0.8553, "step": 27995 }, { "epoch": 0.53, "learning_rate": 2.3932493583329406e-06, "loss": 0.9101, "step": 27996 }, { "epoch": 0.53, "learning_rate": 2.3930967323314885e-06, "loss": 0.8321, "step": 27997 }, { "epoch": 0.53, "learning_rate": 2.3929441067292095e-06, "loss": 0.7883, "step": 27998 }, { "epoch": 0.53, "learning_rate": 2.3927914815266746e-06, "loss": 1.1177, "step": 27999 }, { "epoch": 0.53, "learning_rate": 2.3926388567244534e-06, "loss": 0.9782, "step": 28000 }, { "epoch": 0.53, "learning_rate": 2.3924862323231143e-06, "loss": 1.032, "step": 28001 }, { "epoch": 0.53, "learning_rate": 2.392333608323229e-06, "loss": 0.7587, "step": 28002 }, { "epoch": 0.53, "learning_rate": 2.392180984725366e-06, "loss": 0.793, "step": 28003 }, { "epoch": 0.53, "learning_rate": 2.3920283615300965e-06, "loss": 0.7346, "step": 28004 }, { "epoch": 0.53, "learning_rate": 2.3918757387379895e-06, "loss": 1.0185, "step": 28005 }, { "epoch": 0.53, "learning_rate": 2.391723116349616e-06, "loss": 0.9966, "step": 28006 }, { "epoch": 0.53, "learning_rate": 2.391570494365544e-06, "loss": 0.8575, "step": 28007 }, { "epoch": 0.53, "learning_rate": 2.391417872786345e-06, "loss": 0.7597, "step": 28008 }, { "epoch": 0.53, "learning_rate": 2.3912652516125888e-06, "loss": 0.8604, "step": 28009 }, { "epoch": 0.53, "learning_rate": 2.3911126308448435e-06, "loss": 0.8368, "step": 28010 }, { "epoch": 0.53, "learning_rate": 2.390960010483681e-06, "loss": 0.8813, "step": 28011 }, { "epoch": 0.53, "learning_rate": 2.390807390529671e-06, "loss": 0.7542, "step": 28012 }, { "epoch": 0.53, "learning_rate": 2.3906547709833814e-06, "loss": 1.1501, "step": 28013 }, { "epoch": 0.53, "learning_rate": 2.390502151845385e-06, "loss": 0.9015, "step": 28014 }, { "epoch": 0.53, "learning_rate": 2.39034953311625e-06, "loss": 1.0061, "step": 28015 }, { "epoch": 0.53, "learning_rate": 2.390196914796545e-06, "loss": 1.1143, "step": 28016 }, { "epoch": 0.53, "learning_rate": 2.3900442968868432e-06, "loss": 0.8402, "step": 28017 }, { "epoch": 0.53, "learning_rate": 2.389891679387712e-06, "loss": 1.0051, "step": 28018 }, { "epoch": 0.53, "learning_rate": 2.389739062299721e-06, "loss": 1.0365, "step": 28019 }, { "epoch": 0.53, "learning_rate": 2.3895864456234423e-06, "loss": 0.9888, "step": 28020 }, { "epoch": 0.53, "learning_rate": 2.3894338293594445e-06, "loss": 0.9302, "step": 28021 }, { "epoch": 0.53, "learning_rate": 2.389281213508296e-06, "loss": 0.925, "step": 28022 }, { "epoch": 0.53, "learning_rate": 2.3891285980705696e-06, "loss": 0.81, "step": 28023 }, { "epoch": 0.53, "learning_rate": 2.3889759830468326e-06, "loss": 1.0141, "step": 28024 }, { "epoch": 0.53, "learning_rate": 2.388823368437656e-06, "loss": 0.8755, "step": 28025 }, { "epoch": 0.53, "learning_rate": 2.3886707542436097e-06, "loss": 0.8131, "step": 28026 }, { "epoch": 0.53, "learning_rate": 2.388518140465264e-06, "loss": 0.929, "step": 28027 }, { "epoch": 0.53, "learning_rate": 2.3883655271031867e-06, "loss": 0.7526, "step": 28028 }, { "epoch": 0.53, "learning_rate": 2.3882129141579504e-06, "loss": 0.8185, "step": 28029 }, { "epoch": 0.53, "learning_rate": 2.3880603016301234e-06, "loss": 0.9723, "step": 28030 }, { "epoch": 0.53, "learning_rate": 2.387907689520275e-06, "loss": 1.0924, "step": 28031 }, { "epoch": 0.53, "learning_rate": 2.3877550778289766e-06, "loss": 0.974, "step": 28032 }, { "epoch": 0.53, "learning_rate": 2.387602466556797e-06, "loss": 1.0458, "step": 28033 }, { "epoch": 0.53, "learning_rate": 2.3874498557043065e-06, "loss": 0.8752, "step": 28034 }, { "epoch": 0.53, "learning_rate": 2.387297245272075e-06, "loss": 0.9916, "step": 28035 }, { "epoch": 0.53, "learning_rate": 2.387144635260672e-06, "loss": 0.8869, "step": 28036 }, { "epoch": 0.53, "learning_rate": 2.386992025670667e-06, "loss": 0.8672, "step": 28037 }, { "epoch": 0.53, "learning_rate": 2.386839416502631e-06, "loss": 0.8756, "step": 28038 }, { "epoch": 0.53, "learning_rate": 2.3866868077571327e-06, "loss": 0.8996, "step": 28039 }, { "epoch": 0.53, "learning_rate": 2.3865341994347418e-06, "loss": 0.8507, "step": 28040 }, { "epoch": 0.53, "learning_rate": 2.38638159153603e-06, "loss": 0.9465, "step": 28041 }, { "epoch": 0.53, "learning_rate": 2.3862289840615656e-06, "loss": 0.7942, "step": 28042 }, { "epoch": 0.53, "learning_rate": 2.386076377011918e-06, "loss": 0.9572, "step": 28043 }, { "epoch": 0.53, "learning_rate": 2.3859237703876585e-06, "loss": 1.1082, "step": 28044 }, { "epoch": 0.53, "learning_rate": 2.3857711641893556e-06, "loss": 0.8477, "step": 28045 }, { "epoch": 0.53, "learning_rate": 2.3856185584175795e-06, "loss": 0.8855, "step": 28046 }, { "epoch": 0.53, "learning_rate": 2.3854659530729007e-06, "loss": 0.8647, "step": 28047 }, { "epoch": 0.53, "learning_rate": 2.3853133481558884e-06, "loss": 0.8459, "step": 28048 }, { "epoch": 0.53, "learning_rate": 2.385160743667112e-06, "loss": 1.0341, "step": 28049 }, { "epoch": 0.53, "learning_rate": 2.3850081396071426e-06, "loss": 1.126, "step": 28050 }, { "epoch": 0.53, "learning_rate": 2.3848555359765498e-06, "loss": 0.8803, "step": 28051 }, { "epoch": 0.53, "learning_rate": 2.384702932775901e-06, "loss": 0.9783, "step": 28052 }, { "epoch": 0.53, "learning_rate": 2.384550330005769e-06, "loss": 1.0023, "step": 28053 }, { "epoch": 0.53, "learning_rate": 2.384397727666723e-06, "loss": 0.7426, "step": 28054 }, { "epoch": 0.53, "learning_rate": 2.3842451257593312e-06, "loss": 0.8814, "step": 28055 }, { "epoch": 0.53, "learning_rate": 2.3840925242841657e-06, "loss": 1.0408, "step": 28056 }, { "epoch": 0.53, "learning_rate": 2.383939923241795e-06, "loss": 1.0063, "step": 28057 }, { "epoch": 0.53, "learning_rate": 2.383787322632788e-06, "loss": 1.2099, "step": 28058 }, { "epoch": 0.53, "learning_rate": 2.383634722457717e-06, "loss": 1.013, "step": 28059 }, { "epoch": 0.53, "learning_rate": 2.3834821227171496e-06, "loss": 0.8604, "step": 28060 }, { "epoch": 0.53, "learning_rate": 2.3833295234116556e-06, "loss": 1.0057, "step": 28061 }, { "epoch": 0.53, "learning_rate": 2.3831769245418072e-06, "loss": 0.9783, "step": 28062 }, { "epoch": 0.53, "learning_rate": 2.3830243261081723e-06, "loss": 1.0147, "step": 28063 }, { "epoch": 0.53, "learning_rate": 2.3828717281113196e-06, "loss": 1.1149, "step": 28064 }, { "epoch": 0.53, "learning_rate": 2.382719130551822e-06, "loss": 0.9405, "step": 28065 }, { "epoch": 0.53, "learning_rate": 2.3825665334302465e-06, "loss": 0.8336, "step": 28066 }, { "epoch": 0.53, "learning_rate": 2.382413936747164e-06, "loss": 0.8683, "step": 28067 }, { "epoch": 0.53, "learning_rate": 2.3822613405031443e-06, "loss": 1.0253, "step": 28068 }, { "epoch": 0.53, "learning_rate": 2.382108744698758e-06, "loss": 1.0289, "step": 28069 }, { "epoch": 0.53, "learning_rate": 2.381956149334573e-06, "loss": 0.5761, "step": 28070 }, { "epoch": 0.53, "learning_rate": 2.3818035544111606e-06, "loss": 0.7621, "step": 28071 }, { "epoch": 0.53, "learning_rate": 2.3816509599290906e-06, "loss": 0.9067, "step": 28072 }, { "epoch": 0.53, "learning_rate": 2.381498365888931e-06, "loss": 0.6816, "step": 28073 }, { "epoch": 0.53, "learning_rate": 2.3813457722912535e-06, "loss": 0.9596, "step": 28074 }, { "epoch": 0.53, "learning_rate": 2.3811931791366278e-06, "loss": 0.9497, "step": 28075 }, { "epoch": 0.53, "learning_rate": 2.3810405864256216e-06, "loss": 0.8435, "step": 28076 }, { "epoch": 0.53, "learning_rate": 2.380887994158808e-06, "loss": 0.56, "step": 28077 }, { "epoch": 0.53, "learning_rate": 2.3807354023367547e-06, "loss": 0.8819, "step": 28078 }, { "epoch": 0.53, "learning_rate": 2.3805828109600303e-06, "loss": 0.7946, "step": 28079 }, { "epoch": 0.53, "learning_rate": 2.3804302200292074e-06, "loss": 1.0296, "step": 28080 }, { "epoch": 0.53, "learning_rate": 2.380277629544854e-06, "loss": 1.1583, "step": 28081 }, { "epoch": 0.53, "learning_rate": 2.3801250395075394e-06, "loss": 0.8419, "step": 28082 }, { "epoch": 0.53, "learning_rate": 2.3799724499178356e-06, "loss": 0.7331, "step": 28083 }, { "epoch": 0.53, "learning_rate": 2.379819860776311e-06, "loss": 0.8434, "step": 28084 }, { "epoch": 0.53, "learning_rate": 2.379667272083534e-06, "loss": 0.7112, "step": 28085 }, { "epoch": 0.53, "learning_rate": 2.379514683840077e-06, "loss": 0.96, "step": 28086 }, { "epoch": 0.53, "learning_rate": 2.3793620960465082e-06, "loss": 1.1008, "step": 28087 }, { "epoch": 0.53, "learning_rate": 2.379209508703397e-06, "loss": 0.7519, "step": 28088 }, { "epoch": 0.53, "learning_rate": 2.3790569218113145e-06, "loss": 0.8037, "step": 28089 }, { "epoch": 0.53, "learning_rate": 2.3789043353708297e-06, "loss": 0.8867, "step": 28090 }, { "epoch": 0.53, "learning_rate": 2.3787517493825114e-06, "loss": 0.7814, "step": 28091 }, { "epoch": 0.53, "learning_rate": 2.3785991638469317e-06, "loss": 0.7497, "step": 28092 }, { "epoch": 0.53, "learning_rate": 2.3784465787646587e-06, "loss": 0.9685, "step": 28093 }, { "epoch": 0.53, "learning_rate": 2.378293994136262e-06, "loss": 0.881, "step": 28094 }, { "epoch": 0.53, "learning_rate": 2.3781414099623115e-06, "loss": 0.9674, "step": 28095 }, { "epoch": 0.53, "learning_rate": 2.3779888262433782e-06, "loss": 0.8255, "step": 28096 }, { "epoch": 0.53, "learning_rate": 2.3778362429800297e-06, "loss": 0.8558, "step": 28097 }, { "epoch": 0.53, "learning_rate": 2.377683660172838e-06, "loss": 0.673, "step": 28098 }, { "epoch": 0.53, "learning_rate": 2.3775310778223717e-06, "loss": 0.9637, "step": 28099 }, { "epoch": 0.53, "learning_rate": 2.3773784959291997e-06, "loss": 1.1245, "step": 28100 }, { "epoch": 0.53, "learning_rate": 2.3772259144938935e-06, "loss": 0.9364, "step": 28101 }, { "epoch": 0.53, "learning_rate": 2.377073333517022e-06, "loss": 0.9648, "step": 28102 }, { "epoch": 0.53, "learning_rate": 2.3769207529991537e-06, "loss": 0.9102, "step": 28103 }, { "epoch": 0.53, "learning_rate": 2.376768172940861e-06, "loss": 0.86, "step": 28104 }, { "epoch": 0.53, "learning_rate": 2.3766155933427116e-06, "loss": 0.9161, "step": 28105 }, { "epoch": 0.53, "learning_rate": 2.3764630142052754e-06, "loss": 1.304, "step": 28106 }, { "epoch": 0.53, "learning_rate": 2.376310435529123e-06, "loss": 1.0248, "step": 28107 }, { "epoch": 0.53, "learning_rate": 2.376157857314824e-06, "loss": 0.7862, "step": 28108 }, { "epoch": 0.53, "learning_rate": 2.376005279562947e-06, "loss": 0.9519, "step": 28109 }, { "epoch": 0.53, "learning_rate": 2.3758527022740627e-06, "loss": 0.948, "step": 28110 }, { "epoch": 0.53, "learning_rate": 2.375700125448741e-06, "loss": 0.7404, "step": 28111 }, { "epoch": 0.53, "learning_rate": 2.3755475490875506e-06, "loss": 0.8607, "step": 28112 }, { "epoch": 0.53, "learning_rate": 2.3753949731910623e-06, "loss": 1.1799, "step": 28113 }, { "epoch": 0.53, "learning_rate": 2.375242397759846e-06, "loss": 0.9605, "step": 28114 }, { "epoch": 0.53, "learning_rate": 2.3750898227944695e-06, "loss": 0.7567, "step": 28115 }, { "epoch": 0.53, "learning_rate": 2.3749372482955035e-06, "loss": 0.8654, "step": 28116 }, { "epoch": 0.53, "learning_rate": 2.3747846742635194e-06, "loss": 0.9764, "step": 28117 }, { "epoch": 0.53, "learning_rate": 2.3746321006990847e-06, "loss": 1.0429, "step": 28118 }, { "epoch": 0.53, "learning_rate": 2.3744795276027697e-06, "loss": 1.1913, "step": 28119 }, { "epoch": 0.53, "learning_rate": 2.374326954975145e-06, "loss": 0.8691, "step": 28120 }, { "epoch": 0.53, "learning_rate": 2.374174382816779e-06, "loss": 0.7945, "step": 28121 }, { "epoch": 0.53, "learning_rate": 2.374021811128242e-06, "loss": 0.9982, "step": 28122 }, { "epoch": 0.53, "learning_rate": 2.3738692399101036e-06, "loss": 0.7433, "step": 28123 }, { "epoch": 0.53, "learning_rate": 2.3737166691629345e-06, "loss": 1.0413, "step": 28124 }, { "epoch": 0.53, "learning_rate": 2.373564098887302e-06, "loss": 0.98, "step": 28125 }, { "epoch": 0.53, "learning_rate": 2.373411529083779e-06, "loss": 0.885, "step": 28126 }, { "epoch": 0.53, "learning_rate": 2.3732589597529328e-06, "loss": 0.9055, "step": 28127 }, { "epoch": 0.53, "learning_rate": 2.3731063908953328e-06, "loss": 0.8313, "step": 28128 }, { "epoch": 0.53, "learning_rate": 2.3729538225115503e-06, "loss": 0.9493, "step": 28129 }, { "epoch": 0.53, "learning_rate": 2.372801254602155e-06, "loss": 0.8672, "step": 28130 }, { "epoch": 0.53, "learning_rate": 2.3726486871677147e-06, "loss": 1.0377, "step": 28131 }, { "epoch": 0.53, "learning_rate": 2.3724961202088013e-06, "loss": 0.8731, "step": 28132 }, { "epoch": 0.53, "learning_rate": 2.3723435537259835e-06, "loss": 0.7649, "step": 28133 }, { "epoch": 0.53, "learning_rate": 2.3721909877198297e-06, "loss": 0.8057, "step": 28134 }, { "epoch": 0.53, "learning_rate": 2.3720384221909125e-06, "loss": 0.8066, "step": 28135 }, { "epoch": 0.53, "learning_rate": 2.371885857139799e-06, "loss": 1.0669, "step": 28136 }, { "epoch": 0.53, "learning_rate": 2.371733292567059e-06, "loss": 1.0472, "step": 28137 }, { "epoch": 0.53, "learning_rate": 2.3715807284732647e-06, "loss": 1.0959, "step": 28138 }, { "epoch": 0.53, "learning_rate": 2.3714281648589833e-06, "loss": 0.8734, "step": 28139 }, { "epoch": 0.53, "learning_rate": 2.3712756017247845e-06, "loss": 0.9697, "step": 28140 }, { "epoch": 0.53, "learning_rate": 2.3711230390712396e-06, "loss": 0.8245, "step": 28141 }, { "epoch": 0.53, "learning_rate": 2.370970476898917e-06, "loss": 0.9118, "step": 28142 }, { "epoch": 0.53, "learning_rate": 2.3708179152083863e-06, "loss": 0.8872, "step": 28143 }, { "epoch": 0.53, "learning_rate": 2.3706653540002176e-06, "loss": 1.1141, "step": 28144 }, { "epoch": 0.53, "learning_rate": 2.3705127932749813e-06, "loss": 0.9058, "step": 28145 }, { "epoch": 0.53, "learning_rate": 2.370360233033245e-06, "loss": 1.0707, "step": 28146 }, { "epoch": 0.53, "learning_rate": 2.370207673275581e-06, "loss": 0.7567, "step": 28147 }, { "epoch": 0.53, "learning_rate": 2.370055114002557e-06, "loss": 0.7583, "step": 28148 }, { "epoch": 0.53, "learning_rate": 2.3699025552147428e-06, "loss": 0.9279, "step": 28149 }, { "epoch": 0.53, "learning_rate": 2.3697499969127085e-06, "loss": 0.8484, "step": 28150 }, { "epoch": 0.53, "learning_rate": 2.3695974390970245e-06, "loss": 0.9003, "step": 28151 }, { "epoch": 0.53, "learning_rate": 2.3694448817682587e-06, "loss": 0.7716, "step": 28152 }, { "epoch": 0.53, "learning_rate": 2.3692923249269827e-06, "loss": 0.7475, "step": 28153 }, { "epoch": 0.53, "learning_rate": 2.369139768573765e-06, "loss": 0.7872, "step": 28154 }, { "epoch": 0.53, "learning_rate": 2.3689872127091744e-06, "loss": 1.0098, "step": 28155 }, { "epoch": 0.53, "learning_rate": 2.3688346573337826e-06, "loss": 1.1254, "step": 28156 }, { "epoch": 0.53, "learning_rate": 2.3686821024481575e-06, "loss": 1.0099, "step": 28157 }, { "epoch": 0.53, "learning_rate": 2.368529548052869e-06, "loss": 0.9404, "step": 28158 }, { "epoch": 0.53, "learning_rate": 2.368376994148488e-06, "loss": 0.8995, "step": 28159 }, { "epoch": 0.53, "learning_rate": 2.3682244407355835e-06, "loss": 0.8981, "step": 28160 }, { "epoch": 0.53, "learning_rate": 2.368071887814724e-06, "loss": 0.8535, "step": 28161 }, { "epoch": 0.53, "learning_rate": 2.367919335386481e-06, "loss": 1.0192, "step": 28162 }, { "epoch": 0.53, "learning_rate": 2.3677667834514227e-06, "loss": 0.8246, "step": 28163 }, { "epoch": 0.53, "learning_rate": 2.3676142320101186e-06, "loss": 0.83, "step": 28164 }, { "epoch": 0.53, "learning_rate": 2.3674616810631395e-06, "loss": 0.9225, "step": 28165 }, { "epoch": 0.53, "learning_rate": 2.3673091306110547e-06, "loss": 0.7592, "step": 28166 }, { "epoch": 0.53, "learning_rate": 2.3671565806544325e-06, "loss": 0.7261, "step": 28167 }, { "epoch": 0.53, "learning_rate": 2.3670040311938446e-06, "loss": 0.9251, "step": 28168 }, { "epoch": 0.53, "learning_rate": 2.3668514822298595e-06, "loss": 0.9849, "step": 28169 }, { "epoch": 0.53, "learning_rate": 2.3666989337630462e-06, "loss": 0.9994, "step": 28170 }, { "epoch": 0.53, "learning_rate": 2.3665463857939754e-06, "loss": 0.8423, "step": 28171 }, { "epoch": 0.53, "learning_rate": 2.366393838323216e-06, "loss": 1.0851, "step": 28172 }, { "epoch": 0.53, "learning_rate": 2.366241291351338e-06, "loss": 0.9012, "step": 28173 }, { "epoch": 0.53, "learning_rate": 2.3660887448789114e-06, "loss": 1.0508, "step": 28174 }, { "epoch": 0.53, "learning_rate": 2.3659361989065056e-06, "loss": 1.0492, "step": 28175 }, { "epoch": 0.53, "learning_rate": 2.3657836534346886e-06, "loss": 0.8846, "step": 28176 }, { "epoch": 0.53, "learning_rate": 2.3656311084640322e-06, "loss": 0.9066, "step": 28177 }, { "epoch": 0.53, "learning_rate": 2.365478563995105e-06, "loss": 0.8773, "step": 28178 }, { "epoch": 0.53, "learning_rate": 2.365326020028476e-06, "loss": 0.7747, "step": 28179 }, { "epoch": 0.53, "learning_rate": 2.3651734765647166e-06, "loss": 1.1788, "step": 28180 }, { "epoch": 0.53, "learning_rate": 2.3650209336043955e-06, "loss": 1.1547, "step": 28181 }, { "epoch": 0.53, "learning_rate": 2.3648683911480806e-06, "loss": 0.8671, "step": 28182 }, { "epoch": 0.53, "learning_rate": 2.3647158491963446e-06, "loss": 0.7829, "step": 28183 }, { "epoch": 0.53, "learning_rate": 2.3645633077497544e-06, "loss": 0.976, "step": 28184 }, { "epoch": 0.53, "learning_rate": 2.364410766808881e-06, "loss": 0.9143, "step": 28185 }, { "epoch": 0.53, "learning_rate": 2.3642582263742935e-06, "loss": 0.8774, "step": 28186 }, { "epoch": 0.53, "learning_rate": 2.364105686446562e-06, "loss": 1.1454, "step": 28187 }, { "epoch": 0.53, "learning_rate": 2.363953147026255e-06, "loss": 1.103, "step": 28188 }, { "epoch": 0.53, "learning_rate": 2.363800608113944e-06, "loss": 1.03, "step": 28189 }, { "epoch": 0.53, "learning_rate": 2.363648069710197e-06, "loss": 1.0548, "step": 28190 }, { "epoch": 0.53, "learning_rate": 2.363495531815583e-06, "loss": 0.9042, "step": 28191 }, { "epoch": 0.53, "learning_rate": 2.363342994430673e-06, "loss": 1.0966, "step": 28192 }, { "epoch": 0.53, "learning_rate": 2.363190457556036e-06, "loss": 1.11, "step": 28193 }, { "epoch": 0.53, "learning_rate": 2.3630379211922412e-06, "loss": 1.1074, "step": 28194 }, { "epoch": 0.53, "learning_rate": 2.3628853853398598e-06, "loss": 0.9073, "step": 28195 }, { "epoch": 0.53, "learning_rate": 2.36273284999946e-06, "loss": 0.7724, "step": 28196 }, { "epoch": 0.53, "learning_rate": 2.3625803151716105e-06, "loss": 0.8975, "step": 28197 }, { "epoch": 0.53, "learning_rate": 2.3624277808568827e-06, "loss": 0.9273, "step": 28198 }, { "epoch": 0.53, "learning_rate": 2.362275247055845e-06, "loss": 1.1227, "step": 28199 }, { "epoch": 0.53, "learning_rate": 2.3621227137690664e-06, "loss": 1.0242, "step": 28200 }, { "epoch": 0.53, "learning_rate": 2.361970180997119e-06, "loss": 0.8308, "step": 28201 }, { "epoch": 0.53, "learning_rate": 2.3618176487405707e-06, "loss": 0.8485, "step": 28202 }, { "epoch": 0.53, "learning_rate": 2.3616651169999896e-06, "loss": 0.8809, "step": 28203 }, { "epoch": 0.53, "learning_rate": 2.361512585775948e-06, "loss": 0.9093, "step": 28204 }, { "epoch": 0.53, "learning_rate": 2.3613600550690137e-06, "loss": 0.9252, "step": 28205 }, { "epoch": 0.53, "learning_rate": 2.3612075248797565e-06, "loss": 0.9775, "step": 28206 }, { "epoch": 0.53, "learning_rate": 2.3610549952087462e-06, "loss": 1.0999, "step": 28207 }, { "epoch": 0.53, "learning_rate": 2.3609024660565525e-06, "loss": 1.0117, "step": 28208 }, { "epoch": 0.53, "learning_rate": 2.3607499374237442e-06, "loss": 0.8577, "step": 28209 }, { "epoch": 0.53, "learning_rate": 2.360597409310892e-06, "loss": 0.8605, "step": 28210 }, { "epoch": 0.53, "learning_rate": 2.360444881718565e-06, "loss": 0.8638, "step": 28211 }, { "epoch": 0.53, "learning_rate": 2.3602923546473315e-06, "loss": 0.9628, "step": 28212 }, { "epoch": 0.53, "learning_rate": 2.360139828097763e-06, "loss": 1.0145, "step": 28213 }, { "epoch": 0.53, "learning_rate": 2.359987302070428e-06, "loss": 0.9514, "step": 28214 }, { "epoch": 0.53, "learning_rate": 2.3598347765658953e-06, "loss": 1.0658, "step": 28215 }, { "epoch": 0.53, "learning_rate": 2.3596822515847366e-06, "loss": 0.8069, "step": 28216 }, { "epoch": 0.53, "learning_rate": 2.3595297271275195e-06, "loss": 0.8065, "step": 28217 }, { "epoch": 0.53, "learning_rate": 2.3593772031948136e-06, "loss": 0.8004, "step": 28218 }, { "epoch": 0.53, "learning_rate": 2.359224679787189e-06, "loss": 1.0283, "step": 28219 }, { "epoch": 0.53, "learning_rate": 2.359072156905216e-06, "loss": 0.7537, "step": 28220 }, { "epoch": 0.53, "learning_rate": 2.3589196345494616e-06, "loss": 0.9505, "step": 28221 }, { "epoch": 0.53, "learning_rate": 2.3587671127204984e-06, "loss": 0.9594, "step": 28222 }, { "epoch": 0.53, "learning_rate": 2.3586145914188945e-06, "loss": 0.9255, "step": 28223 }, { "epoch": 0.53, "learning_rate": 2.3584620706452182e-06, "loss": 0.9564, "step": 28224 }, { "epoch": 0.53, "learning_rate": 2.3583095504000414e-06, "loss": 0.8081, "step": 28225 }, { "epoch": 0.53, "learning_rate": 2.358157030683932e-06, "loss": 0.8791, "step": 28226 }, { "epoch": 0.53, "learning_rate": 2.358004511497459e-06, "loss": 1.0009, "step": 28227 }, { "epoch": 0.53, "learning_rate": 2.357851992841194e-06, "loss": 0.9797, "step": 28228 }, { "epoch": 0.53, "learning_rate": 2.3576994747157055e-06, "loss": 0.9428, "step": 28229 }, { "epoch": 0.53, "learning_rate": 2.3575469571215614e-06, "loss": 0.6305, "step": 28230 }, { "epoch": 0.53, "learning_rate": 2.357394440059334e-06, "loss": 1.0881, "step": 28231 }, { "epoch": 0.53, "learning_rate": 2.3572419235295906e-06, "loss": 0.9844, "step": 28232 }, { "epoch": 0.53, "learning_rate": 2.3570894075329015e-06, "loss": 0.721, "step": 28233 }, { "epoch": 0.53, "learning_rate": 2.3569368920698364e-06, "loss": 0.9796, "step": 28234 }, { "epoch": 0.53, "learning_rate": 2.356784377140965e-06, "loss": 0.9326, "step": 28235 }, { "epoch": 0.53, "learning_rate": 2.356631862746855e-06, "loss": 0.9199, "step": 28236 }, { "epoch": 0.53, "learning_rate": 2.3564793488880787e-06, "loss": 1.1288, "step": 28237 }, { "epoch": 0.53, "learning_rate": 2.3563268355652037e-06, "loss": 0.9384, "step": 28238 }, { "epoch": 0.53, "learning_rate": 2.356174322778799e-06, "loss": 0.852, "step": 28239 }, { "epoch": 0.53, "learning_rate": 2.3560218105294355e-06, "loss": 0.6887, "step": 28240 }, { "epoch": 0.53, "learning_rate": 2.355869298817683e-06, "loss": 1.0345, "step": 28241 }, { "epoch": 0.53, "learning_rate": 2.3557167876441086e-06, "loss": 0.7494, "step": 28242 }, { "epoch": 0.53, "learning_rate": 2.3555642770092846e-06, "loss": 1.2484, "step": 28243 }, { "epoch": 0.53, "learning_rate": 2.355411766913779e-06, "loss": 1.0596, "step": 28244 }, { "epoch": 0.53, "learning_rate": 2.3552592573581603e-06, "loss": 0.893, "step": 28245 }, { "epoch": 0.53, "learning_rate": 2.3551067483430005e-06, "loss": 0.9399, "step": 28246 }, { "epoch": 0.53, "learning_rate": 2.354954239868867e-06, "loss": 1.0645, "step": 28247 }, { "epoch": 0.53, "learning_rate": 2.354801731936329e-06, "loss": 0.9406, "step": 28248 }, { "epoch": 0.53, "learning_rate": 2.3546492245459586e-06, "loss": 0.9788, "step": 28249 }, { "epoch": 0.53, "learning_rate": 2.354496717698323e-06, "loss": 1.0651, "step": 28250 }, { "epoch": 0.53, "learning_rate": 2.3543442113939915e-06, "loss": 0.7999, "step": 28251 }, { "epoch": 0.53, "learning_rate": 2.354191705633535e-06, "loss": 1.1113, "step": 28252 }, { "epoch": 0.53, "learning_rate": 2.3540392004175217e-06, "loss": 0.8972, "step": 28253 }, { "epoch": 0.53, "learning_rate": 2.353886695746522e-06, "loss": 0.8601, "step": 28254 }, { "epoch": 0.53, "learning_rate": 2.3537341916211048e-06, "loss": 0.9979, "step": 28255 }, { "epoch": 0.53, "learning_rate": 2.3535816880418395e-06, "loss": 1.0488, "step": 28256 }, { "epoch": 0.53, "learning_rate": 2.3534291850092954e-06, "loss": 0.8621, "step": 28257 }, { "epoch": 0.53, "learning_rate": 2.3532766825240427e-06, "loss": 0.8869, "step": 28258 }, { "epoch": 0.53, "learning_rate": 2.353124180586651e-06, "loss": 0.8715, "step": 28259 }, { "epoch": 0.53, "learning_rate": 2.3529716791976874e-06, "loss": 0.8657, "step": 28260 }, { "epoch": 0.53, "learning_rate": 2.352819178357724e-06, "loss": 0.7318, "step": 28261 }, { "epoch": 0.53, "learning_rate": 2.3526666780673298e-06, "loss": 0.9784, "step": 28262 }, { "epoch": 0.53, "learning_rate": 2.3525141783270724e-06, "loss": 1.0305, "step": 28263 }, { "epoch": 0.53, "learning_rate": 2.3523616791375236e-06, "loss": 0.9583, "step": 28264 }, { "epoch": 0.53, "learning_rate": 2.3522091804992518e-06, "loss": 1.0175, "step": 28265 }, { "epoch": 0.53, "learning_rate": 2.3520566824128253e-06, "loss": 1.0031, "step": 28266 }, { "epoch": 0.53, "learning_rate": 2.351904184878816e-06, "loss": 0.6492, "step": 28267 }, { "epoch": 0.53, "learning_rate": 2.3517516878977912e-06, "loss": 0.9792, "step": 28268 }, { "epoch": 0.53, "learning_rate": 2.3515991914703203e-06, "loss": 0.9946, "step": 28269 }, { "epoch": 0.53, "learning_rate": 2.3514466955969746e-06, "loss": 0.7398, "step": 28270 }, { "epoch": 0.53, "learning_rate": 2.3512942002783227e-06, "loss": 0.8988, "step": 28271 }, { "epoch": 0.53, "learning_rate": 2.3511417055149323e-06, "loss": 0.9914, "step": 28272 }, { "epoch": 0.53, "learning_rate": 2.3509892113073755e-06, "loss": 0.737, "step": 28273 }, { "epoch": 0.53, "learning_rate": 2.35083671765622e-06, "loss": 0.8671, "step": 28274 }, { "epoch": 0.53, "learning_rate": 2.350684224562035e-06, "loss": 0.9341, "step": 28275 }, { "epoch": 0.53, "learning_rate": 2.350531732025391e-06, "loss": 0.9032, "step": 28276 }, { "epoch": 0.53, "learning_rate": 2.3503792400468575e-06, "loss": 1.0255, "step": 28277 }, { "epoch": 0.53, "learning_rate": 2.350226748627002e-06, "loss": 0.9603, "step": 28278 }, { "epoch": 0.53, "learning_rate": 2.3500742577663965e-06, "loss": 0.6658, "step": 28279 }, { "epoch": 0.53, "learning_rate": 2.3499217674656094e-06, "loss": 0.9212, "step": 28280 }, { "epoch": 0.53, "learning_rate": 2.349769277725208e-06, "loss": 0.9322, "step": 28281 }, { "epoch": 0.53, "learning_rate": 2.3496167885457648e-06, "loss": 0.9317, "step": 28282 }, { "epoch": 0.53, "learning_rate": 2.349464299927848e-06, "loss": 0.9497, "step": 28283 }, { "epoch": 0.53, "learning_rate": 2.3493118118720258e-06, "loss": 1.0172, "step": 28284 }, { "epoch": 0.53, "learning_rate": 2.3491593243788704e-06, "loss": 0.6759, "step": 28285 }, { "epoch": 0.53, "learning_rate": 2.3490068374489486e-06, "loss": 0.8334, "step": 28286 }, { "epoch": 0.53, "learning_rate": 2.34885435108283e-06, "loss": 0.9185, "step": 28287 }, { "epoch": 0.53, "learning_rate": 2.3487018652810857e-06, "loss": 0.8636, "step": 28288 }, { "epoch": 0.53, "learning_rate": 2.3485493800442833e-06, "loss": 0.9355, "step": 28289 }, { "epoch": 0.53, "learning_rate": 2.3483968953729923e-06, "loss": 0.9408, "step": 28290 }, { "epoch": 0.53, "learning_rate": 2.3482444112677836e-06, "loss": 1.1084, "step": 28291 }, { "epoch": 0.53, "learning_rate": 2.348091927729226e-06, "loss": 0.9011, "step": 28292 }, { "epoch": 0.53, "learning_rate": 2.3479394447578873e-06, "loss": 0.9745, "step": 28293 }, { "epoch": 0.53, "learning_rate": 2.347786962354339e-06, "loss": 1.1508, "step": 28294 }, { "epoch": 0.53, "learning_rate": 2.3476344805191494e-06, "loss": 0.797, "step": 28295 }, { "epoch": 0.53, "learning_rate": 2.3474819992528876e-06, "loss": 0.805, "step": 28296 }, { "epoch": 0.53, "learning_rate": 2.3473295185561234e-06, "loss": 0.9406, "step": 28297 }, { "epoch": 0.53, "learning_rate": 2.3471770384294263e-06, "loss": 0.8624, "step": 28298 }, { "epoch": 0.53, "learning_rate": 2.3470245588733643e-06, "loss": 1.0006, "step": 28299 }, { "epoch": 0.53, "learning_rate": 2.3468720798885096e-06, "loss": 0.8629, "step": 28300 }, { "epoch": 0.53, "learning_rate": 2.3467196014754296e-06, "loss": 0.7989, "step": 28301 }, { "epoch": 0.53, "learning_rate": 2.3465671236346928e-06, "loss": 0.7387, "step": 28302 }, { "epoch": 0.53, "learning_rate": 2.3464146463668704e-06, "loss": 0.9857, "step": 28303 }, { "epoch": 0.53, "learning_rate": 2.3462621696725312e-06, "loss": 0.8301, "step": 28304 }, { "epoch": 0.53, "learning_rate": 2.3461096935522437e-06, "loss": 1.0761, "step": 28305 }, { "epoch": 0.53, "learning_rate": 2.3459572180065786e-06, "loss": 1.0706, "step": 28306 }, { "epoch": 0.53, "learning_rate": 2.3458047430361048e-06, "loss": 0.6567, "step": 28307 }, { "epoch": 0.53, "learning_rate": 2.3456522686413898e-06, "loss": 0.8731, "step": 28308 }, { "epoch": 0.53, "learning_rate": 2.345499794823006e-06, "loss": 0.8036, "step": 28309 }, { "epoch": 0.53, "learning_rate": 2.3453473215815206e-06, "loss": 0.9431, "step": 28310 }, { "epoch": 0.53, "learning_rate": 2.345194848917503e-06, "loss": 0.8741, "step": 28311 }, { "epoch": 0.53, "learning_rate": 2.345042376831524e-06, "loss": 1.0758, "step": 28312 }, { "epoch": 0.53, "learning_rate": 2.3448899053241526e-06, "loss": 0.8347, "step": 28313 }, { "epoch": 0.53, "learning_rate": 2.344737434395956e-06, "loss": 0.7785, "step": 28314 }, { "epoch": 0.53, "learning_rate": 2.344584964047506e-06, "loss": 0.9391, "step": 28315 }, { "epoch": 0.53, "learning_rate": 2.3444324942793704e-06, "loss": 0.9922, "step": 28316 }, { "epoch": 0.53, "learning_rate": 2.3442800250921195e-06, "loss": 0.931, "step": 28317 }, { "epoch": 0.53, "learning_rate": 2.344127556486322e-06, "loss": 0.9566, "step": 28318 }, { "epoch": 0.53, "learning_rate": 2.343975088462548e-06, "loss": 1.1163, "step": 28319 }, { "epoch": 0.53, "learning_rate": 2.3438226210213653e-06, "loss": 1.0647, "step": 28320 }, { "epoch": 0.53, "learning_rate": 2.343670154163345e-06, "loss": 0.7307, "step": 28321 }, { "epoch": 0.53, "learning_rate": 2.3435176878890555e-06, "loss": 0.9747, "step": 28322 }, { "epoch": 0.53, "learning_rate": 2.343365222199065e-06, "loss": 0.8361, "step": 28323 }, { "epoch": 0.53, "learning_rate": 2.343212757093945e-06, "loss": 0.7792, "step": 28324 }, { "epoch": 0.53, "learning_rate": 2.3430602925742642e-06, "loss": 0.9443, "step": 28325 }, { "epoch": 0.53, "learning_rate": 2.34290782864059e-06, "loss": 1.0008, "step": 28326 }, { "epoch": 0.53, "learning_rate": 2.3427553652934944e-06, "loss": 0.8848, "step": 28327 }, { "epoch": 0.53, "learning_rate": 2.342602902533545e-06, "loss": 0.9362, "step": 28328 }, { "epoch": 0.53, "learning_rate": 2.3424504403613115e-06, "loss": 0.7331, "step": 28329 }, { "epoch": 0.53, "learning_rate": 2.3422979787773637e-06, "loss": 0.8466, "step": 28330 }, { "epoch": 0.53, "learning_rate": 2.3421455177822695e-06, "loss": 1.2495, "step": 28331 }, { "epoch": 0.53, "learning_rate": 2.341993057376599e-06, "loss": 0.8685, "step": 28332 }, { "epoch": 0.53, "learning_rate": 2.3418405975609225e-06, "loss": 0.8932, "step": 28333 }, { "epoch": 0.53, "learning_rate": 2.3416881383358087e-06, "loss": 0.8766, "step": 28334 }, { "epoch": 0.53, "learning_rate": 2.341535679701825e-06, "loss": 0.8006, "step": 28335 }, { "epoch": 0.53, "learning_rate": 2.3413832216595436e-06, "loss": 1.0168, "step": 28336 }, { "epoch": 0.53, "learning_rate": 2.3412307642095317e-06, "loss": 1.2838, "step": 28337 }, { "epoch": 0.53, "learning_rate": 2.3410783073523595e-06, "loss": 0.8837, "step": 28338 }, { "epoch": 0.53, "learning_rate": 2.3409258510885956e-06, "loss": 0.913, "step": 28339 }, { "epoch": 0.53, "learning_rate": 2.3407733954188106e-06, "loss": 0.9744, "step": 28340 }, { "epoch": 0.53, "learning_rate": 2.3406209403435716e-06, "loss": 0.9059, "step": 28341 }, { "epoch": 0.53, "learning_rate": 2.3404684858634504e-06, "loss": 0.8507, "step": 28342 }, { "epoch": 0.53, "learning_rate": 2.3403160319790147e-06, "loss": 0.812, "step": 28343 }, { "epoch": 0.53, "learning_rate": 2.340163578690833e-06, "loss": 1.1067, "step": 28344 }, { "epoch": 0.53, "learning_rate": 2.3400111259994765e-06, "loss": 0.8782, "step": 28345 }, { "epoch": 0.53, "learning_rate": 2.339858673905514e-06, "loss": 0.9521, "step": 28346 }, { "epoch": 0.53, "learning_rate": 2.339706222409513e-06, "loss": 1.028, "step": 28347 }, { "epoch": 0.53, "learning_rate": 2.339553771512045e-06, "loss": 0.7975, "step": 28348 }, { "epoch": 0.53, "learning_rate": 2.3394013212136785e-06, "loss": 1.1266, "step": 28349 }, { "epoch": 0.53, "learning_rate": 2.339248871514982e-06, "loss": 1.0226, "step": 28350 }, { "epoch": 0.53, "learning_rate": 2.339096422416525e-06, "loss": 0.9264, "step": 28351 }, { "epoch": 0.53, "learning_rate": 2.3389439739188773e-06, "loss": 0.8415, "step": 28352 }, { "epoch": 0.53, "learning_rate": 2.3387915260226085e-06, "loss": 0.647, "step": 28353 }, { "epoch": 0.53, "learning_rate": 2.338639078728286e-06, "loss": 0.628, "step": 28354 }, { "epoch": 0.53, "learning_rate": 2.3384866320364812e-06, "loss": 0.7677, "step": 28355 }, { "epoch": 0.53, "learning_rate": 2.3383341859477625e-06, "loss": 1.013, "step": 28356 }, { "epoch": 0.54, "learning_rate": 2.338181740462698e-06, "loss": 0.7578, "step": 28357 }, { "epoch": 0.54, "learning_rate": 2.3380292955818582e-06, "loss": 0.8632, "step": 28358 }, { "epoch": 0.54, "learning_rate": 2.3378768513058133e-06, "loss": 0.9536, "step": 28359 }, { "epoch": 0.54, "learning_rate": 2.3377244076351292e-06, "loss": 0.8897, "step": 28360 }, { "epoch": 0.54, "learning_rate": 2.3375719645703787e-06, "loss": 0.7514, "step": 28361 }, { "epoch": 0.54, "learning_rate": 2.3374195221121295e-06, "loss": 1.1245, "step": 28362 }, { "epoch": 0.54, "learning_rate": 2.3372670802609497e-06, "loss": 1.0683, "step": 28363 }, { "epoch": 0.54, "learning_rate": 2.337114639017411e-06, "loss": 0.9997, "step": 28364 }, { "epoch": 0.54, "learning_rate": 2.33696219838208e-06, "loss": 0.9351, "step": 28365 }, { "epoch": 0.54, "learning_rate": 2.3368097583555275e-06, "loss": 0.9689, "step": 28366 }, { "epoch": 0.54, "learning_rate": 2.3366573189383227e-06, "loss": 0.7621, "step": 28367 }, { "epoch": 0.54, "learning_rate": 2.336504880131035e-06, "loss": 1.017, "step": 28368 }, { "epoch": 0.54, "learning_rate": 2.336352441934232e-06, "loss": 1.1429, "step": 28369 }, { "epoch": 0.54, "learning_rate": 2.3362000043484844e-06, "loss": 0.6846, "step": 28370 }, { "epoch": 0.54, "learning_rate": 2.336047567374361e-06, "loss": 0.9819, "step": 28371 }, { "epoch": 0.54, "learning_rate": 2.335895131012431e-06, "loss": 0.8821, "step": 28372 }, { "epoch": 0.54, "learning_rate": 2.3357426952632633e-06, "loss": 0.8174, "step": 28373 }, { "epoch": 0.54, "learning_rate": 2.3355902601274276e-06, "loss": 1.0249, "step": 28374 }, { "epoch": 0.54, "learning_rate": 2.335437825605492e-06, "loss": 1.038, "step": 28375 }, { "epoch": 0.54, "learning_rate": 2.335285391698028e-06, "loss": 0.9636, "step": 28376 }, { "epoch": 0.54, "learning_rate": 2.335132958405603e-06, "loss": 0.7935, "step": 28377 }, { "epoch": 0.54, "learning_rate": 2.334980525728785e-06, "loss": 0.967, "step": 28378 }, { "epoch": 0.54, "learning_rate": 2.3348280936681458e-06, "loss": 0.8076, "step": 28379 }, { "epoch": 0.54, "learning_rate": 2.3346756622242535e-06, "loss": 0.7339, "step": 28380 }, { "epoch": 0.54, "learning_rate": 2.3345232313976764e-06, "loss": 1.0862, "step": 28381 }, { "epoch": 0.54, "learning_rate": 2.3343708011889852e-06, "loss": 0.8768, "step": 28382 }, { "epoch": 0.54, "learning_rate": 2.3342183715987492e-06, "loss": 0.882, "step": 28383 }, { "epoch": 0.54, "learning_rate": 2.3340659426275347e-06, "loss": 0.7547, "step": 28384 }, { "epoch": 0.54, "learning_rate": 2.3339135142759145e-06, "loss": 0.8381, "step": 28385 }, { "epoch": 0.54, "learning_rate": 2.3337610865444555e-06, "loss": 0.8329, "step": 28386 }, { "epoch": 0.54, "learning_rate": 2.3336086594337268e-06, "loss": 0.9459, "step": 28387 }, { "epoch": 0.54, "learning_rate": 2.3334562329442993e-06, "loss": 0.9751, "step": 28388 }, { "epoch": 0.54, "learning_rate": 2.3333038070767417e-06, "loss": 0.7532, "step": 28389 }, { "epoch": 0.54, "learning_rate": 2.333151381831621e-06, "loss": 0.8904, "step": 28390 }, { "epoch": 0.54, "learning_rate": 2.3329989572095092e-06, "loss": 0.8966, "step": 28391 }, { "epoch": 0.54, "learning_rate": 2.3328465332109735e-06, "loss": 0.9295, "step": 28392 }, { "epoch": 0.54, "learning_rate": 2.3326941098365834e-06, "loss": 0.9779, "step": 28393 }, { "epoch": 0.54, "learning_rate": 2.332541687086909e-06, "loss": 1.1367, "step": 28394 }, { "epoch": 0.54, "learning_rate": 2.332389264962519e-06, "loss": 0.8788, "step": 28395 }, { "epoch": 0.54, "learning_rate": 2.3322368434639816e-06, "loss": 1.1027, "step": 28396 }, { "epoch": 0.54, "learning_rate": 2.332084422591867e-06, "loss": 0.7742, "step": 28397 }, { "epoch": 0.54, "learning_rate": 2.3319320023467447e-06, "loss": 0.7224, "step": 28398 }, { "epoch": 0.54, "learning_rate": 2.3317795827291816e-06, "loss": 0.9329, "step": 28399 }, { "epoch": 0.54, "learning_rate": 2.3316271637397497e-06, "loss": 1.0867, "step": 28400 }, { "epoch": 0.54, "learning_rate": 2.3314747453790166e-06, "loss": 0.7222, "step": 28401 }, { "epoch": 0.54, "learning_rate": 2.331322327647551e-06, "loss": 0.9205, "step": 28402 }, { "epoch": 0.54, "learning_rate": 2.331169910545923e-06, "loss": 0.9958, "step": 28403 }, { "epoch": 0.54, "learning_rate": 2.3310174940747023e-06, "loss": 0.7574, "step": 28404 }, { "epoch": 0.54, "learning_rate": 2.3308650782344555e-06, "loss": 1.1395, "step": 28405 }, { "epoch": 0.54, "learning_rate": 2.3307126630257547e-06, "loss": 0.9946, "step": 28406 }, { "epoch": 0.54, "learning_rate": 2.3305602484491667e-06, "loss": 1.1623, "step": 28407 }, { "epoch": 0.54, "learning_rate": 2.330407834505261e-06, "loss": 0.8655, "step": 28408 }, { "epoch": 0.54, "learning_rate": 2.3302554211946087e-06, "loss": 0.8337, "step": 28409 }, { "epoch": 0.54, "learning_rate": 2.330103008517777e-06, "loss": 1.0624, "step": 28410 }, { "epoch": 0.54, "learning_rate": 2.329950596475335e-06, "loss": 1.0679, "step": 28411 }, { "epoch": 0.54, "learning_rate": 2.329798185067853e-06, "loss": 0.8204, "step": 28412 }, { "epoch": 0.54, "learning_rate": 2.3296457742958986e-06, "loss": 0.8515, "step": 28413 }, { "epoch": 0.54, "learning_rate": 2.329493364160042e-06, "loss": 1.0276, "step": 28414 }, { "epoch": 0.54, "learning_rate": 2.3293409546608517e-06, "loss": 0.7161, "step": 28415 }, { "epoch": 0.54, "learning_rate": 2.3291885457988977e-06, "loss": 0.6992, "step": 28416 }, { "epoch": 0.54, "learning_rate": 2.3290361375747476e-06, "loss": 0.631, "step": 28417 }, { "epoch": 0.54, "learning_rate": 2.328883729988972e-06, "loss": 0.9817, "step": 28418 }, { "epoch": 0.54, "learning_rate": 2.3287313230421395e-06, "loss": 0.6824, "step": 28419 }, { "epoch": 0.54, "learning_rate": 2.328578916734818e-06, "loss": 0.8081, "step": 28420 }, { "epoch": 0.54, "learning_rate": 2.3284265110675777e-06, "loss": 0.8181, "step": 28421 }, { "epoch": 0.54, "learning_rate": 2.3282741060409884e-06, "loss": 0.7824, "step": 28422 }, { "epoch": 0.54, "learning_rate": 2.3281217016556175e-06, "loss": 0.7, "step": 28423 }, { "epoch": 0.54, "learning_rate": 2.3279692979120354e-06, "loss": 1.0781, "step": 28424 }, { "epoch": 0.54, "learning_rate": 2.327816894810811e-06, "loss": 1.0803, "step": 28425 }, { "epoch": 0.54, "learning_rate": 2.327664492352512e-06, "loss": 0.7483, "step": 28426 }, { "epoch": 0.54, "learning_rate": 2.3275120905377094e-06, "loss": 0.827, "step": 28427 }, { "epoch": 0.54, "learning_rate": 2.327359689366971e-06, "loss": 0.8715, "step": 28428 }, { "epoch": 0.54, "learning_rate": 2.3272072888408654e-06, "loss": 0.9644, "step": 28429 }, { "epoch": 0.54, "learning_rate": 2.3270548889599636e-06, "loss": 0.8149, "step": 28430 }, { "epoch": 0.54, "learning_rate": 2.3269024897248338e-06, "loss": 1.2926, "step": 28431 }, { "epoch": 0.54, "learning_rate": 2.3267500911360435e-06, "loss": 0.8107, "step": 28432 }, { "epoch": 0.54, "learning_rate": 2.3265976931941644e-06, "loss": 0.9583, "step": 28433 }, { "epoch": 0.54, "learning_rate": 2.3264452958997637e-06, "loss": 1.0219, "step": 28434 }, { "epoch": 0.54, "learning_rate": 2.3262928992534105e-06, "loss": 0.7433, "step": 28435 }, { "epoch": 0.54, "learning_rate": 2.326140503255675e-06, "loss": 0.7187, "step": 28436 }, { "epoch": 0.54, "learning_rate": 2.3259881079071253e-06, "loss": 1.1449, "step": 28437 }, { "epoch": 0.54, "learning_rate": 2.32583571320833e-06, "loss": 0.8882, "step": 28438 }, { "epoch": 0.54, "learning_rate": 2.3256833191598594e-06, "loss": 1.0357, "step": 28439 }, { "epoch": 0.54, "learning_rate": 2.3255309257622825e-06, "loss": 0.8738, "step": 28440 }, { "epoch": 0.54, "learning_rate": 2.3253785330161666e-06, "loss": 0.8436, "step": 28441 }, { "epoch": 0.54, "learning_rate": 2.3252261409220823e-06, "loss": 0.8101, "step": 28442 }, { "epoch": 0.54, "learning_rate": 2.325073749480599e-06, "loss": 1.2432, "step": 28443 }, { "epoch": 0.54, "learning_rate": 2.3249213586922836e-06, "loss": 1.119, "step": 28444 }, { "epoch": 0.54, "learning_rate": 2.3247689685577075e-06, "loss": 0.9911, "step": 28445 }, { "epoch": 0.54, "learning_rate": 2.324616579077439e-06, "loss": 0.7878, "step": 28446 }, { "epoch": 0.54, "learning_rate": 2.3244641902520455e-06, "loss": 0.9561, "step": 28447 }, { "epoch": 0.54, "learning_rate": 2.324311802082099e-06, "loss": 0.754, "step": 28448 }, { "epoch": 0.54, "learning_rate": 2.324159414568165e-06, "loss": 1.0335, "step": 28449 }, { "epoch": 0.54, "learning_rate": 2.324007027710815e-06, "loss": 1.0222, "step": 28450 }, { "epoch": 0.54, "learning_rate": 2.323854641510618e-06, "loss": 1.0988, "step": 28451 }, { "epoch": 0.54, "learning_rate": 2.3237022559681427e-06, "loss": 0.8722, "step": 28452 }, { "epoch": 0.54, "learning_rate": 2.3235498710839562e-06, "loss": 0.9456, "step": 28453 }, { "epoch": 0.54, "learning_rate": 2.3233974868586306e-06, "loss": 0.8114, "step": 28454 }, { "epoch": 0.54, "learning_rate": 2.3232451032927323e-06, "loss": 0.9247, "step": 28455 }, { "epoch": 0.54, "learning_rate": 2.323092720386832e-06, "loss": 0.994, "step": 28456 }, { "epoch": 0.54, "learning_rate": 2.3229403381414975e-06, "loss": 0.9539, "step": 28457 }, { "epoch": 0.54, "learning_rate": 2.3227879565572994e-06, "loss": 0.7803, "step": 28458 }, { "epoch": 0.54, "learning_rate": 2.322635575634804e-06, "loss": 0.8803, "step": 28459 }, { "epoch": 0.54, "learning_rate": 2.3224831953745837e-06, "loss": 0.7253, "step": 28460 }, { "epoch": 0.54, "learning_rate": 2.322330815777205e-06, "loss": 0.8687, "step": 28461 }, { "epoch": 0.54, "learning_rate": 2.3221784368432366e-06, "loss": 1.0508, "step": 28462 }, { "epoch": 0.54, "learning_rate": 2.3220260585732493e-06, "loss": 1.0731, "step": 28463 }, { "epoch": 0.54, "learning_rate": 2.3218736809678118e-06, "loss": 0.8719, "step": 28464 }, { "epoch": 0.54, "learning_rate": 2.3217213040274912e-06, "loss": 0.9046, "step": 28465 }, { "epoch": 0.54, "learning_rate": 2.321568927752859e-06, "loss": 0.8242, "step": 28466 }, { "epoch": 0.54, "learning_rate": 2.3214165521444833e-06, "loss": 1.0318, "step": 28467 }, { "epoch": 0.54, "learning_rate": 2.321264177202931e-06, "loss": 1.0473, "step": 28468 }, { "epoch": 0.54, "learning_rate": 2.321111802928774e-06, "loss": 1.0232, "step": 28469 }, { "epoch": 0.54, "learning_rate": 2.3209594293225798e-06, "loss": 0.9708, "step": 28470 }, { "epoch": 0.54, "learning_rate": 2.320807056384917e-06, "loss": 0.9502, "step": 28471 }, { "epoch": 0.54, "learning_rate": 2.320654684116356e-06, "loss": 1.0262, "step": 28472 }, { "epoch": 0.54, "learning_rate": 2.320502312517465e-06, "loss": 0.782, "step": 28473 }, { "epoch": 0.54, "learning_rate": 2.320349941588812e-06, "loss": 1.0231, "step": 28474 }, { "epoch": 0.54, "learning_rate": 2.3201975713309676e-06, "loss": 0.8774, "step": 28475 }, { "epoch": 0.54, "learning_rate": 2.3200452017445e-06, "loss": 1.0284, "step": 28476 }, { "epoch": 0.54, "learning_rate": 2.3198928328299774e-06, "loss": 1.0784, "step": 28477 }, { "epoch": 0.54, "learning_rate": 2.3197404645879694e-06, "loss": 0.8508, "step": 28478 }, { "epoch": 0.54, "learning_rate": 2.319588097019046e-06, "loss": 0.6703, "step": 28479 }, { "epoch": 0.54, "learning_rate": 2.3194357301237735e-06, "loss": 0.8885, "step": 28480 }, { "epoch": 0.54, "learning_rate": 2.319283363902724e-06, "loss": 1.0535, "step": 28481 }, { "epoch": 0.54, "learning_rate": 2.319130998356465e-06, "loss": 0.8152, "step": 28482 }, { "epoch": 0.54, "learning_rate": 2.318978633485564e-06, "loss": 0.8421, "step": 28483 }, { "epoch": 0.54, "learning_rate": 2.318826269290591e-06, "loss": 0.9211, "step": 28484 }, { "epoch": 0.54, "learning_rate": 2.3186739057721167e-06, "loss": 0.8002, "step": 28485 }, { "epoch": 0.54, "learning_rate": 2.3185215429307074e-06, "loss": 1.0308, "step": 28486 }, { "epoch": 0.54, "learning_rate": 2.318369180766934e-06, "loss": 1.1025, "step": 28487 }, { "epoch": 0.54, "learning_rate": 2.3182168192813642e-06, "loss": 0.9668, "step": 28488 }, { "epoch": 0.54, "learning_rate": 2.3180644584745662e-06, "loss": 0.8566, "step": 28489 }, { "epoch": 0.54, "learning_rate": 2.317912098347111e-06, "loss": 0.9243, "step": 28490 }, { "epoch": 0.54, "learning_rate": 2.3177597388995663e-06, "loss": 0.8815, "step": 28491 }, { "epoch": 0.54, "learning_rate": 2.3176073801325007e-06, "loss": 0.8781, "step": 28492 }, { "epoch": 0.54, "learning_rate": 2.317455022046484e-06, "loss": 0.7137, "step": 28493 }, { "epoch": 0.54, "learning_rate": 2.317302664642085e-06, "loss": 0.9107, "step": 28494 }, { "epoch": 0.54, "learning_rate": 2.317150307919871e-06, "loss": 0.7982, "step": 28495 }, { "epoch": 0.54, "learning_rate": 2.3169979518804136e-06, "loss": 0.8887, "step": 28496 }, { "epoch": 0.54, "learning_rate": 2.3168455965242793e-06, "loss": 0.9435, "step": 28497 }, { "epoch": 0.54, "learning_rate": 2.3166932418520378e-06, "loss": 0.8292, "step": 28498 }, { "epoch": 0.54, "learning_rate": 2.3165408878642586e-06, "loss": 0.8558, "step": 28499 }, { "epoch": 0.54, "learning_rate": 2.3163885345615105e-06, "loss": 1.3382, "step": 28500 }, { "epoch": 0.54, "learning_rate": 2.3162361819443606e-06, "loss": 0.9527, "step": 28501 }, { "epoch": 0.54, "learning_rate": 2.3160838300133807e-06, "loss": 0.8401, "step": 28502 }, { "epoch": 0.54, "learning_rate": 2.315931478769138e-06, "loss": 0.9412, "step": 28503 }, { "epoch": 0.54, "learning_rate": 2.3157791282122004e-06, "loss": 0.832, "step": 28504 }, { "epoch": 0.54, "learning_rate": 2.3156267783431384e-06, "loss": 0.7845, "step": 28505 }, { "epoch": 0.54, "learning_rate": 2.3154744291625206e-06, "loss": 1.2513, "step": 28506 }, { "epoch": 0.54, "learning_rate": 2.3153220806709146e-06, "loss": 0.8188, "step": 28507 }, { "epoch": 0.54, "learning_rate": 2.3151697328688917e-06, "loss": 0.9752, "step": 28508 }, { "epoch": 0.54, "learning_rate": 2.3150173857570193e-06, "loss": 0.9806, "step": 28509 }, { "epoch": 0.54, "learning_rate": 2.314865039335865e-06, "loss": 0.7819, "step": 28510 }, { "epoch": 0.54, "learning_rate": 2.3147126936060007e-06, "loss": 0.845, "step": 28511 }, { "epoch": 0.54, "learning_rate": 2.3145603485679923e-06, "loss": 0.9041, "step": 28512 }, { "epoch": 0.54, "learning_rate": 2.3144080042224093e-06, "loss": 1.1313, "step": 28513 }, { "epoch": 0.54, "learning_rate": 2.3142556605698225e-06, "loss": 0.9236, "step": 28514 }, { "epoch": 0.54, "learning_rate": 2.3141033176107993e-06, "loss": 0.9, "step": 28515 }, { "epoch": 0.54, "learning_rate": 2.3139509753459074e-06, "loss": 0.8632, "step": 28516 }, { "epoch": 0.54, "learning_rate": 2.313798633775718e-06, "loss": 1.037, "step": 28517 }, { "epoch": 0.54, "learning_rate": 2.3136462929007988e-06, "loss": 1.1597, "step": 28518 }, { "epoch": 0.54, "learning_rate": 2.313493952721718e-06, "loss": 1.0256, "step": 28519 }, { "epoch": 0.54, "learning_rate": 2.313341613239045e-06, "loss": 1.0264, "step": 28520 }, { "epoch": 0.54, "learning_rate": 2.31318927445335e-06, "loss": 0.7961, "step": 28521 }, { "epoch": 0.54, "learning_rate": 2.313036936365198e-06, "loss": 0.9174, "step": 28522 }, { "epoch": 0.54, "learning_rate": 2.312884598975163e-06, "loss": 0.812, "step": 28523 }, { "epoch": 0.54, "learning_rate": 2.31273226228381e-06, "loss": 0.9629, "step": 28524 }, { "epoch": 0.54, "learning_rate": 2.3125799262917087e-06, "loss": 1.1309, "step": 28525 }, { "epoch": 0.54, "learning_rate": 2.312427590999428e-06, "loss": 0.8612, "step": 28526 }, { "epoch": 0.54, "learning_rate": 2.3122752564075384e-06, "loss": 0.9114, "step": 28527 }, { "epoch": 0.54, "learning_rate": 2.312122922516605e-06, "loss": 0.8552, "step": 28528 }, { "epoch": 0.54, "learning_rate": 2.3119705893272008e-06, "loss": 0.9728, "step": 28529 }, { "epoch": 0.54, "learning_rate": 2.3118182568398927e-06, "loss": 0.8424, "step": 28530 }, { "epoch": 0.54, "learning_rate": 2.311665925055248e-06, "loss": 1.0829, "step": 28531 }, { "epoch": 0.54, "learning_rate": 2.3115135939738383e-06, "loss": 1.0219, "step": 28532 }, { "epoch": 0.54, "learning_rate": 2.31136126359623e-06, "loss": 0.9079, "step": 28533 }, { "epoch": 0.54, "learning_rate": 2.3112089339229933e-06, "loss": 0.8619, "step": 28534 }, { "epoch": 0.54, "learning_rate": 2.311056604954697e-06, "loss": 1.1152, "step": 28535 }, { "epoch": 0.54, "learning_rate": 2.31090427669191e-06, "loss": 0.9915, "step": 28536 }, { "epoch": 0.54, "learning_rate": 2.310751949135199e-06, "loss": 1.0435, "step": 28537 }, { "epoch": 0.54, "learning_rate": 2.310599622285136e-06, "loss": 0.8328, "step": 28538 }, { "epoch": 0.54, "learning_rate": 2.3104472961422875e-06, "loss": 0.8434, "step": 28539 }, { "epoch": 0.54, "learning_rate": 2.310294970707223e-06, "loss": 0.9563, "step": 28540 }, { "epoch": 0.54, "learning_rate": 2.310142645980511e-06, "loss": 0.8749, "step": 28541 }, { "epoch": 0.54, "learning_rate": 2.3099903219627214e-06, "loss": 0.7297, "step": 28542 }, { "epoch": 0.54, "learning_rate": 2.309837998654421e-06, "loss": 1.0085, "step": 28543 }, { "epoch": 0.54, "learning_rate": 2.3096856760561805e-06, "loss": 1.1823, "step": 28544 }, { "epoch": 0.54, "learning_rate": 2.309533354168568e-06, "loss": 1.0305, "step": 28545 }, { "epoch": 0.54, "learning_rate": 2.3093810329921514e-06, "loss": 0.8826, "step": 28546 }, { "epoch": 0.54, "learning_rate": 2.3092287125275e-06, "loss": 0.8991, "step": 28547 }, { "epoch": 0.54, "learning_rate": 2.309076392775184e-06, "loss": 0.9868, "step": 28548 }, { "epoch": 0.54, "learning_rate": 2.3089240737357697e-06, "loss": 1.1289, "step": 28549 }, { "epoch": 0.54, "learning_rate": 2.3087717554098275e-06, "loss": 0.9666, "step": 28550 }, { "epoch": 0.54, "learning_rate": 2.3086194377979265e-06, "loss": 1.0753, "step": 28551 }, { "epoch": 0.54, "learning_rate": 2.3084671209006334e-06, "loss": 0.725, "step": 28552 }, { "epoch": 0.54, "learning_rate": 2.308314804718519e-06, "loss": 0.9653, "step": 28553 }, { "epoch": 0.54, "learning_rate": 2.3081624892521507e-06, "loss": 0.7115, "step": 28554 }, { "epoch": 0.54, "learning_rate": 2.308010174502097e-06, "loss": 1.1053, "step": 28555 }, { "epoch": 0.54, "learning_rate": 2.307857860468929e-06, "loss": 1.0411, "step": 28556 }, { "epoch": 0.54, "learning_rate": 2.3077055471532137e-06, "loss": 1.0052, "step": 28557 }, { "epoch": 0.54, "learning_rate": 2.307553234555519e-06, "loss": 0.8643, "step": 28558 }, { "epoch": 0.54, "learning_rate": 2.3074009226764154e-06, "loss": 0.8878, "step": 28559 }, { "epoch": 0.54, "learning_rate": 2.3072486115164707e-06, "loss": 0.9886, "step": 28560 }, { "epoch": 0.54, "learning_rate": 2.3070963010762532e-06, "loss": 1.0486, "step": 28561 }, { "epoch": 0.54, "learning_rate": 2.306943991356333e-06, "loss": 0.9462, "step": 28562 }, { "epoch": 0.54, "learning_rate": 2.3067916823572783e-06, "loss": 0.7734, "step": 28563 }, { "epoch": 0.54, "learning_rate": 2.3066393740796562e-06, "loss": 0.868, "step": 28564 }, { "epoch": 0.54, "learning_rate": 2.306487066524038e-06, "loss": 0.8282, "step": 28565 }, { "epoch": 0.54, "learning_rate": 2.3063347596909907e-06, "loss": 0.9049, "step": 28566 }, { "epoch": 0.54, "learning_rate": 2.3061824535810826e-06, "loss": 0.7132, "step": 28567 }, { "epoch": 0.54, "learning_rate": 2.306030148194884e-06, "loss": 0.9183, "step": 28568 }, { "epoch": 0.54, "learning_rate": 2.3058778435329637e-06, "loss": 0.9668, "step": 28569 }, { "epoch": 0.54, "learning_rate": 2.3057255395958883e-06, "loss": 0.7218, "step": 28570 }, { "epoch": 0.54, "learning_rate": 2.305573236384229e-06, "loss": 1.0411, "step": 28571 }, { "epoch": 0.54, "learning_rate": 2.305420933898553e-06, "loss": 1.0069, "step": 28572 }, { "epoch": 0.54, "learning_rate": 2.305268632139428e-06, "loss": 0.7842, "step": 28573 }, { "epoch": 0.54, "learning_rate": 2.305116331107425e-06, "loss": 1.0457, "step": 28574 }, { "epoch": 0.54, "learning_rate": 2.3049640308031115e-06, "loss": 0.8886, "step": 28575 }, { "epoch": 0.54, "learning_rate": 2.304811731227056e-06, "loss": 0.8532, "step": 28576 }, { "epoch": 0.54, "learning_rate": 2.304659432379828e-06, "loss": 0.9146, "step": 28577 }, { "epoch": 0.54, "learning_rate": 2.304507134261996e-06, "loss": 0.8492, "step": 28578 }, { "epoch": 0.54, "learning_rate": 2.3043548368741274e-06, "loss": 0.8411, "step": 28579 }, { "epoch": 0.54, "learning_rate": 2.3042025402167924e-06, "loss": 0.9908, "step": 28580 }, { "epoch": 0.54, "learning_rate": 2.304050244290559e-06, "loss": 1.021, "step": 28581 }, { "epoch": 0.54, "learning_rate": 2.303897949095996e-06, "loss": 0.7648, "step": 28582 }, { "epoch": 0.54, "learning_rate": 2.303745654633672e-06, "loss": 1.004, "step": 28583 }, { "epoch": 0.54, "learning_rate": 2.303593360904156e-06, "loss": 0.9423, "step": 28584 }, { "epoch": 0.54, "learning_rate": 2.3034410679080166e-06, "loss": 0.9154, "step": 28585 }, { "epoch": 0.54, "learning_rate": 2.303288775645821e-06, "loss": 0.8277, "step": 28586 }, { "epoch": 0.54, "learning_rate": 2.3031364841181406e-06, "loss": 1.1292, "step": 28587 }, { "epoch": 0.54, "learning_rate": 2.3029841933255414e-06, "loss": 1.178, "step": 28588 }, { "epoch": 0.54, "learning_rate": 2.302831903268593e-06, "loss": 0.9896, "step": 28589 }, { "epoch": 0.54, "learning_rate": 2.302679613947865e-06, "loss": 0.9091, "step": 28590 }, { "epoch": 0.54, "learning_rate": 2.302527325363926e-06, "loss": 0.5487, "step": 28591 }, { "epoch": 0.54, "learning_rate": 2.302375037517342e-06, "loss": 0.9702, "step": 28592 }, { "epoch": 0.54, "learning_rate": 2.302222750408685e-06, "loss": 0.9961, "step": 28593 }, { "epoch": 0.54, "learning_rate": 2.3020704640385217e-06, "loss": 0.9593, "step": 28594 }, { "epoch": 0.54, "learning_rate": 2.301918178407421e-06, "loss": 1.0241, "step": 28595 }, { "epoch": 0.54, "learning_rate": 2.301765893515952e-06, "loss": 1.0388, "step": 28596 }, { "epoch": 0.54, "learning_rate": 2.301613609364683e-06, "loss": 0.8287, "step": 28597 }, { "epoch": 0.54, "learning_rate": 2.3014613259541823e-06, "loss": 0.8683, "step": 28598 }, { "epoch": 0.54, "learning_rate": 2.30130904328502e-06, "loss": 1.1692, "step": 28599 }, { "epoch": 0.54, "learning_rate": 2.3011567613577633e-06, "loss": 0.9514, "step": 28600 }, { "epoch": 0.54, "learning_rate": 2.3010044801729805e-06, "loss": 0.7586, "step": 28601 }, { "epoch": 0.54, "learning_rate": 2.3008521997312408e-06, "loss": 1.1282, "step": 28602 }, { "epoch": 0.54, "learning_rate": 2.300699920033114e-06, "loss": 0.8603, "step": 28603 }, { "epoch": 0.54, "learning_rate": 2.300547641079166e-06, "loss": 0.7758, "step": 28604 }, { "epoch": 0.54, "learning_rate": 2.3003953628699684e-06, "loss": 0.833, "step": 28605 }, { "epoch": 0.54, "learning_rate": 2.3002430854060883e-06, "loss": 1.1824, "step": 28606 }, { "epoch": 0.54, "learning_rate": 2.300090808688093e-06, "loss": 1.0166, "step": 28607 }, { "epoch": 0.54, "learning_rate": 2.299938532716554e-06, "loss": 0.512, "step": 28608 }, { "epoch": 0.54, "learning_rate": 2.299786257492038e-06, "loss": 0.8007, "step": 28609 }, { "epoch": 0.54, "learning_rate": 2.2996339830151133e-06, "loss": 0.989, "step": 28610 }, { "epoch": 0.54, "learning_rate": 2.29948170928635e-06, "loss": 1.0518, "step": 28611 }, { "epoch": 0.54, "learning_rate": 2.299329436306316e-06, "loss": 0.949, "step": 28612 }, { "epoch": 0.54, "learning_rate": 2.2991771640755787e-06, "loss": 1.1217, "step": 28613 }, { "epoch": 0.54, "learning_rate": 2.2990248925947086e-06, "loss": 1.1053, "step": 28614 }, { "epoch": 0.54, "learning_rate": 2.298872621864273e-06, "loss": 0.7032, "step": 28615 }, { "epoch": 0.54, "learning_rate": 2.298720351884841e-06, "loss": 0.7955, "step": 28616 }, { "epoch": 0.54, "learning_rate": 2.2985680826569807e-06, "loss": 0.8191, "step": 28617 }, { "epoch": 0.54, "learning_rate": 2.298415814181262e-06, "loss": 1.1453, "step": 28618 }, { "epoch": 0.54, "learning_rate": 2.298263546458251e-06, "loss": 1.0816, "step": 28619 }, { "epoch": 0.54, "learning_rate": 2.2981112794885186e-06, "loss": 0.9086, "step": 28620 }, { "epoch": 0.54, "learning_rate": 2.297959013272633e-06, "loss": 0.8381, "step": 28621 }, { "epoch": 0.54, "learning_rate": 2.297806747811161e-06, "loss": 0.8132, "step": 28622 }, { "epoch": 0.54, "learning_rate": 2.2976544831046727e-06, "loss": 0.752, "step": 28623 }, { "epoch": 0.54, "learning_rate": 2.297502219153737e-06, "loss": 1.1205, "step": 28624 }, { "epoch": 0.54, "learning_rate": 2.297349955958921e-06, "loss": 0.8674, "step": 28625 }, { "epoch": 0.54, "learning_rate": 2.297197693520795e-06, "loss": 1.1313, "step": 28626 }, { "epoch": 0.54, "learning_rate": 2.2970454318399267e-06, "loss": 0.8994, "step": 28627 }, { "epoch": 0.54, "learning_rate": 2.296893170916883e-06, "loss": 0.8913, "step": 28628 }, { "epoch": 0.54, "learning_rate": 2.2967409107522355e-06, "loss": 0.675, "step": 28629 }, { "epoch": 0.54, "learning_rate": 2.2965886513465506e-06, "loss": 0.808, "step": 28630 }, { "epoch": 0.54, "learning_rate": 2.2964363927003968e-06, "loss": 1.0225, "step": 28631 }, { "epoch": 0.54, "learning_rate": 2.2962841348143444e-06, "loss": 0.9055, "step": 28632 }, { "epoch": 0.54, "learning_rate": 2.2961318776889608e-06, "loss": 0.7865, "step": 28633 }, { "epoch": 0.54, "learning_rate": 2.295979621324813e-06, "loss": 0.7836, "step": 28634 }, { "epoch": 0.54, "learning_rate": 2.295827365722473e-06, "loss": 0.9191, "step": 28635 }, { "epoch": 0.54, "learning_rate": 2.2956751108825063e-06, "loss": 0.8095, "step": 28636 }, { "epoch": 0.54, "learning_rate": 2.2955228568054824e-06, "loss": 0.9618, "step": 28637 }, { "epoch": 0.54, "learning_rate": 2.29537060349197e-06, "loss": 1.0284, "step": 28638 }, { "epoch": 0.54, "learning_rate": 2.2952183509425384e-06, "loss": 0.8361, "step": 28639 }, { "epoch": 0.54, "learning_rate": 2.2950660991577538e-06, "loss": 0.7749, "step": 28640 }, { "epoch": 0.54, "learning_rate": 2.2949138481381867e-06, "loss": 0.9942, "step": 28641 }, { "epoch": 0.54, "learning_rate": 2.2947615978844057e-06, "loss": 0.7842, "step": 28642 }, { "epoch": 0.54, "learning_rate": 2.2946093483969773e-06, "loss": 1.071, "step": 28643 }, { "epoch": 0.54, "learning_rate": 2.2944570996764716e-06, "loss": 0.9251, "step": 28644 }, { "epoch": 0.54, "learning_rate": 2.2943048517234577e-06, "loss": 0.7968, "step": 28645 }, { "epoch": 0.54, "learning_rate": 2.2941526045385016e-06, "loss": 1.0088, "step": 28646 }, { "epoch": 0.54, "learning_rate": 2.294000358122175e-06, "loss": 0.7806, "step": 28647 }, { "epoch": 0.54, "learning_rate": 2.2938481124750444e-06, "loss": 0.7171, "step": 28648 }, { "epoch": 0.54, "learning_rate": 2.293695867597678e-06, "loss": 1.1492, "step": 28649 }, { "epoch": 0.54, "learning_rate": 2.2935436234906456e-06, "loss": 1.0168, "step": 28650 }, { "epoch": 0.54, "learning_rate": 2.2933913801545145e-06, "loss": 0.8163, "step": 28651 }, { "epoch": 0.54, "learning_rate": 2.293239137589853e-06, "loss": 0.7792, "step": 28652 }, { "epoch": 0.54, "learning_rate": 2.2930868957972313e-06, "loss": 0.7162, "step": 28653 }, { "epoch": 0.54, "learning_rate": 2.292934654777217e-06, "loss": 0.7608, "step": 28654 }, { "epoch": 0.54, "learning_rate": 2.292782414530377e-06, "loss": 0.8326, "step": 28655 }, { "epoch": 0.54, "learning_rate": 2.2926301750572825e-06, "loss": 0.9642, "step": 28656 }, { "epoch": 0.54, "learning_rate": 2.2924779363585e-06, "loss": 1.0459, "step": 28657 }, { "epoch": 0.54, "learning_rate": 2.292325698434598e-06, "loss": 0.8085, "step": 28658 }, { "epoch": 0.54, "learning_rate": 2.292173461286146e-06, "loss": 1.0049, "step": 28659 }, { "epoch": 0.54, "learning_rate": 2.2920212249137124e-06, "loss": 0.7643, "step": 28660 }, { "epoch": 0.54, "learning_rate": 2.291868989317864e-06, "loss": 1.0411, "step": 28661 }, { "epoch": 0.54, "learning_rate": 2.2917167544991718e-06, "loss": 0.9932, "step": 28662 }, { "epoch": 0.54, "learning_rate": 2.2915645204582023e-06, "loss": 0.9626, "step": 28663 }, { "epoch": 0.54, "learning_rate": 2.291412287195524e-06, "loss": 0.8027, "step": 28664 }, { "epoch": 0.54, "learning_rate": 2.291260054711706e-06, "loss": 0.9019, "step": 28665 }, { "epoch": 0.54, "learning_rate": 2.2911078230073167e-06, "loss": 0.8218, "step": 28666 }, { "epoch": 0.54, "learning_rate": 2.290955592082924e-06, "loss": 0.8756, "step": 28667 }, { "epoch": 0.54, "learning_rate": 2.2908033619390973e-06, "loss": 1.0433, "step": 28668 }, { "epoch": 0.54, "learning_rate": 2.2906511325764048e-06, "loss": 0.9921, "step": 28669 }, { "epoch": 0.54, "learning_rate": 2.2904989039954135e-06, "loss": 0.9274, "step": 28670 }, { "epoch": 0.54, "learning_rate": 2.2903466761966936e-06, "loss": 1.0906, "step": 28671 }, { "epoch": 0.54, "learning_rate": 2.2901944491808125e-06, "loss": 0.7178, "step": 28672 }, { "epoch": 0.54, "learning_rate": 2.2900422229483382e-06, "loss": 0.8449, "step": 28673 }, { "epoch": 0.54, "learning_rate": 2.2898899974998413e-06, "loss": 0.9881, "step": 28674 }, { "epoch": 0.54, "learning_rate": 2.289737772835888e-06, "loss": 1.1283, "step": 28675 }, { "epoch": 0.54, "learning_rate": 2.2895855489570466e-06, "loss": 0.9122, "step": 28676 }, { "epoch": 0.54, "learning_rate": 2.2894333258638878e-06, "loss": 0.8348, "step": 28677 }, { "epoch": 0.54, "learning_rate": 2.2892811035569775e-06, "loss": 0.9263, "step": 28678 }, { "epoch": 0.54, "learning_rate": 2.2891288820368855e-06, "loss": 0.7751, "step": 28679 }, { "epoch": 0.54, "learning_rate": 2.2889766613041797e-06, "loss": 0.7745, "step": 28680 }, { "epoch": 0.54, "learning_rate": 2.2888244413594287e-06, "loss": 1.0342, "step": 28681 }, { "epoch": 0.54, "learning_rate": 2.2886722222032e-06, "loss": 1.0016, "step": 28682 }, { "epoch": 0.54, "learning_rate": 2.288520003836064e-06, "loss": 1.0773, "step": 28683 }, { "epoch": 0.54, "learning_rate": 2.2883677862585875e-06, "loss": 0.8367, "step": 28684 }, { "epoch": 0.54, "learning_rate": 2.2882155694713383e-06, "loss": 0.7666, "step": 28685 }, { "epoch": 0.54, "learning_rate": 2.2880633534748857e-06, "loss": 0.9468, "step": 28686 }, { "epoch": 0.54, "learning_rate": 2.287911138269799e-06, "loss": 1.0654, "step": 28687 }, { "epoch": 0.54, "learning_rate": 2.2877589238566448e-06, "loss": 0.8832, "step": 28688 }, { "epoch": 0.54, "learning_rate": 2.2876067102359926e-06, "loss": 1.2025, "step": 28689 }, { "epoch": 0.54, "learning_rate": 2.287454497408411e-06, "loss": 0.9177, "step": 28690 }, { "epoch": 0.54, "learning_rate": 2.287302285374467e-06, "loss": 0.9394, "step": 28691 }, { "epoch": 0.54, "learning_rate": 2.28715007413473e-06, "loss": 1.1242, "step": 28692 }, { "epoch": 0.54, "learning_rate": 2.2869978636897684e-06, "loss": 1.0025, "step": 28693 }, { "epoch": 0.54, "learning_rate": 2.2868456540401494e-06, "loss": 1.077, "step": 28694 }, { "epoch": 0.54, "learning_rate": 2.2866934451864433e-06, "loss": 0.7707, "step": 28695 }, { "epoch": 0.54, "learning_rate": 2.286541237129217e-06, "loss": 0.8807, "step": 28696 }, { "epoch": 0.54, "learning_rate": 2.286389029869038e-06, "loss": 0.8987, "step": 28697 }, { "epoch": 0.54, "learning_rate": 2.2862368234064776e-06, "loss": 0.9323, "step": 28698 }, { "epoch": 0.54, "learning_rate": 2.2860846177421012e-06, "loss": 1.115, "step": 28699 }, { "epoch": 0.54, "learning_rate": 2.2859324128764786e-06, "loss": 1.2021, "step": 28700 }, { "epoch": 0.54, "learning_rate": 2.2857802088101777e-06, "loss": 1.0742, "step": 28701 }, { "epoch": 0.54, "learning_rate": 2.2856280055437672e-06, "loss": 0.9117, "step": 28702 }, { "epoch": 0.54, "learning_rate": 2.2854758030778148e-06, "loss": 0.9434, "step": 28703 }, { "epoch": 0.54, "learning_rate": 2.2853236014128895e-06, "loss": 0.9868, "step": 28704 }, { "epoch": 0.54, "learning_rate": 2.2851714005495594e-06, "loss": 0.9581, "step": 28705 }, { "epoch": 0.54, "learning_rate": 2.285019200488392e-06, "loss": 1.0732, "step": 28706 }, { "epoch": 0.54, "learning_rate": 2.2848670012299567e-06, "loss": 0.8961, "step": 28707 }, { "epoch": 0.54, "learning_rate": 2.2847148027748217e-06, "loss": 0.9237, "step": 28708 }, { "epoch": 0.54, "learning_rate": 2.284562605123554e-06, "loss": 0.8333, "step": 28709 }, { "epoch": 0.54, "learning_rate": 2.2844104082767246e-06, "loss": 0.736, "step": 28710 }, { "epoch": 0.54, "learning_rate": 2.2842582122348995e-06, "loss": 0.8422, "step": 28711 }, { "epoch": 0.54, "learning_rate": 2.284106016998647e-06, "loss": 0.9535, "step": 28712 }, { "epoch": 0.54, "learning_rate": 2.2839538225685366e-06, "loss": 0.9873, "step": 28713 }, { "epoch": 0.54, "learning_rate": 2.283801628945136e-06, "loss": 0.9932, "step": 28714 }, { "epoch": 0.54, "learning_rate": 2.2836494361290122e-06, "loss": 0.9672, "step": 28715 }, { "epoch": 0.54, "learning_rate": 2.2834972441207365e-06, "loss": 0.9653, "step": 28716 }, { "epoch": 0.54, "learning_rate": 2.2833450529208753e-06, "loss": 0.7144, "step": 28717 }, { "epoch": 0.54, "learning_rate": 2.283192862529996e-06, "loss": 1.0571, "step": 28718 }, { "epoch": 0.54, "learning_rate": 2.2830406729486686e-06, "loss": 1.1082, "step": 28719 }, { "epoch": 0.54, "learning_rate": 2.2828884841774605e-06, "loss": 1.0786, "step": 28720 }, { "epoch": 0.54, "learning_rate": 2.28273629621694e-06, "loss": 0.8259, "step": 28721 }, { "epoch": 0.54, "learning_rate": 2.2825841090676756e-06, "loss": 0.6871, "step": 28722 }, { "epoch": 0.54, "learning_rate": 2.282431922730236e-06, "loss": 0.8845, "step": 28723 }, { "epoch": 0.54, "learning_rate": 2.282279737205188e-06, "loss": 1.1941, "step": 28724 }, { "epoch": 0.54, "learning_rate": 2.2821275524931016e-06, "loss": 0.9709, "step": 28725 }, { "epoch": 0.54, "learning_rate": 2.2819753685945446e-06, "loss": 0.9736, "step": 28726 }, { "epoch": 0.54, "learning_rate": 2.2818231855100833e-06, "loss": 0.8295, "step": 28727 }, { "epoch": 0.54, "learning_rate": 2.2816710032402885e-06, "loss": 1.0271, "step": 28728 }, { "epoch": 0.54, "learning_rate": 2.2815188217857277e-06, "loss": 0.8079, "step": 28729 }, { "epoch": 0.54, "learning_rate": 2.2813666411469677e-06, "loss": 0.9985, "step": 28730 }, { "epoch": 0.54, "learning_rate": 2.2812144613245798e-06, "loss": 1.0921, "step": 28731 }, { "epoch": 0.54, "learning_rate": 2.2810622823191297e-06, "loss": 0.8152, "step": 28732 }, { "epoch": 0.54, "learning_rate": 2.2809101041311854e-06, "loss": 0.7211, "step": 28733 }, { "epoch": 0.54, "learning_rate": 2.2807579267613173e-06, "loss": 0.9975, "step": 28734 }, { "epoch": 0.54, "learning_rate": 2.280605750210092e-06, "loss": 0.9066, "step": 28735 }, { "epoch": 0.54, "learning_rate": 2.280453574478077e-06, "loss": 0.9811, "step": 28736 }, { "epoch": 0.54, "learning_rate": 2.280301399565843e-06, "loss": 0.9911, "step": 28737 }, { "epoch": 0.54, "learning_rate": 2.280149225473957e-06, "loss": 0.9348, "step": 28738 }, { "epoch": 0.54, "learning_rate": 2.2799970522029856e-06, "loss": 0.9992, "step": 28739 }, { "epoch": 0.54, "learning_rate": 2.2798448797534998e-06, "loss": 0.908, "step": 28740 }, { "epoch": 0.54, "learning_rate": 2.279692708126066e-06, "loss": 0.6675, "step": 28741 }, { "epoch": 0.54, "learning_rate": 2.2795405373212524e-06, "loss": 0.916, "step": 28742 }, { "epoch": 0.54, "learning_rate": 2.2793883673396284e-06, "loss": 1.2594, "step": 28743 }, { "epoch": 0.54, "learning_rate": 2.2792361981817614e-06, "loss": 0.8442, "step": 28744 }, { "epoch": 0.54, "learning_rate": 2.279084029848219e-06, "loss": 1.0013, "step": 28745 }, { "epoch": 0.54, "learning_rate": 2.2789318623395705e-06, "loss": 0.6973, "step": 28746 }, { "epoch": 0.54, "learning_rate": 2.2787796956563843e-06, "loss": 0.9469, "step": 28747 }, { "epoch": 0.54, "learning_rate": 2.2786275297992267e-06, "loss": 0.8274, "step": 28748 }, { "epoch": 0.54, "learning_rate": 2.278475364768668e-06, "loss": 0.9365, "step": 28749 }, { "epoch": 0.54, "learning_rate": 2.2783232005652752e-06, "loss": 1.2502, "step": 28750 }, { "epoch": 0.54, "learning_rate": 2.2781710371896163e-06, "loss": 0.8946, "step": 28751 }, { "epoch": 0.54, "learning_rate": 2.2780188746422607e-06, "loss": 1.011, "step": 28752 }, { "epoch": 0.54, "learning_rate": 2.277866712923776e-06, "loss": 0.7299, "step": 28753 }, { "epoch": 0.54, "learning_rate": 2.2777145520347293e-06, "loss": 0.7645, "step": 28754 }, { "epoch": 0.54, "learning_rate": 2.2775623919756905e-06, "loss": 1.0986, "step": 28755 }, { "epoch": 0.54, "learning_rate": 2.2774102327472265e-06, "loss": 1.077, "step": 28756 }, { "epoch": 0.54, "learning_rate": 2.277258074349905e-06, "loss": 1.0216, "step": 28757 }, { "epoch": 0.54, "learning_rate": 2.2771059167842962e-06, "loss": 0.834, "step": 28758 }, { "epoch": 0.54, "learning_rate": 2.276953760050967e-06, "loss": 0.7682, "step": 28759 }, { "epoch": 0.54, "learning_rate": 2.276801604150485e-06, "loss": 0.8581, "step": 28760 }, { "epoch": 0.54, "learning_rate": 2.2766494490834197e-06, "loss": 0.7422, "step": 28761 }, { "epoch": 0.54, "learning_rate": 2.2764972948503383e-06, "loss": 1.0563, "step": 28762 }, { "epoch": 0.54, "learning_rate": 2.2763451414518085e-06, "loss": 0.7437, "step": 28763 }, { "epoch": 0.54, "learning_rate": 2.2761929888884e-06, "loss": 0.9764, "step": 28764 }, { "epoch": 0.54, "learning_rate": 2.2760408371606797e-06, "loss": 0.8615, "step": 28765 }, { "epoch": 0.54, "learning_rate": 2.2758886862692154e-06, "loss": 0.9428, "step": 28766 }, { "epoch": 0.54, "learning_rate": 2.275736536214577e-06, "loss": 0.7977, "step": 28767 }, { "epoch": 0.54, "learning_rate": 2.275584386997331e-06, "loss": 0.7623, "step": 28768 }, { "epoch": 0.54, "learning_rate": 2.2754322386180453e-06, "loss": 0.8824, "step": 28769 }, { "epoch": 0.54, "learning_rate": 2.275280091077289e-06, "loss": 0.8803, "step": 28770 }, { "epoch": 0.54, "learning_rate": 2.2751279443756313e-06, "loss": 0.7196, "step": 28771 }, { "epoch": 0.54, "learning_rate": 2.2749757985136373e-06, "loss": 0.9258, "step": 28772 }, { "epoch": 0.54, "learning_rate": 2.274823653491878e-06, "loss": 0.7878, "step": 28773 }, { "epoch": 0.54, "learning_rate": 2.2746715093109203e-06, "loss": 1.1497, "step": 28774 }, { "epoch": 0.54, "learning_rate": 2.2745193659713306e-06, "loss": 0.9006, "step": 28775 }, { "epoch": 0.54, "learning_rate": 2.2743672234736803e-06, "loss": 1.0222, "step": 28776 }, { "epoch": 0.54, "learning_rate": 2.2742150818185355e-06, "loss": 1.0767, "step": 28777 }, { "epoch": 0.54, "learning_rate": 2.2740629410064634e-06, "loss": 0.9053, "step": 28778 }, { "epoch": 0.54, "learning_rate": 2.2739108010380352e-06, "loss": 0.8462, "step": 28779 }, { "epoch": 0.54, "learning_rate": 2.273758661913817e-06, "loss": 0.7504, "step": 28780 }, { "epoch": 0.54, "learning_rate": 2.2736065236343753e-06, "loss": 1.0373, "step": 28781 }, { "epoch": 0.54, "learning_rate": 2.2734543862002816e-06, "loss": 1.1104, "step": 28782 }, { "epoch": 0.54, "learning_rate": 2.2733022496121015e-06, "loss": 0.8538, "step": 28783 }, { "epoch": 0.54, "learning_rate": 2.273150113870404e-06, "loss": 0.8153, "step": 28784 }, { "epoch": 0.54, "learning_rate": 2.272997978975757e-06, "loss": 0.7797, "step": 28785 }, { "epoch": 0.54, "learning_rate": 2.272845844928729e-06, "loss": 0.8738, "step": 28786 }, { "epoch": 0.54, "learning_rate": 2.2726937117298866e-06, "loss": 1.0537, "step": 28787 }, { "epoch": 0.54, "learning_rate": 2.2725415793798003e-06, "loss": 1.1039, "step": 28788 }, { "epoch": 0.54, "learning_rate": 2.2723894478790364e-06, "loss": 0.8383, "step": 28789 }, { "epoch": 0.54, "learning_rate": 2.2722373172281625e-06, "loss": 0.8915, "step": 28790 }, { "epoch": 0.54, "learning_rate": 2.272085187427748e-06, "loss": 0.9251, "step": 28791 }, { "epoch": 0.54, "learning_rate": 2.2719330584783607e-06, "loss": 0.9421, "step": 28792 }, { "epoch": 0.54, "learning_rate": 2.2717809303805673e-06, "loss": 0.8676, "step": 28793 }, { "epoch": 0.54, "learning_rate": 2.2716288031349382e-06, "loss": 1.1074, "step": 28794 }, { "epoch": 0.54, "learning_rate": 2.2714766767420397e-06, "loss": 0.9473, "step": 28795 }, { "epoch": 0.54, "learning_rate": 2.27132455120244e-06, "loss": 0.9312, "step": 28796 }, { "epoch": 0.54, "learning_rate": 2.271172426516708e-06, "loss": 1.0365, "step": 28797 }, { "epoch": 0.54, "learning_rate": 2.2710203026854107e-06, "loss": 0.8079, "step": 28798 }, { "epoch": 0.54, "learning_rate": 2.2708681797091157e-06, "loss": 0.9333, "step": 28799 }, { "epoch": 0.54, "learning_rate": 2.2707160575883934e-06, "loss": 0.9736, "step": 28800 }, { "epoch": 0.54, "learning_rate": 2.27056393632381e-06, "loss": 0.8201, "step": 28801 }, { "epoch": 0.54, "learning_rate": 2.270411815915933e-06, "loss": 0.9013, "step": 28802 }, { "epoch": 0.54, "learning_rate": 2.270259696365332e-06, "loss": 0.6539, "step": 28803 }, { "epoch": 0.54, "learning_rate": 2.270107577672574e-06, "loss": 1.0137, "step": 28804 }, { "epoch": 0.54, "learning_rate": 2.2699554598382274e-06, "loss": 0.9378, "step": 28805 }, { "epoch": 0.54, "learning_rate": 2.26980334286286e-06, "loss": 1.0964, "step": 28806 }, { "epoch": 0.54, "learning_rate": 2.26965122674704e-06, "loss": 1.1204, "step": 28807 }, { "epoch": 0.54, "learning_rate": 2.2694991114913345e-06, "loss": 0.8602, "step": 28808 }, { "epoch": 0.54, "learning_rate": 2.2693469970963133e-06, "loss": 0.7792, "step": 28809 }, { "epoch": 0.54, "learning_rate": 2.2691948835625434e-06, "loss": 0.7466, "step": 28810 }, { "epoch": 0.54, "learning_rate": 2.2690427708905918e-06, "loss": 0.8844, "step": 28811 }, { "epoch": 0.54, "learning_rate": 2.2688906590810273e-06, "loss": 1.066, "step": 28812 }, { "epoch": 0.54, "learning_rate": 2.268738548134419e-06, "loss": 1.0037, "step": 28813 }, { "epoch": 0.54, "learning_rate": 2.2685864380513326e-06, "loss": 1.1104, "step": 28814 }, { "epoch": 0.54, "learning_rate": 2.268434328832339e-06, "loss": 0.8837, "step": 28815 }, { "epoch": 0.54, "learning_rate": 2.268282220478004e-06, "loss": 0.6939, "step": 28816 }, { "epoch": 0.54, "learning_rate": 2.268130112988895e-06, "loss": 0.8957, "step": 28817 }, { "epoch": 0.54, "learning_rate": 2.267978006365582e-06, "loss": 0.9462, "step": 28818 }, { "epoch": 0.54, "learning_rate": 2.2678259006086318e-06, "loss": 1.0386, "step": 28819 }, { "epoch": 0.54, "learning_rate": 2.267673795718613e-06, "loss": 0.7517, "step": 28820 }, { "epoch": 0.54, "learning_rate": 2.267521691696092e-06, "loss": 0.8887, "step": 28821 }, { "epoch": 0.54, "learning_rate": 2.267369588541639e-06, "loss": 0.7287, "step": 28822 }, { "epoch": 0.54, "learning_rate": 2.2672174862558207e-06, "loss": 0.7499, "step": 28823 }, { "epoch": 0.54, "learning_rate": 2.267065384839204e-06, "loss": 1.1071, "step": 28824 }, { "epoch": 0.54, "learning_rate": 2.2669132842923587e-06, "loss": 0.9666, "step": 28825 }, { "epoch": 0.54, "learning_rate": 2.2667611846158525e-06, "loss": 0.8529, "step": 28826 }, { "epoch": 0.54, "learning_rate": 2.2666090858102525e-06, "loss": 0.9045, "step": 28827 }, { "epoch": 0.54, "learning_rate": 2.2664569878761274e-06, "loss": 0.6671, "step": 28828 }, { "epoch": 0.54, "learning_rate": 2.2663048908140448e-06, "loss": 0.9861, "step": 28829 }, { "epoch": 0.54, "learning_rate": 2.2661527946245717e-06, "loss": 0.6686, "step": 28830 }, { "epoch": 0.54, "learning_rate": 2.2660006993082773e-06, "loss": 1.025, "step": 28831 }, { "epoch": 0.54, "learning_rate": 2.2658486048657296e-06, "loss": 1.0439, "step": 28832 }, { "epoch": 0.54, "learning_rate": 2.265696511297495e-06, "loss": 0.8505, "step": 28833 }, { "epoch": 0.54, "learning_rate": 2.2655444186041434e-06, "loss": 0.838, "step": 28834 }, { "epoch": 0.54, "learning_rate": 2.265392326786242e-06, "loss": 0.9316, "step": 28835 }, { "epoch": 0.54, "learning_rate": 2.2652402358443575e-06, "loss": 0.8391, "step": 28836 }, { "epoch": 0.54, "learning_rate": 2.265088145779059e-06, "loss": 0.9142, "step": 28837 }, { "epoch": 0.54, "learning_rate": 2.2649360565909144e-06, "loss": 1.0706, "step": 28838 }, { "epoch": 0.54, "learning_rate": 2.264783968280491e-06, "loss": 0.8624, "step": 28839 }, { "epoch": 0.54, "learning_rate": 2.2646318808483576e-06, "loss": 0.9429, "step": 28840 }, { "epoch": 0.54, "learning_rate": 2.2644797942950816e-06, "loss": 0.8873, "step": 28841 }, { "epoch": 0.54, "learning_rate": 2.2643277086212303e-06, "loss": 0.9203, "step": 28842 }, { "epoch": 0.54, "learning_rate": 2.2641756238273725e-06, "loss": 1.1331, "step": 28843 }, { "epoch": 0.54, "learning_rate": 2.2640235399140754e-06, "loss": 1.0828, "step": 28844 }, { "epoch": 0.54, "learning_rate": 2.263871456881907e-06, "loss": 0.8287, "step": 28845 }, { "epoch": 0.54, "learning_rate": 2.2637193747314356e-06, "loss": 0.8236, "step": 28846 }, { "epoch": 0.54, "learning_rate": 2.2635672934632293e-06, "loss": 0.8128, "step": 28847 }, { "epoch": 0.54, "learning_rate": 2.2634152130778544e-06, "loss": 0.8322, "step": 28848 }, { "epoch": 0.54, "learning_rate": 2.2632631335758807e-06, "loss": 0.9095, "step": 28849 }, { "epoch": 0.54, "learning_rate": 2.2631110549578757e-06, "loss": 1.2366, "step": 28850 }, { "epoch": 0.54, "learning_rate": 2.262958977224405e-06, "loss": 1.1246, "step": 28851 }, { "epoch": 0.54, "learning_rate": 2.2628069003760396e-06, "loss": 0.7737, "step": 28852 }, { "epoch": 0.54, "learning_rate": 2.2626548244133457e-06, "loss": 1.0115, "step": 28853 }, { "epoch": 0.54, "learning_rate": 2.2625027493368905e-06, "loss": 0.8146, "step": 28854 }, { "epoch": 0.54, "learning_rate": 2.262350675147244e-06, "loss": 0.79, "step": 28855 }, { "epoch": 0.54, "learning_rate": 2.262198601844973e-06, "loss": 0.9852, "step": 28856 }, { "epoch": 0.54, "learning_rate": 2.2620465294306436e-06, "loss": 0.8079, "step": 28857 }, { "epoch": 0.54, "learning_rate": 2.2618944579048264e-06, "loss": 0.9277, "step": 28858 }, { "epoch": 0.54, "learning_rate": 2.2617423872680876e-06, "loss": 0.9518, "step": 28859 }, { "epoch": 0.54, "learning_rate": 2.261590317520995e-06, "loss": 0.9435, "step": 28860 }, { "epoch": 0.54, "learning_rate": 2.2614382486641178e-06, "loss": 0.9584, "step": 28861 }, { "epoch": 0.54, "learning_rate": 2.2612861806980226e-06, "loss": 1.1879, "step": 28862 }, { "epoch": 0.54, "learning_rate": 2.2611341136232763e-06, "loss": 1.0088, "step": 28863 }, { "epoch": 0.54, "learning_rate": 2.2609820474404493e-06, "loss": 0.802, "step": 28864 }, { "epoch": 0.54, "learning_rate": 2.2608299821501075e-06, "loss": 0.88, "step": 28865 }, { "epoch": 0.54, "learning_rate": 2.2606779177528192e-06, "loss": 0.7707, "step": 28866 }, { "epoch": 0.54, "learning_rate": 2.2605258542491524e-06, "loss": 0.9553, "step": 28867 }, { "epoch": 0.54, "learning_rate": 2.260373791639675e-06, "loss": 1.0793, "step": 28868 }, { "epoch": 0.54, "learning_rate": 2.260221729924953e-06, "loss": 1.188, "step": 28869 }, { "epoch": 0.54, "learning_rate": 2.260069669105558e-06, "loss": 0.9147, "step": 28870 }, { "epoch": 0.54, "learning_rate": 2.2599176091820545e-06, "loss": 0.9375, "step": 28871 }, { "epoch": 0.54, "learning_rate": 2.25976555015501e-06, "loss": 0.8416, "step": 28872 }, { "epoch": 0.54, "learning_rate": 2.259613492024995e-06, "loss": 0.7952, "step": 28873 }, { "epoch": 0.54, "learning_rate": 2.2594614347925757e-06, "loss": 0.9981, "step": 28874 }, { "epoch": 0.54, "learning_rate": 2.2593093784583194e-06, "loss": 1.0907, "step": 28875 }, { "epoch": 0.54, "learning_rate": 2.259157323022795e-06, "loss": 0.9544, "step": 28876 }, { "epoch": 0.54, "learning_rate": 2.2590052684865704e-06, "loss": 0.7989, "step": 28877 }, { "epoch": 0.54, "learning_rate": 2.2588532148502114e-06, "loss": 0.9204, "step": 28878 }, { "epoch": 0.54, "learning_rate": 2.2587011621142883e-06, "loss": 0.7765, "step": 28879 }, { "epoch": 0.54, "learning_rate": 2.258549110279367e-06, "loss": 1.1154, "step": 28880 }, { "epoch": 0.54, "learning_rate": 2.2583970593460154e-06, "loss": 0.9948, "step": 28881 }, { "epoch": 0.54, "learning_rate": 2.2582450093148027e-06, "loss": 1.0035, "step": 28882 }, { "epoch": 0.54, "learning_rate": 2.258092960186296e-06, "loss": 0.7863, "step": 28883 }, { "epoch": 0.54, "learning_rate": 2.2579409119610612e-06, "loss": 1.0176, "step": 28884 }, { "epoch": 0.54, "learning_rate": 2.257788864639669e-06, "loss": 0.8687, "step": 28885 }, { "epoch": 0.54, "learning_rate": 2.2576368182226855e-06, "loss": 0.9969, "step": 28886 }, { "epoch": 0.55, "learning_rate": 2.2574847727106787e-06, "loss": 0.9653, "step": 28887 }, { "epoch": 0.55, "learning_rate": 2.2573327281042157e-06, "loss": 1.1942, "step": 28888 }, { "epoch": 0.55, "learning_rate": 2.2571806844038657e-06, "loss": 1.0034, "step": 28889 }, { "epoch": 0.55, "learning_rate": 2.2570286416101947e-06, "loss": 0.9956, "step": 28890 }, { "epoch": 0.55, "learning_rate": 2.2568765997237726e-06, "loss": 0.9569, "step": 28891 }, { "epoch": 0.55, "learning_rate": 2.2567245587451652e-06, "loss": 0.9108, "step": 28892 }, { "epoch": 0.55, "learning_rate": 2.2565725186749397e-06, "loss": 0.9426, "step": 28893 }, { "epoch": 0.55, "learning_rate": 2.256420479513666e-06, "loss": 0.778, "step": 28894 }, { "epoch": 0.55, "learning_rate": 2.256268441261911e-06, "loss": 0.6577, "step": 28895 }, { "epoch": 0.55, "learning_rate": 2.2561164039202414e-06, "loss": 0.9261, "step": 28896 }, { "epoch": 0.55, "learning_rate": 2.2559643674892264e-06, "loss": 0.9599, "step": 28897 }, { "epoch": 0.55, "learning_rate": 2.2558123319694335e-06, "loss": 0.7919, "step": 28898 }, { "epoch": 0.55, "learning_rate": 2.2556602973614283e-06, "loss": 1.0156, "step": 28899 }, { "epoch": 0.55, "learning_rate": 2.255508263665781e-06, "loss": 1.2556, "step": 28900 }, { "epoch": 0.55, "learning_rate": 2.255356230883058e-06, "loss": 1.0518, "step": 28901 }, { "epoch": 0.55, "learning_rate": 2.255204199013827e-06, "loss": 0.7704, "step": 28902 }, { "epoch": 0.55, "learning_rate": 2.255052168058657e-06, "loss": 0.7149, "step": 28903 }, { "epoch": 0.55, "learning_rate": 2.2549001380181147e-06, "loss": 0.7868, "step": 28904 }, { "epoch": 0.55, "learning_rate": 2.2547481088927666e-06, "loss": 0.8528, "step": 28905 }, { "epoch": 0.55, "learning_rate": 2.2545960806831826e-06, "loss": 1.2386, "step": 28906 }, { "epoch": 0.55, "learning_rate": 2.254444053389929e-06, "loss": 0.8052, "step": 28907 }, { "epoch": 0.55, "learning_rate": 2.2542920270135734e-06, "loss": 0.7577, "step": 28908 }, { "epoch": 0.55, "learning_rate": 2.254140001554684e-06, "loss": 0.9236, "step": 28909 }, { "epoch": 0.55, "learning_rate": 2.253987977013829e-06, "loss": 0.8076, "step": 28910 }, { "epoch": 0.55, "learning_rate": 2.2538359533915742e-06, "loss": 1.1634, "step": 28911 }, { "epoch": 0.55, "learning_rate": 2.253683930688489e-06, "loss": 1.0111, "step": 28912 }, { "epoch": 0.55, "learning_rate": 2.253531908905141e-06, "loss": 1.0152, "step": 28913 }, { "epoch": 0.55, "learning_rate": 2.253379888042096e-06, "loss": 0.9797, "step": 28914 }, { "epoch": 0.55, "learning_rate": 2.253227868099924e-06, "loss": 0.8061, "step": 28915 }, { "epoch": 0.55, "learning_rate": 2.2530758490791917e-06, "loss": 0.9541, "step": 28916 }, { "epoch": 0.55, "learning_rate": 2.252923830980465e-06, "loss": 0.9367, "step": 28917 }, { "epoch": 0.55, "learning_rate": 2.252771813804315e-06, "loss": 0.9939, "step": 28918 }, { "epoch": 0.55, "learning_rate": 2.2526197975513074e-06, "loss": 1.1283, "step": 28919 }, { "epoch": 0.55, "learning_rate": 2.2524677822220084e-06, "loss": 0.6963, "step": 28920 }, { "epoch": 0.55, "learning_rate": 2.2523157678169884e-06, "loss": 0.9891, "step": 28921 }, { "epoch": 0.55, "learning_rate": 2.252163754336813e-06, "loss": 0.9034, "step": 28922 }, { "epoch": 0.55, "learning_rate": 2.25201174178205e-06, "loss": 0.813, "step": 28923 }, { "epoch": 0.55, "learning_rate": 2.251859730153269e-06, "loss": 1.0076, "step": 28924 }, { "epoch": 0.55, "learning_rate": 2.2517077194510363e-06, "loss": 1.1363, "step": 28925 }, { "epoch": 0.55, "learning_rate": 2.251555709675918e-06, "loss": 1.0522, "step": 28926 }, { "epoch": 0.55, "learning_rate": 2.251403700828484e-06, "loss": 1.0648, "step": 28927 }, { "epoch": 0.55, "learning_rate": 2.2512516929093005e-06, "loss": 1.0007, "step": 28928 }, { "epoch": 0.55, "learning_rate": 2.2510996859189354e-06, "loss": 0.9277, "step": 28929 }, { "epoch": 0.55, "learning_rate": 2.250947679857957e-06, "loss": 1.0235, "step": 28930 }, { "epoch": 0.55, "learning_rate": 2.250795674726932e-06, "loss": 1.1378, "step": 28931 }, { "epoch": 0.55, "learning_rate": 2.250643670526428e-06, "loss": 0.9235, "step": 28932 }, { "epoch": 0.55, "learning_rate": 2.2504916672570138e-06, "loss": 0.7796, "step": 28933 }, { "epoch": 0.55, "learning_rate": 2.250339664919256e-06, "loss": 0.9798, "step": 28934 }, { "epoch": 0.55, "learning_rate": 2.250187663513721e-06, "loss": 0.834, "step": 28935 }, { "epoch": 0.55, "learning_rate": 2.250035663040978e-06, "loss": 0.928, "step": 28936 }, { "epoch": 0.55, "learning_rate": 2.249883663501595e-06, "loss": 0.9855, "step": 28937 }, { "epoch": 0.55, "learning_rate": 2.249731664896138e-06, "loss": 0.9329, "step": 28938 }, { "epoch": 0.55, "learning_rate": 2.2495796672251757e-06, "loss": 0.8058, "step": 28939 }, { "epoch": 0.55, "learning_rate": 2.2494276704892757e-06, "loss": 1.0194, "step": 28940 }, { "epoch": 0.55, "learning_rate": 2.2492756746890036e-06, "loss": 0.9779, "step": 28941 }, { "epoch": 0.55, "learning_rate": 2.24912367982493e-06, "loss": 0.7824, "step": 28942 }, { "epoch": 0.55, "learning_rate": 2.24897168589762e-06, "loss": 0.7971, "step": 28943 }, { "epoch": 0.55, "learning_rate": 2.248819692907642e-06, "loss": 1.0057, "step": 28944 }, { "epoch": 0.55, "learning_rate": 2.2486677008555637e-06, "loss": 0.8068, "step": 28945 }, { "epoch": 0.55, "learning_rate": 2.2485157097419533e-06, "loss": 0.6966, "step": 28946 }, { "epoch": 0.55, "learning_rate": 2.248363719567376e-06, "loss": 0.9427, "step": 28947 }, { "epoch": 0.55, "learning_rate": 2.2482117303324023e-06, "loss": 0.8835, "step": 28948 }, { "epoch": 0.55, "learning_rate": 2.2480597420375972e-06, "loss": 1.1536, "step": 28949 }, { "epoch": 0.55, "learning_rate": 2.24790775468353e-06, "loss": 1.1345, "step": 28950 }, { "epoch": 0.55, "learning_rate": 2.247755768270767e-06, "loss": 0.8561, "step": 28951 }, { "epoch": 0.55, "learning_rate": 2.247603782799877e-06, "loss": 0.6883, "step": 28952 }, { "epoch": 0.55, "learning_rate": 2.2474517982714257e-06, "loss": 0.8577, "step": 28953 }, { "epoch": 0.55, "learning_rate": 2.2472998146859824e-06, "loss": 0.9526, "step": 28954 }, { "epoch": 0.55, "learning_rate": 2.2471478320441142e-06, "loss": 0.8109, "step": 28955 }, { "epoch": 0.55, "learning_rate": 2.246995850346387e-06, "loss": 1.1068, "step": 28956 }, { "epoch": 0.55, "learning_rate": 2.2468438695933703e-06, "loss": 0.918, "step": 28957 }, { "epoch": 0.55, "learning_rate": 2.2466918897856312e-06, "loss": 0.8416, "step": 28958 }, { "epoch": 0.55, "learning_rate": 2.2465399109237357e-06, "loss": 0.6459, "step": 28959 }, { "epoch": 0.55, "learning_rate": 2.2463879330082534e-06, "loss": 0.8607, "step": 28960 }, { "epoch": 0.55, "learning_rate": 2.246235956039751e-06, "loss": 0.8156, "step": 28961 }, { "epoch": 0.55, "learning_rate": 2.2460839800187943e-06, "loss": 1.0496, "step": 28962 }, { "epoch": 0.55, "learning_rate": 2.2459320049459537e-06, "loss": 1.002, "step": 28963 }, { "epoch": 0.55, "learning_rate": 2.2457800308217947e-06, "loss": 0.762, "step": 28964 }, { "epoch": 0.55, "learning_rate": 2.2456280576468843e-06, "loss": 0.8152, "step": 28965 }, { "epoch": 0.55, "learning_rate": 2.2454760854217927e-06, "loss": 1.0032, "step": 28966 }, { "epoch": 0.55, "learning_rate": 2.245324114147085e-06, "loss": 0.9243, "step": 28967 }, { "epoch": 0.55, "learning_rate": 2.2451721438233283e-06, "loss": 0.9679, "step": 28968 }, { "epoch": 0.55, "learning_rate": 2.2450201744510923e-06, "loss": 1.0659, "step": 28969 }, { "epoch": 0.55, "learning_rate": 2.2448682060309425e-06, "loss": 0.6185, "step": 28970 }, { "epoch": 0.55, "learning_rate": 2.2447162385634464e-06, "loss": 0.978, "step": 28971 }, { "epoch": 0.55, "learning_rate": 2.244564272049173e-06, "loss": 0.8242, "step": 28972 }, { "epoch": 0.55, "learning_rate": 2.244412306488689e-06, "loss": 0.7423, "step": 28973 }, { "epoch": 0.55, "learning_rate": 2.2442603418825603e-06, "loss": 0.707, "step": 28974 }, { "epoch": 0.55, "learning_rate": 2.244108378231357e-06, "loss": 1.225, "step": 28975 }, { "epoch": 0.55, "learning_rate": 2.2439564155356446e-06, "loss": 0.8472, "step": 28976 }, { "epoch": 0.55, "learning_rate": 2.2438044537959903e-06, "loss": 1.0155, "step": 28977 }, { "epoch": 0.55, "learning_rate": 2.243652493012963e-06, "loss": 0.9813, "step": 28978 }, { "epoch": 0.55, "learning_rate": 2.2435005331871302e-06, "loss": 0.8733, "step": 28979 }, { "epoch": 0.55, "learning_rate": 2.2433485743190574e-06, "loss": 1.055, "step": 28980 }, { "epoch": 0.55, "learning_rate": 2.243196616409314e-06, "loss": 1.0854, "step": 28981 }, { "epoch": 0.55, "learning_rate": 2.2430446594584666e-06, "loss": 0.8914, "step": 28982 }, { "epoch": 0.55, "learning_rate": 2.2428927034670815e-06, "loss": 0.8943, "step": 28983 }, { "epoch": 0.55, "learning_rate": 2.242740748435728e-06, "loss": 0.9786, "step": 28984 }, { "epoch": 0.55, "learning_rate": 2.2425887943649722e-06, "loss": 0.8095, "step": 28985 }, { "epoch": 0.55, "learning_rate": 2.2424368412553817e-06, "loss": 0.7997, "step": 28986 }, { "epoch": 0.55, "learning_rate": 2.242284889107525e-06, "loss": 1.1048, "step": 28987 }, { "epoch": 0.55, "learning_rate": 2.2421329379219687e-06, "loss": 1.0551, "step": 28988 }, { "epoch": 0.55, "learning_rate": 2.241980987699279e-06, "loss": 0.9126, "step": 28989 }, { "epoch": 0.55, "learning_rate": 2.2418290384400255e-06, "loss": 0.9425, "step": 28990 }, { "epoch": 0.55, "learning_rate": 2.241677090144774e-06, "loss": 0.7873, "step": 28991 }, { "epoch": 0.55, "learning_rate": 2.2415251428140922e-06, "loss": 0.8038, "step": 28992 }, { "epoch": 0.55, "learning_rate": 2.2413731964485476e-06, "loss": 0.9352, "step": 28993 }, { "epoch": 0.55, "learning_rate": 2.241221251048708e-06, "loss": 1.1103, "step": 28994 }, { "epoch": 0.55, "learning_rate": 2.2410693066151397e-06, "loss": 0.7621, "step": 28995 }, { "epoch": 0.55, "learning_rate": 2.240917363148411e-06, "loss": 0.8189, "step": 28996 }, { "epoch": 0.55, "learning_rate": 2.24076542064909e-06, "loss": 0.8692, "step": 28997 }, { "epoch": 0.55, "learning_rate": 2.240613479117741e-06, "loss": 1.0144, "step": 28998 }, { "epoch": 0.55, "learning_rate": 2.240461538554934e-06, "loss": 1.0474, "step": 28999 }, { "epoch": 0.55, "learning_rate": 2.240309598961236e-06, "loss": 1.1833, "step": 29000 }, { "epoch": 0.55, "learning_rate": 2.2401576603372134e-06, "loss": 0.7818, "step": 29001 }, { "epoch": 0.55, "learning_rate": 2.2400057226834353e-06, "loss": 0.8628, "step": 29002 }, { "epoch": 0.55, "learning_rate": 2.2398537860004674e-06, "loss": 0.8718, "step": 29003 }, { "epoch": 0.55, "learning_rate": 2.2397018502888764e-06, "loss": 0.7687, "step": 29004 }, { "epoch": 0.55, "learning_rate": 2.239549915549232e-06, "loss": 0.9745, "step": 29005 }, { "epoch": 0.55, "learning_rate": 2.2393979817820997e-06, "loss": 1.0263, "step": 29006 }, { "epoch": 0.55, "learning_rate": 2.2392460489880464e-06, "loss": 0.9799, "step": 29007 }, { "epoch": 0.55, "learning_rate": 2.239094117167642e-06, "loss": 0.8955, "step": 29008 }, { "epoch": 0.55, "learning_rate": 2.2389421863214518e-06, "loss": 1.0623, "step": 29009 }, { "epoch": 0.55, "learning_rate": 2.238790256450043e-06, "loss": 0.8625, "step": 29010 }, { "epoch": 0.55, "learning_rate": 2.2386383275539835e-06, "loss": 0.6848, "step": 29011 }, { "epoch": 0.55, "learning_rate": 2.238486399633841e-06, "loss": 1.0833, "step": 29012 }, { "epoch": 0.55, "learning_rate": 2.2383344726901814e-06, "loss": 0.9657, "step": 29013 }, { "epoch": 0.55, "learning_rate": 2.238182546723573e-06, "loss": 0.8958, "step": 29014 }, { "epoch": 0.55, "learning_rate": 2.238030621734584e-06, "loss": 0.991, "step": 29015 }, { "epoch": 0.55, "learning_rate": 2.2378786977237785e-06, "loss": 0.8078, "step": 29016 }, { "epoch": 0.55, "learning_rate": 2.237726774691728e-06, "loss": 0.7671, "step": 29017 }, { "epoch": 0.55, "learning_rate": 2.2375748526389972e-06, "loss": 0.8748, "step": 29018 }, { "epoch": 0.55, "learning_rate": 2.237422931566153e-06, "loss": 1.2134, "step": 29019 }, { "epoch": 0.55, "learning_rate": 2.2372710114737643e-06, "loss": 1.0488, "step": 29020 }, { "epoch": 0.55, "learning_rate": 2.2371190923623975e-06, "loss": 0.7651, "step": 29021 }, { "epoch": 0.55, "learning_rate": 2.2369671742326195e-06, "loss": 0.884, "step": 29022 }, { "epoch": 0.55, "learning_rate": 2.2368152570849986e-06, "loss": 0.9074, "step": 29023 }, { "epoch": 0.55, "learning_rate": 2.2366633409201015e-06, "loss": 0.8662, "step": 29024 }, { "epoch": 0.55, "learning_rate": 2.2365114257384945e-06, "loss": 0.8197, "step": 29025 }, { "epoch": 0.55, "learning_rate": 2.2363595115407468e-06, "loss": 0.9347, "step": 29026 }, { "epoch": 0.55, "learning_rate": 2.236207598327424e-06, "loss": 0.712, "step": 29027 }, { "epoch": 0.55, "learning_rate": 2.2360556860990936e-06, "loss": 0.8347, "step": 29028 }, { "epoch": 0.55, "learning_rate": 2.235903774856324e-06, "loss": 0.8228, "step": 29029 }, { "epoch": 0.55, "learning_rate": 2.2357518645996817e-06, "loss": 1.048, "step": 29030 }, { "epoch": 0.55, "learning_rate": 2.2355999553297328e-06, "loss": 1.1295, "step": 29031 }, { "epoch": 0.55, "learning_rate": 2.2354480470470465e-06, "loss": 0.9335, "step": 29032 }, { "epoch": 0.55, "learning_rate": 2.2352961397521886e-06, "loss": 0.9543, "step": 29033 }, { "epoch": 0.55, "learning_rate": 2.235144233445727e-06, "loss": 0.8, "step": 29034 }, { "epoch": 0.55, "learning_rate": 2.2349923281282284e-06, "loss": 0.9258, "step": 29035 }, { "epoch": 0.55, "learning_rate": 2.2348404238002614e-06, "loss": 0.8448, "step": 29036 }, { "epoch": 0.55, "learning_rate": 2.2346885204623905e-06, "loss": 1.0606, "step": 29037 }, { "epoch": 0.55, "learning_rate": 2.2345366181151855e-06, "loss": 0.9731, "step": 29038 }, { "epoch": 0.55, "learning_rate": 2.234384716759213e-06, "loss": 0.9533, "step": 29039 }, { "epoch": 0.55, "learning_rate": 2.234232816395039e-06, "loss": 0.7568, "step": 29040 }, { "epoch": 0.55, "learning_rate": 2.2340809170232316e-06, "loss": 0.8385, "step": 29041 }, { "epoch": 0.55, "learning_rate": 2.2339290186443586e-06, "loss": 0.7516, "step": 29042 }, { "epoch": 0.55, "learning_rate": 2.2337771212589854e-06, "loss": 0.9244, "step": 29043 }, { "epoch": 0.55, "learning_rate": 2.233625224867681e-06, "loss": 0.9846, "step": 29044 }, { "epoch": 0.55, "learning_rate": 2.233473329471012e-06, "loss": 1.1125, "step": 29045 }, { "epoch": 0.55, "learning_rate": 2.2333214350695446e-06, "loss": 0.8698, "step": 29046 }, { "epoch": 0.55, "learning_rate": 2.233169541663848e-06, "loss": 0.9188, "step": 29047 }, { "epoch": 0.55, "learning_rate": 2.2330176492544873e-06, "loss": 0.9921, "step": 29048 }, { "epoch": 0.55, "learning_rate": 2.23286575784203e-06, "loss": 0.9845, "step": 29049 }, { "epoch": 0.55, "learning_rate": 2.232713867427045e-06, "loss": 1.0167, "step": 29050 }, { "epoch": 0.55, "learning_rate": 2.232561978010098e-06, "loss": 0.8428, "step": 29051 }, { "epoch": 0.55, "learning_rate": 2.2324100895917568e-06, "loss": 0.6748, "step": 29052 }, { "epoch": 0.55, "learning_rate": 2.2322582021725863e-06, "loss": 0.915, "step": 29053 }, { "epoch": 0.55, "learning_rate": 2.232106315753156e-06, "loss": 0.7473, "step": 29054 }, { "epoch": 0.55, "learning_rate": 2.231954430334034e-06, "loss": 0.8912, "step": 29055 }, { "epoch": 0.55, "learning_rate": 2.2318025459157843e-06, "loss": 0.9311, "step": 29056 }, { "epoch": 0.55, "learning_rate": 2.2316506624989766e-06, "loss": 0.9706, "step": 29057 }, { "epoch": 0.55, "learning_rate": 2.2314987800841777e-06, "loss": 0.9908, "step": 29058 }, { "epoch": 0.55, "learning_rate": 2.2313468986719523e-06, "loss": 0.7969, "step": 29059 }, { "epoch": 0.55, "learning_rate": 2.231195018262871e-06, "loss": 0.7036, "step": 29060 }, { "epoch": 0.55, "learning_rate": 2.2310431388574984e-06, "loss": 1.08, "step": 29061 }, { "epoch": 0.55, "learning_rate": 2.230891260456402e-06, "loss": 1.0742, "step": 29062 }, { "epoch": 0.55, "learning_rate": 2.2307393830601503e-06, "loss": 0.9626, "step": 29063 }, { "epoch": 0.55, "learning_rate": 2.23058750666931e-06, "loss": 0.9947, "step": 29064 }, { "epoch": 0.55, "learning_rate": 2.230435631284446e-06, "loss": 0.9426, "step": 29065 }, { "epoch": 0.55, "learning_rate": 2.2302837569061283e-06, "loss": 0.7699, "step": 29066 }, { "epoch": 0.55, "learning_rate": 2.2301318835349222e-06, "loss": 0.9658, "step": 29067 }, { "epoch": 0.55, "learning_rate": 2.2299800111713957e-06, "loss": 1.1975, "step": 29068 }, { "epoch": 0.55, "learning_rate": 2.2298281398161153e-06, "loss": 1.0291, "step": 29069 }, { "epoch": 0.55, "learning_rate": 2.229676269469649e-06, "loss": 0.9448, "step": 29070 }, { "epoch": 0.55, "learning_rate": 2.2295244001325623e-06, "loss": 0.8965, "step": 29071 }, { "epoch": 0.55, "learning_rate": 2.229372531805424e-06, "loss": 0.8166, "step": 29072 }, { "epoch": 0.55, "learning_rate": 2.2292206644888005e-06, "loss": 0.7322, "step": 29073 }, { "epoch": 0.55, "learning_rate": 2.2290687981832578e-06, "loss": 1.1445, "step": 29074 }, { "epoch": 0.55, "learning_rate": 2.228916932889364e-06, "loss": 1.0308, "step": 29075 }, { "epoch": 0.55, "learning_rate": 2.228765068607687e-06, "loss": 0.9414, "step": 29076 }, { "epoch": 0.55, "learning_rate": 2.2286132053387917e-06, "loss": 0.7959, "step": 29077 }, { "epoch": 0.55, "learning_rate": 2.2284613430832477e-06, "loss": 0.9135, "step": 29078 }, { "epoch": 0.55, "learning_rate": 2.2283094818416203e-06, "loss": 0.9655, "step": 29079 }, { "epoch": 0.55, "learning_rate": 2.228157621614476e-06, "loss": 0.8458, "step": 29080 }, { "epoch": 0.55, "learning_rate": 2.228005762402384e-06, "loss": 0.8257, "step": 29081 }, { "epoch": 0.55, "learning_rate": 2.2278539042059094e-06, "loss": 0.9255, "step": 29082 }, { "epoch": 0.55, "learning_rate": 2.2277020470256196e-06, "loss": 0.9248, "step": 29083 }, { "epoch": 0.55, "learning_rate": 2.227550190862083e-06, "loss": 0.9095, "step": 29084 }, { "epoch": 0.55, "learning_rate": 2.2273983357158657e-06, "loss": 0.8728, "step": 29085 }, { "epoch": 0.55, "learning_rate": 2.227246481587534e-06, "loss": 0.8873, "step": 29086 }, { "epoch": 0.55, "learning_rate": 2.227094628477656e-06, "loss": 1.0421, "step": 29087 }, { "epoch": 0.55, "learning_rate": 2.226942776386798e-06, "loss": 1.0277, "step": 29088 }, { "epoch": 0.55, "learning_rate": 2.226790925315527e-06, "loss": 0.9302, "step": 29089 }, { "epoch": 0.55, "learning_rate": 2.2266390752644106e-06, "loss": 0.8037, "step": 29090 }, { "epoch": 0.55, "learning_rate": 2.2264872262340164e-06, "loss": 1.0689, "step": 29091 }, { "epoch": 0.55, "learning_rate": 2.226335378224909e-06, "loss": 0.7666, "step": 29092 }, { "epoch": 0.55, "learning_rate": 2.226183531237658e-06, "loss": 1.1099, "step": 29093 }, { "epoch": 0.55, "learning_rate": 2.2260316852728293e-06, "loss": 0.9698, "step": 29094 }, { "epoch": 0.55, "learning_rate": 2.225879840330989e-06, "loss": 0.6909, "step": 29095 }, { "epoch": 0.55, "learning_rate": 2.225727996412705e-06, "loss": 0.8893, "step": 29096 }, { "epoch": 0.55, "learning_rate": 2.2255761535185457e-06, "loss": 1.0284, "step": 29097 }, { "epoch": 0.55, "learning_rate": 2.2254243116490747e-06, "loss": 0.8368, "step": 29098 }, { "epoch": 0.55, "learning_rate": 2.225272470804862e-06, "loss": 0.7526, "step": 29099 }, { "epoch": 0.55, "learning_rate": 2.2251206309864742e-06, "loss": 1.032, "step": 29100 }, { "epoch": 0.55, "learning_rate": 2.224968792194476e-06, "loss": 0.7905, "step": 29101 }, { "epoch": 0.55, "learning_rate": 2.224816954429437e-06, "loss": 0.9287, "step": 29102 }, { "epoch": 0.55, "learning_rate": 2.2246651176919226e-06, "loss": 0.9218, "step": 29103 }, { "epoch": 0.55, "learning_rate": 2.224513281982499e-06, "loss": 0.8416, "step": 29104 }, { "epoch": 0.55, "learning_rate": 2.2243614473017363e-06, "loss": 1.0436, "step": 29105 }, { "epoch": 0.55, "learning_rate": 2.2242096136501997e-06, "loss": 0.9808, "step": 29106 }, { "epoch": 0.55, "learning_rate": 2.224057781028454e-06, "loss": 0.8941, "step": 29107 }, { "epoch": 0.55, "learning_rate": 2.2239059494370697e-06, "loss": 0.8856, "step": 29108 }, { "epoch": 0.55, "learning_rate": 2.2237541188766113e-06, "loss": 0.8578, "step": 29109 }, { "epoch": 0.55, "learning_rate": 2.223602289347647e-06, "loss": 0.8137, "step": 29110 }, { "epoch": 0.55, "learning_rate": 2.223450460850743e-06, "loss": 0.8661, "step": 29111 }, { "epoch": 0.55, "learning_rate": 2.223298633386467e-06, "loss": 0.8157, "step": 29112 }, { "epoch": 0.55, "learning_rate": 2.2231468069553842e-06, "loss": 0.9977, "step": 29113 }, { "epoch": 0.55, "learning_rate": 2.222994981558064e-06, "loss": 0.9729, "step": 29114 }, { "epoch": 0.55, "learning_rate": 2.222843157195072e-06, "loss": 1.0487, "step": 29115 }, { "epoch": 0.55, "learning_rate": 2.222691333866974e-06, "loss": 0.7986, "step": 29116 }, { "epoch": 0.55, "learning_rate": 2.2225395115743385e-06, "loss": 0.8059, "step": 29117 }, { "epoch": 0.55, "learning_rate": 2.222387690317733e-06, "loss": 0.7826, "step": 29118 }, { "epoch": 0.55, "learning_rate": 2.2222358700977217e-06, "loss": 0.96, "step": 29119 }, { "epoch": 0.55, "learning_rate": 2.2220840509148746e-06, "loss": 0.9785, "step": 29120 }, { "epoch": 0.55, "learning_rate": 2.221932232769757e-06, "loss": 0.8146, "step": 29121 }, { "epoch": 0.55, "learning_rate": 2.221780415662935e-06, "loss": 0.7292, "step": 29122 }, { "epoch": 0.55, "learning_rate": 2.2216285995949772e-06, "loss": 0.8145, "step": 29123 }, { "epoch": 0.55, "learning_rate": 2.2214767845664494e-06, "loss": 0.8318, "step": 29124 }, { "epoch": 0.55, "learning_rate": 2.221324970577918e-06, "loss": 1.0342, "step": 29125 }, { "epoch": 0.55, "learning_rate": 2.2211731576299515e-06, "loss": 0.9887, "step": 29126 }, { "epoch": 0.55, "learning_rate": 2.2210213457231165e-06, "loss": 0.9517, "step": 29127 }, { "epoch": 0.55, "learning_rate": 2.2208695348579775e-06, "loss": 0.8568, "step": 29128 }, { "epoch": 0.55, "learning_rate": 2.2207177250351044e-06, "loss": 0.949, "step": 29129 }, { "epoch": 0.55, "learning_rate": 2.2205659162550624e-06, "loss": 0.7099, "step": 29130 }, { "epoch": 0.55, "learning_rate": 2.2204141085184188e-06, "loss": 0.955, "step": 29131 }, { "epoch": 0.55, "learning_rate": 2.22026230182574e-06, "loss": 0.8617, "step": 29132 }, { "epoch": 0.55, "learning_rate": 2.2201104961775937e-06, "loss": 0.9067, "step": 29133 }, { "epoch": 0.55, "learning_rate": 2.2199586915745455e-06, "loss": 0.9097, "step": 29134 }, { "epoch": 0.55, "learning_rate": 2.2198068880171638e-06, "loss": 0.8967, "step": 29135 }, { "epoch": 0.55, "learning_rate": 2.2196550855060146e-06, "loss": 0.8699, "step": 29136 }, { "epoch": 0.55, "learning_rate": 2.2195032840416636e-06, "loss": 0.9887, "step": 29137 }, { "epoch": 0.55, "learning_rate": 2.2193514836246793e-06, "loss": 1.0367, "step": 29138 }, { "epoch": 0.55, "learning_rate": 2.2191996842556286e-06, "loss": 0.9051, "step": 29139 }, { "epoch": 0.55, "learning_rate": 2.2190478859350767e-06, "loss": 0.9171, "step": 29140 }, { "epoch": 0.55, "learning_rate": 2.2188960886635926e-06, "loss": 0.873, "step": 29141 }, { "epoch": 0.55, "learning_rate": 2.2187442924417414e-06, "loss": 0.8232, "step": 29142 }, { "epoch": 0.55, "learning_rate": 2.218592497270089e-06, "loss": 1.0723, "step": 29143 }, { "epoch": 0.55, "learning_rate": 2.2184407031492054e-06, "loss": 1.3024, "step": 29144 }, { "epoch": 0.55, "learning_rate": 2.2182889100796548e-06, "loss": 1.0568, "step": 29145 }, { "epoch": 0.55, "learning_rate": 2.2181371180620043e-06, "loss": 0.7435, "step": 29146 }, { "epoch": 0.55, "learning_rate": 2.2179853270968222e-06, "loss": 1.0497, "step": 29147 }, { "epoch": 0.55, "learning_rate": 2.217833537184674e-06, "loss": 0.7565, "step": 29148 }, { "epoch": 0.55, "learning_rate": 2.217681748326126e-06, "loss": 0.8813, "step": 29149 }, { "epoch": 0.55, "learning_rate": 2.2175299605217467e-06, "loss": 1.0873, "step": 29150 }, { "epoch": 0.55, "learning_rate": 2.217378173772101e-06, "loss": 1.0414, "step": 29151 }, { "epoch": 0.55, "learning_rate": 2.217226388077757e-06, "loss": 0.8831, "step": 29152 }, { "epoch": 0.55, "learning_rate": 2.217074603439281e-06, "loss": 0.9128, "step": 29153 }, { "epoch": 0.55, "learning_rate": 2.21692281985724e-06, "loss": 0.8984, "step": 29154 }, { "epoch": 0.55, "learning_rate": 2.2167710373321995e-06, "loss": 1.0208, "step": 29155 }, { "epoch": 0.55, "learning_rate": 2.216619255864728e-06, "loss": 1.0638, "step": 29156 }, { "epoch": 0.55, "learning_rate": 2.216467475455392e-06, "loss": 0.9004, "step": 29157 }, { "epoch": 0.55, "learning_rate": 2.2163156961047564e-06, "loss": 0.7568, "step": 29158 }, { "epoch": 0.55, "learning_rate": 2.2161639178133904e-06, "loss": 1.092, "step": 29159 }, { "epoch": 0.55, "learning_rate": 2.2160121405818596e-06, "loss": 0.7892, "step": 29160 }, { "epoch": 0.55, "learning_rate": 2.2158603644107297e-06, "loss": 0.8102, "step": 29161 }, { "epoch": 0.55, "learning_rate": 2.2157085893005696e-06, "loss": 0.9884, "step": 29162 }, { "epoch": 0.55, "learning_rate": 2.215556815251945e-06, "loss": 0.9189, "step": 29163 }, { "epoch": 0.55, "learning_rate": 2.2154050422654215e-06, "loss": 0.8274, "step": 29164 }, { "epoch": 0.55, "learning_rate": 2.215253270341568e-06, "loss": 0.8352, "step": 29165 }, { "epoch": 0.55, "learning_rate": 2.2151014994809493e-06, "loss": 0.8561, "step": 29166 }, { "epoch": 0.55, "learning_rate": 2.214949729684133e-06, "loss": 1.0198, "step": 29167 }, { "epoch": 0.55, "learning_rate": 2.2147979609516857e-06, "loss": 1.1711, "step": 29168 }, { "epoch": 0.55, "learning_rate": 2.2146461932841746e-06, "loss": 0.9667, "step": 29169 }, { "epoch": 0.55, "learning_rate": 2.214494426682165e-06, "loss": 0.9872, "step": 29170 }, { "epoch": 0.55, "learning_rate": 2.2143426611462248e-06, "loss": 0.8997, "step": 29171 }, { "epoch": 0.55, "learning_rate": 2.2141908966769203e-06, "loss": 0.8083, "step": 29172 }, { "epoch": 0.55, "learning_rate": 2.2140391332748184e-06, "loss": 0.9303, "step": 29173 }, { "epoch": 0.55, "learning_rate": 2.2138873709404855e-06, "loss": 0.9846, "step": 29174 }, { "epoch": 0.55, "learning_rate": 2.2137356096744885e-06, "loss": 1.0257, "step": 29175 }, { "epoch": 0.55, "learning_rate": 2.2135838494773933e-06, "loss": 0.8263, "step": 29176 }, { "epoch": 0.55, "learning_rate": 2.2134320903497683e-06, "loss": 0.9815, "step": 29177 }, { "epoch": 0.55, "learning_rate": 2.213280332292179e-06, "loss": 0.8771, "step": 29178 }, { "epoch": 0.55, "learning_rate": 2.213128575305191e-06, "loss": 0.8428, "step": 29179 }, { "epoch": 0.55, "learning_rate": 2.2129768193893727e-06, "loss": 0.8267, "step": 29180 }, { "epoch": 0.55, "learning_rate": 2.2128250645452907e-06, "loss": 0.9844, "step": 29181 }, { "epoch": 0.55, "learning_rate": 2.21267331077351e-06, "loss": 0.7881, "step": 29182 }, { "epoch": 0.55, "learning_rate": 2.2125215580745995e-06, "loss": 0.9031, "step": 29183 }, { "epoch": 0.55, "learning_rate": 2.2123698064491245e-06, "loss": 0.8922, "step": 29184 }, { "epoch": 0.55, "learning_rate": 2.212218055897651e-06, "loss": 0.851, "step": 29185 }, { "epoch": 0.55, "learning_rate": 2.2120663064207474e-06, "loss": 0.9771, "step": 29186 }, { "epoch": 0.55, "learning_rate": 2.211914558018979e-06, "loss": 1.1329, "step": 29187 }, { "epoch": 0.55, "learning_rate": 2.211762810692912e-06, "loss": 1.1702, "step": 29188 }, { "epoch": 0.55, "learning_rate": 2.211611064443115e-06, "loss": 1.0192, "step": 29189 }, { "epoch": 0.55, "learning_rate": 2.211459319270154e-06, "loss": 0.9016, "step": 29190 }, { "epoch": 0.55, "learning_rate": 2.211307575174593e-06, "loss": 0.8551, "step": 29191 }, { "epoch": 0.55, "learning_rate": 2.211155832157002e-06, "loss": 0.746, "step": 29192 }, { "epoch": 0.55, "learning_rate": 2.2110040902179466e-06, "loss": 1.0071, "step": 29193 }, { "epoch": 0.55, "learning_rate": 2.210852349357992e-06, "loss": 1.0083, "step": 29194 }, { "epoch": 0.55, "learning_rate": 2.210700609577706e-06, "loss": 0.9316, "step": 29195 }, { "epoch": 0.55, "learning_rate": 2.210548870877656e-06, "loss": 0.9528, "step": 29196 }, { "epoch": 0.55, "learning_rate": 2.2103971332584066e-06, "loss": 0.9573, "step": 29197 }, { "epoch": 0.55, "learning_rate": 2.210245396720526e-06, "loss": 0.7908, "step": 29198 }, { "epoch": 0.55, "learning_rate": 2.2100936612645805e-06, "loss": 0.9325, "step": 29199 }, { "epoch": 0.55, "learning_rate": 2.209941926891136e-06, "loss": 0.8987, "step": 29200 }, { "epoch": 0.55, "learning_rate": 2.209790193600759e-06, "loss": 0.9106, "step": 29201 }, { "epoch": 0.55, "learning_rate": 2.2096384613940173e-06, "loss": 0.9953, "step": 29202 }, { "epoch": 0.55, "learning_rate": 2.2094867302714755e-06, "loss": 0.965, "step": 29203 }, { "epoch": 0.55, "learning_rate": 2.209335000233703e-06, "loss": 1.0355, "step": 29204 }, { "epoch": 0.55, "learning_rate": 2.209183271281264e-06, "loss": 0.8467, "step": 29205 }, { "epoch": 0.55, "learning_rate": 2.209031543414725e-06, "loss": 1.0775, "step": 29206 }, { "epoch": 0.55, "learning_rate": 2.2088798166346545e-06, "loss": 0.9839, "step": 29207 }, { "epoch": 0.55, "learning_rate": 2.208728090941617e-06, "loss": 0.9382, "step": 29208 }, { "epoch": 0.55, "learning_rate": 2.2085763663361797e-06, "loss": 1.0127, "step": 29209 }, { "epoch": 0.55, "learning_rate": 2.20842464281891e-06, "loss": 0.7886, "step": 29210 }, { "epoch": 0.55, "learning_rate": 2.208272920390374e-06, "loss": 0.7179, "step": 29211 }, { "epoch": 0.55, "learning_rate": 2.2081211990511367e-06, "loss": 1.0344, "step": 29212 }, { "epoch": 0.55, "learning_rate": 2.207969478801767e-06, "loss": 0.8768, "step": 29213 }, { "epoch": 0.55, "learning_rate": 2.20781775964283e-06, "loss": 0.8942, "step": 29214 }, { "epoch": 0.55, "learning_rate": 2.2076660415748923e-06, "loss": 0.8771, "step": 29215 }, { "epoch": 0.55, "learning_rate": 2.2075143245985206e-06, "loss": 0.7499, "step": 29216 }, { "epoch": 0.55, "learning_rate": 2.2073626087142823e-06, "loss": 0.9179, "step": 29217 }, { "epoch": 0.55, "learning_rate": 2.2072108939227414e-06, "loss": 0.8938, "step": 29218 }, { "epoch": 0.55, "learning_rate": 2.2070591802244677e-06, "loss": 1.0269, "step": 29219 }, { "epoch": 0.55, "learning_rate": 2.2069074676200257e-06, "loss": 0.7705, "step": 29220 }, { "epoch": 0.55, "learning_rate": 2.2067557561099815e-06, "loss": 0.8147, "step": 29221 }, { "epoch": 0.55, "learning_rate": 2.2066040456949024e-06, "loss": 0.9538, "step": 29222 }, { "epoch": 0.55, "learning_rate": 2.2064523363753557e-06, "loss": 0.6501, "step": 29223 }, { "epoch": 0.55, "learning_rate": 2.2063006281519057e-06, "loss": 0.864, "step": 29224 }, { "epoch": 0.55, "learning_rate": 2.206148921025121e-06, "loss": 0.9703, "step": 29225 }, { "epoch": 0.55, "learning_rate": 2.205997214995568e-06, "loss": 0.9584, "step": 29226 }, { "epoch": 0.55, "learning_rate": 2.2058455100638106e-06, "loss": 0.9776, "step": 29227 }, { "epoch": 0.55, "learning_rate": 2.2056938062304185e-06, "loss": 0.8991, "step": 29228 }, { "epoch": 0.55, "learning_rate": 2.2055421034959563e-06, "loss": 0.7051, "step": 29229 }, { "epoch": 0.55, "learning_rate": 2.20539040186099e-06, "loss": 0.9647, "step": 29230 }, { "epoch": 0.55, "learning_rate": 2.205238701326088e-06, "loss": 0.9878, "step": 29231 }, { "epoch": 0.55, "learning_rate": 2.2050870018918156e-06, "loss": 0.8678, "step": 29232 }, { "epoch": 0.55, "learning_rate": 2.204935303558738e-06, "loss": 0.8771, "step": 29233 }, { "epoch": 0.55, "learning_rate": 2.2047836063274245e-06, "loss": 0.6805, "step": 29234 }, { "epoch": 0.55, "learning_rate": 2.2046319101984394e-06, "loss": 0.9141, "step": 29235 }, { "epoch": 0.55, "learning_rate": 2.2044802151723493e-06, "loss": 1.0823, "step": 29236 }, { "epoch": 0.55, "learning_rate": 2.2043285212497212e-06, "loss": 1.1818, "step": 29237 }, { "epoch": 0.55, "learning_rate": 2.2041768284311218e-06, "loss": 1.0275, "step": 29238 }, { "epoch": 0.55, "learning_rate": 2.204025136717116e-06, "loss": 0.955, "step": 29239 }, { "epoch": 0.55, "learning_rate": 2.2038734461082726e-06, "loss": 0.8378, "step": 29240 }, { "epoch": 0.55, "learning_rate": 2.2037217566051562e-06, "loss": 1.0712, "step": 29241 }, { "epoch": 0.55, "learning_rate": 2.203570068208333e-06, "loss": 0.688, "step": 29242 }, { "epoch": 0.55, "learning_rate": 2.2034183809183706e-06, "loss": 0.9863, "step": 29243 }, { "epoch": 0.55, "learning_rate": 2.203266694735835e-06, "loss": 0.9613, "step": 29244 }, { "epoch": 0.55, "learning_rate": 2.203115009661292e-06, "loss": 0.9543, "step": 29245 }, { "epoch": 0.55, "learning_rate": 2.202963325695309e-06, "loss": 0.9722, "step": 29246 }, { "epoch": 0.55, "learning_rate": 2.202811642838452e-06, "loss": 0.746, "step": 29247 }, { "epoch": 0.55, "learning_rate": 2.2026599610912865e-06, "loss": 0.9574, "step": 29248 }, { "epoch": 0.55, "learning_rate": 2.2025082804543803e-06, "loss": 0.8952, "step": 29249 }, { "epoch": 0.55, "learning_rate": 2.2023566009282985e-06, "loss": 1.0666, "step": 29250 }, { "epoch": 0.55, "learning_rate": 2.202204922513608e-06, "loss": 0.8995, "step": 29251 }, { "epoch": 0.55, "learning_rate": 2.202053245210876e-06, "loss": 0.9477, "step": 29252 }, { "epoch": 0.55, "learning_rate": 2.2019015690206673e-06, "loss": 1.0633, "step": 29253 }, { "epoch": 0.55, "learning_rate": 2.2017498939435486e-06, "loss": 0.8621, "step": 29254 }, { "epoch": 0.55, "learning_rate": 2.2015982199800877e-06, "loss": 0.9411, "step": 29255 }, { "epoch": 0.55, "learning_rate": 2.2014465471308494e-06, "loss": 1.2163, "step": 29256 }, { "epoch": 0.55, "learning_rate": 2.2012948753964e-06, "loss": 0.9866, "step": 29257 }, { "epoch": 0.55, "learning_rate": 2.201143204777307e-06, "loss": 0.8127, "step": 29258 }, { "epoch": 0.55, "learning_rate": 2.2009915352741364e-06, "loss": 0.9558, "step": 29259 }, { "epoch": 0.55, "learning_rate": 2.2008398668874535e-06, "loss": 0.9491, "step": 29260 }, { "epoch": 0.55, "learning_rate": 2.2006881996178263e-06, "loss": 0.7957, "step": 29261 }, { "epoch": 0.55, "learning_rate": 2.20053653346582e-06, "loss": 1.0201, "step": 29262 }, { "epoch": 0.55, "learning_rate": 2.200384868432e-06, "loss": 0.8538, "step": 29263 }, { "epoch": 0.55, "learning_rate": 2.2002332045169343e-06, "loss": 0.86, "step": 29264 }, { "epoch": 0.55, "learning_rate": 2.200081541721189e-06, "loss": 0.7783, "step": 29265 }, { "epoch": 0.55, "learning_rate": 2.1999298800453293e-06, "loss": 0.7332, "step": 29266 }, { "epoch": 0.55, "learning_rate": 2.199778219489923e-06, "loss": 0.892, "step": 29267 }, { "epoch": 0.55, "learning_rate": 2.199626560055536e-06, "loss": 0.8861, "step": 29268 }, { "epoch": 0.55, "learning_rate": 2.199474901742733e-06, "loss": 1.1077, "step": 29269 }, { "epoch": 0.55, "learning_rate": 2.1993232445520824e-06, "loss": 1.0311, "step": 29270 }, { "epoch": 0.55, "learning_rate": 2.199171588484149e-06, "loss": 0.806, "step": 29271 }, { "epoch": 0.55, "learning_rate": 2.1990199335394992e-06, "loss": 1.0576, "step": 29272 }, { "epoch": 0.55, "learning_rate": 2.1988682797187007e-06, "loss": 0.7231, "step": 29273 }, { "epoch": 0.55, "learning_rate": 2.1987166270223194e-06, "loss": 0.8285, "step": 29274 }, { "epoch": 0.55, "learning_rate": 2.1985649754509194e-06, "loss": 1.0004, "step": 29275 }, { "epoch": 0.55, "learning_rate": 2.1984133250050694e-06, "loss": 0.897, "step": 29276 }, { "epoch": 0.55, "learning_rate": 2.198261675685335e-06, "loss": 0.7297, "step": 29277 }, { "epoch": 0.55, "learning_rate": 2.1981100274922814e-06, "loss": 0.8585, "step": 29278 }, { "epoch": 0.55, "learning_rate": 2.197958380426476e-06, "loss": 0.7663, "step": 29279 }, { "epoch": 0.55, "learning_rate": 2.1978067344884856e-06, "loss": 1.1954, "step": 29280 }, { "epoch": 0.55, "learning_rate": 2.1976550896788746e-06, "loss": 1.084, "step": 29281 }, { "epoch": 0.55, "learning_rate": 2.1975034459982108e-06, "loss": 0.9901, "step": 29282 }, { "epoch": 0.55, "learning_rate": 2.19735180344706e-06, "loss": 0.834, "step": 29283 }, { "epoch": 0.55, "learning_rate": 2.197200162025988e-06, "loss": 0.8433, "step": 29284 }, { "epoch": 0.55, "learning_rate": 2.1970485217355605e-06, "loss": 0.8458, "step": 29285 }, { "epoch": 0.55, "learning_rate": 2.1968968825763458e-06, "loss": 0.8527, "step": 29286 }, { "epoch": 0.55, "learning_rate": 2.1967452445489086e-06, "loss": 1.1177, "step": 29287 }, { "epoch": 0.55, "learning_rate": 2.196593607653814e-06, "loss": 0.8413, "step": 29288 }, { "epoch": 0.55, "learning_rate": 2.1964419718916315e-06, "loss": 1.0724, "step": 29289 }, { "epoch": 0.55, "learning_rate": 2.1962903372629246e-06, "loss": 0.7511, "step": 29290 }, { "epoch": 0.55, "learning_rate": 2.19613870376826e-06, "loss": 0.8293, "step": 29291 }, { "epoch": 0.55, "learning_rate": 2.1959870714082043e-06, "loss": 0.9142, "step": 29292 }, { "epoch": 0.55, "learning_rate": 2.1958354401833242e-06, "loss": 1.0777, "step": 29293 }, { "epoch": 0.55, "learning_rate": 2.1956838100941836e-06, "loss": 1.0073, "step": 29294 }, { "epoch": 0.55, "learning_rate": 2.1955321811413517e-06, "loss": 0.9852, "step": 29295 }, { "epoch": 0.55, "learning_rate": 2.1953805533253935e-06, "loss": 0.8293, "step": 29296 }, { "epoch": 0.55, "learning_rate": 2.195228926646874e-06, "loss": 0.8676, "step": 29297 }, { "epoch": 0.55, "learning_rate": 2.1950773011063608e-06, "loss": 0.9913, "step": 29298 }, { "epoch": 0.55, "learning_rate": 2.1949256767044196e-06, "loss": 0.8268, "step": 29299 }, { "epoch": 0.55, "learning_rate": 2.1947740534416162e-06, "loss": 1.2681, "step": 29300 }, { "epoch": 0.55, "learning_rate": 2.1946224313185177e-06, "loss": 0.7991, "step": 29301 }, { "epoch": 0.55, "learning_rate": 2.19447081033569e-06, "loss": 0.8933, "step": 29302 }, { "epoch": 0.55, "learning_rate": 2.1943191904936977e-06, "loss": 1.0269, "step": 29303 }, { "epoch": 0.55, "learning_rate": 2.1941675717931094e-06, "loss": 0.7814, "step": 29304 }, { "epoch": 0.55, "learning_rate": 2.1940159542344894e-06, "loss": 0.8867, "step": 29305 }, { "epoch": 0.55, "learning_rate": 2.1938643378184036e-06, "loss": 1.0518, "step": 29306 }, { "epoch": 0.55, "learning_rate": 2.1937127225454207e-06, "loss": 0.9897, "step": 29307 }, { "epoch": 0.55, "learning_rate": 2.1935611084161045e-06, "loss": 1.1612, "step": 29308 }, { "epoch": 0.55, "learning_rate": 2.193409495431021e-06, "loss": 0.7996, "step": 29309 }, { "epoch": 0.55, "learning_rate": 2.1932578835907378e-06, "loss": 0.7678, "step": 29310 }, { "epoch": 0.55, "learning_rate": 2.19310627289582e-06, "loss": 0.7932, "step": 29311 }, { "epoch": 0.55, "learning_rate": 2.1929546633468337e-06, "loss": 1.1636, "step": 29312 }, { "epoch": 0.55, "learning_rate": 2.1928030549443454e-06, "loss": 0.8959, "step": 29313 }, { "epoch": 0.55, "learning_rate": 2.192651447688922e-06, "loss": 0.7025, "step": 29314 }, { "epoch": 0.55, "learning_rate": 2.192499841581127e-06, "loss": 0.8907, "step": 29315 }, { "epoch": 0.55, "learning_rate": 2.1923482366215297e-06, "loss": 0.9248, "step": 29316 }, { "epoch": 0.55, "learning_rate": 2.1921966328106944e-06, "loss": 0.8851, "step": 29317 }, { "epoch": 0.55, "learning_rate": 2.1920450301491862e-06, "loss": 1.0436, "step": 29318 }, { "epoch": 0.55, "learning_rate": 2.1918934286375736e-06, "loss": 1.0508, "step": 29319 }, { "epoch": 0.55, "learning_rate": 2.1917418282764214e-06, "loss": 0.8775, "step": 29320 }, { "epoch": 0.55, "learning_rate": 2.191590229066295e-06, "loss": 0.78, "step": 29321 }, { "epoch": 0.55, "learning_rate": 2.191438631007762e-06, "loss": 0.9805, "step": 29322 }, { "epoch": 0.55, "learning_rate": 2.191287034101388e-06, "loss": 1.0062, "step": 29323 }, { "epoch": 0.55, "learning_rate": 2.191135438347737e-06, "loss": 0.8361, "step": 29324 }, { "epoch": 0.55, "learning_rate": 2.190983843747379e-06, "loss": 1.1046, "step": 29325 }, { "epoch": 0.55, "learning_rate": 2.190832250300877e-06, "loss": 0.8528, "step": 29326 }, { "epoch": 0.55, "learning_rate": 2.190680658008797e-06, "loss": 0.8958, "step": 29327 }, { "epoch": 0.55, "learning_rate": 2.190529066871707e-06, "loss": 0.6695, "step": 29328 }, { "epoch": 0.55, "learning_rate": 2.190377476890172e-06, "loss": 0.7569, "step": 29329 }, { "epoch": 0.55, "learning_rate": 2.190225888064757e-06, "loss": 1.0123, "step": 29330 }, { "epoch": 0.55, "learning_rate": 2.19007430039603e-06, "loss": 1.1951, "step": 29331 }, { "epoch": 0.55, "learning_rate": 2.1899227138845558e-06, "loss": 0.8828, "step": 29332 }, { "epoch": 0.55, "learning_rate": 2.1897711285309004e-06, "loss": 0.8751, "step": 29333 }, { "epoch": 0.55, "learning_rate": 2.1896195443356304e-06, "loss": 0.9011, "step": 29334 }, { "epoch": 0.55, "learning_rate": 2.1894679612993115e-06, "loss": 0.9125, "step": 29335 }, { "epoch": 0.55, "learning_rate": 2.189316379422509e-06, "loss": 0.958, "step": 29336 }, { "epoch": 0.55, "learning_rate": 2.1891647987057908e-06, "loss": 0.965, "step": 29337 }, { "epoch": 0.55, "learning_rate": 2.189013219149722e-06, "loss": 1.1368, "step": 29338 }, { "epoch": 0.55, "learning_rate": 2.1888616407548665e-06, "loss": 0.7959, "step": 29339 }, { "epoch": 0.55, "learning_rate": 2.188710063521793e-06, "loss": 0.8449, "step": 29340 }, { "epoch": 0.55, "learning_rate": 2.188558487451067e-06, "loss": 1.0453, "step": 29341 }, { "epoch": 0.55, "learning_rate": 2.1884069125432532e-06, "loss": 1.0193, "step": 29342 }, { "epoch": 0.55, "learning_rate": 2.1882553387989196e-06, "loss": 0.801, "step": 29343 }, { "epoch": 0.55, "learning_rate": 2.1881037662186304e-06, "loss": 0.8414, "step": 29344 }, { "epoch": 0.55, "learning_rate": 2.1879521948029517e-06, "loss": 0.8003, "step": 29345 }, { "epoch": 0.55, "learning_rate": 2.1878006245524507e-06, "loss": 0.8255, "step": 29346 }, { "epoch": 0.55, "learning_rate": 2.187649055467692e-06, "loss": 0.877, "step": 29347 }, { "epoch": 0.55, "learning_rate": 2.187497487549242e-06, "loss": 0.814, "step": 29348 }, { "epoch": 0.55, "learning_rate": 2.187345920797668e-06, "loss": 0.9114, "step": 29349 }, { "epoch": 0.55, "learning_rate": 2.187194355213534e-06, "loss": 0.9914, "step": 29350 }, { "epoch": 0.55, "learning_rate": 2.187042790797406e-06, "loss": 1.082, "step": 29351 }, { "epoch": 0.55, "learning_rate": 2.1868912275498517e-06, "loss": 0.8782, "step": 29352 }, { "epoch": 0.55, "learning_rate": 2.186739665471435e-06, "loss": 0.9537, "step": 29353 }, { "epoch": 0.55, "learning_rate": 2.1865881045627234e-06, "loss": 0.8115, "step": 29354 }, { "epoch": 0.55, "learning_rate": 2.186436544824282e-06, "loss": 1.0921, "step": 29355 }, { "epoch": 0.55, "learning_rate": 2.1862849862566778e-06, "loss": 1.0956, "step": 29356 }, { "epoch": 0.55, "learning_rate": 2.1861334288604744e-06, "loss": 0.7992, "step": 29357 }, { "epoch": 0.55, "learning_rate": 2.18598187263624e-06, "loss": 0.8608, "step": 29358 }, { "epoch": 0.55, "learning_rate": 2.18583031758454e-06, "loss": 0.9659, "step": 29359 }, { "epoch": 0.55, "learning_rate": 2.185678763705939e-06, "loss": 1.0018, "step": 29360 }, { "epoch": 0.55, "learning_rate": 2.1855272110010044e-06, "loss": 0.7603, "step": 29361 }, { "epoch": 0.55, "learning_rate": 2.1853756594703017e-06, "loss": 1.0706, "step": 29362 }, { "epoch": 0.55, "learning_rate": 2.185224109114396e-06, "loss": 0.9781, "step": 29363 }, { "epoch": 0.55, "learning_rate": 2.1850725599338544e-06, "loss": 0.9589, "step": 29364 }, { "epoch": 0.55, "learning_rate": 2.1849210119292423e-06, "loss": 0.9424, "step": 29365 }, { "epoch": 0.55, "learning_rate": 2.1847694651011246e-06, "loss": 0.9388, "step": 29366 }, { "epoch": 0.55, "learning_rate": 2.1846179194500694e-06, "loss": 1.0847, "step": 29367 }, { "epoch": 0.55, "learning_rate": 2.1844663749766402e-06, "loss": 1.0552, "step": 29368 }, { "epoch": 0.55, "learning_rate": 2.184314831681404e-06, "loss": 1.0432, "step": 29369 }, { "epoch": 0.55, "learning_rate": 2.184163289564927e-06, "loss": 0.8198, "step": 29370 }, { "epoch": 0.55, "learning_rate": 2.1840117486277747e-06, "loss": 0.8584, "step": 29371 }, { "epoch": 0.55, "learning_rate": 2.1838602088705115e-06, "loss": 0.6951, "step": 29372 }, { "epoch": 0.55, "learning_rate": 2.183708670293706e-06, "loss": 0.9403, "step": 29373 }, { "epoch": 0.55, "learning_rate": 2.1835571328979223e-06, "loss": 1.0436, "step": 29374 }, { "epoch": 0.55, "learning_rate": 2.183405596683726e-06, "loss": 1.196, "step": 29375 }, { "epoch": 0.55, "learning_rate": 2.183254061651684e-06, "loss": 0.9091, "step": 29376 }, { "epoch": 0.55, "learning_rate": 2.183102527802362e-06, "loss": 0.9367, "step": 29377 }, { "epoch": 0.55, "learning_rate": 2.1829509951363243e-06, "loss": 0.7726, "step": 29378 }, { "epoch": 0.55, "learning_rate": 2.182799463654139e-06, "loss": 0.7805, "step": 29379 }, { "epoch": 0.55, "learning_rate": 2.1826479333563707e-06, "loss": 1.0796, "step": 29380 }, { "epoch": 0.55, "learning_rate": 2.182496404243584e-06, "loss": 0.967, "step": 29381 }, { "epoch": 0.55, "learning_rate": 2.1823448763163473e-06, "loss": 1.0461, "step": 29382 }, { "epoch": 0.55, "learning_rate": 2.182193349575225e-06, "loss": 0.9246, "step": 29383 }, { "epoch": 0.55, "learning_rate": 2.182041824020782e-06, "loss": 0.6763, "step": 29384 }, { "epoch": 0.55, "learning_rate": 2.181890299653586e-06, "loss": 0.8668, "step": 29385 }, { "epoch": 0.55, "learning_rate": 2.1817387764742024e-06, "loss": 0.8301, "step": 29386 }, { "epoch": 0.55, "learning_rate": 2.181587254483195e-06, "loss": 1.0021, "step": 29387 }, { "epoch": 0.55, "learning_rate": 2.181435733681132e-06, "loss": 1.0273, "step": 29388 }, { "epoch": 0.55, "learning_rate": 2.1812842140685782e-06, "loss": 1.0251, "step": 29389 }, { "epoch": 0.55, "learning_rate": 2.1811326956460984e-06, "loss": 1.0887, "step": 29390 }, { "epoch": 0.55, "learning_rate": 2.18098117841426e-06, "loss": 0.9636, "step": 29391 }, { "epoch": 0.55, "learning_rate": 2.180829662373629e-06, "loss": 0.7349, "step": 29392 }, { "epoch": 0.55, "learning_rate": 2.1806781475247684e-06, "loss": 1.2349, "step": 29393 }, { "epoch": 0.55, "learning_rate": 2.1805266338682474e-06, "loss": 1.2324, "step": 29394 }, { "epoch": 0.55, "learning_rate": 2.180375121404629e-06, "loss": 0.8154, "step": 29395 }, { "epoch": 0.55, "learning_rate": 2.180223610134481e-06, "loss": 0.9316, "step": 29396 }, { "epoch": 0.55, "learning_rate": 2.180072100058368e-06, "loss": 1.0428, "step": 29397 }, { "epoch": 0.55, "learning_rate": 2.179920591176856e-06, "loss": 1.0048, "step": 29398 }, { "epoch": 0.55, "learning_rate": 2.17976908349051e-06, "loss": 1.0469, "step": 29399 }, { "epoch": 0.55, "learning_rate": 2.1796175769998975e-06, "loss": 1.1128, "step": 29400 }, { "epoch": 0.55, "learning_rate": 2.179466071705583e-06, "loss": 0.7849, "step": 29401 }, { "epoch": 0.55, "learning_rate": 2.179314567608131e-06, "loss": 0.8742, "step": 29402 }, { "epoch": 0.55, "learning_rate": 2.1791630647081095e-06, "loss": 0.7588, "step": 29403 }, { "epoch": 0.55, "learning_rate": 2.1790115630060837e-06, "loss": 0.9387, "step": 29404 }, { "epoch": 0.55, "learning_rate": 2.178860062502618e-06, "loss": 1.0093, "step": 29405 }, { "epoch": 0.55, "learning_rate": 2.17870856319828e-06, "loss": 1.1732, "step": 29406 }, { "epoch": 0.55, "learning_rate": 2.1785570650936346e-06, "loss": 0.9296, "step": 29407 }, { "epoch": 0.55, "learning_rate": 2.1784055681892454e-06, "loss": 0.973, "step": 29408 }, { "epoch": 0.55, "learning_rate": 2.1782540724856817e-06, "loss": 0.7927, "step": 29409 }, { "epoch": 0.55, "learning_rate": 2.1781025779835068e-06, "loss": 0.7716, "step": 29410 }, { "epoch": 0.55, "learning_rate": 2.1779510846832864e-06, "loss": 0.9256, "step": 29411 }, { "epoch": 0.55, "learning_rate": 2.1777995925855877e-06, "loss": 0.9862, "step": 29412 }, { "epoch": 0.55, "learning_rate": 2.1776481016909756e-06, "loss": 0.9946, "step": 29413 }, { "epoch": 0.55, "learning_rate": 2.1774966120000143e-06, "loss": 0.8121, "step": 29414 }, { "epoch": 0.55, "learning_rate": 2.177345123513272e-06, "loss": 0.907, "step": 29415 }, { "epoch": 0.55, "learning_rate": 2.1771936362313127e-06, "loss": 0.7311, "step": 29416 }, { "epoch": 0.56, "learning_rate": 2.1770421501547024e-06, "loss": 1.0125, "step": 29417 }, { "epoch": 0.56, "learning_rate": 2.1768906652840065e-06, "loss": 0.8795, "step": 29418 }, { "epoch": 0.56, "learning_rate": 2.1767391816197918e-06, "loss": 1.0977, "step": 29419 }, { "epoch": 0.56, "learning_rate": 2.1765876991626223e-06, "loss": 0.7653, "step": 29420 }, { "epoch": 0.56, "learning_rate": 2.176436217913065e-06, "loss": 0.9139, "step": 29421 }, { "epoch": 0.56, "learning_rate": 2.1762847378716852e-06, "loss": 0.94, "step": 29422 }, { "epoch": 0.56, "learning_rate": 2.1761332590390472e-06, "loss": 0.9586, "step": 29423 }, { "epoch": 0.56, "learning_rate": 2.175981781415718e-06, "loss": 1.2342, "step": 29424 }, { "epoch": 0.56, "learning_rate": 2.1758303050022634e-06, "loss": 1.2494, "step": 29425 }, { "epoch": 0.56, "learning_rate": 2.1756788297992475e-06, "loss": 0.9717, "step": 29426 }, { "epoch": 0.56, "learning_rate": 2.175527355807238e-06, "loss": 0.7265, "step": 29427 }, { "epoch": 0.56, "learning_rate": 2.1753758830267995e-06, "loss": 0.9737, "step": 29428 }, { "epoch": 0.56, "learning_rate": 2.1752244114584965e-06, "loss": 0.8892, "step": 29429 }, { "epoch": 0.56, "learning_rate": 2.1750729411028964e-06, "loss": 0.7468, "step": 29430 }, { "epoch": 0.56, "learning_rate": 2.174921471960564e-06, "loss": 1.0394, "step": 29431 }, { "epoch": 0.56, "learning_rate": 2.1747700040320635e-06, "loss": 0.8503, "step": 29432 }, { "epoch": 0.56, "learning_rate": 2.1746185373179636e-06, "loss": 0.8771, "step": 29433 }, { "epoch": 0.56, "learning_rate": 2.1744670718188278e-06, "loss": 0.8741, "step": 29434 }, { "epoch": 0.56, "learning_rate": 2.1743156075352207e-06, "loss": 0.7604, "step": 29435 }, { "epoch": 0.56, "learning_rate": 2.1741641444677107e-06, "loss": 0.9371, "step": 29436 }, { "epoch": 0.56, "learning_rate": 2.1740126826168605e-06, "loss": 0.8954, "step": 29437 }, { "epoch": 0.56, "learning_rate": 2.173861221983238e-06, "loss": 1.0561, "step": 29438 }, { "epoch": 0.56, "learning_rate": 2.173709762567407e-06, "loss": 0.8425, "step": 29439 }, { "epoch": 0.56, "learning_rate": 2.173558304369934e-06, "loss": 0.9523, "step": 29440 }, { "epoch": 0.56, "learning_rate": 2.173406847391384e-06, "loss": 1.0108, "step": 29441 }, { "epoch": 0.56, "learning_rate": 2.1732553916323233e-06, "loss": 0.843, "step": 29442 }, { "epoch": 0.56, "learning_rate": 2.1731039370933165e-06, "loss": 0.8331, "step": 29443 }, { "epoch": 0.56, "learning_rate": 2.17295248377493e-06, "loss": 0.942, "step": 29444 }, { "epoch": 0.56, "learning_rate": 2.1728010316777286e-06, "loss": 0.7931, "step": 29445 }, { "epoch": 0.56, "learning_rate": 2.1726495808022783e-06, "loss": 0.8742, "step": 29446 }, { "epoch": 0.56, "learning_rate": 2.172498131149144e-06, "loss": 0.9108, "step": 29447 }, { "epoch": 0.56, "learning_rate": 2.172346682718892e-06, "loss": 1.029, "step": 29448 }, { "epoch": 0.56, "learning_rate": 2.172195235512088e-06, "loss": 0.827, "step": 29449 }, { "epoch": 0.56, "learning_rate": 2.1720437895292957e-06, "loss": 1.0222, "step": 29450 }, { "epoch": 0.56, "learning_rate": 2.1718923447710826e-06, "loss": 1.05, "step": 29451 }, { "epoch": 0.56, "learning_rate": 2.1717409012380136e-06, "loss": 0.7847, "step": 29452 }, { "epoch": 0.56, "learning_rate": 2.171589458930653e-06, "loss": 0.6886, "step": 29453 }, { "epoch": 0.56, "learning_rate": 2.1714380178495688e-06, "loss": 0.893, "step": 29454 }, { "epoch": 0.56, "learning_rate": 2.1712865779953245e-06, "loss": 0.9653, "step": 29455 }, { "epoch": 0.56, "learning_rate": 2.1711351393684847e-06, "loss": 1.3723, "step": 29456 }, { "epoch": 0.56, "learning_rate": 2.1709837019696178e-06, "loss": 1.08, "step": 29457 }, { "epoch": 0.56, "learning_rate": 2.170832265799287e-06, "loss": 0.8711, "step": 29458 }, { "epoch": 0.56, "learning_rate": 2.170680830858058e-06, "loss": 0.8171, "step": 29459 }, { "epoch": 0.56, "learning_rate": 2.1705293971464978e-06, "loss": 0.8267, "step": 29460 }, { "epoch": 0.56, "learning_rate": 2.1703779646651704e-06, "loss": 0.9836, "step": 29461 }, { "epoch": 0.56, "learning_rate": 2.170226533414641e-06, "loss": 0.8543, "step": 29462 }, { "epoch": 0.56, "learning_rate": 2.170075103395476e-06, "loss": 0.9377, "step": 29463 }, { "epoch": 0.56, "learning_rate": 2.1699236746082403e-06, "loss": 0.9669, "step": 29464 }, { "epoch": 0.56, "learning_rate": 2.1697722470534996e-06, "loss": 0.8954, "step": 29465 }, { "epoch": 0.56, "learning_rate": 2.1696208207318188e-06, "loss": 0.8193, "step": 29466 }, { "epoch": 0.56, "learning_rate": 2.1694693956437647e-06, "loss": 0.819, "step": 29467 }, { "epoch": 0.56, "learning_rate": 2.1693179717899004e-06, "loss": 1.08, "step": 29468 }, { "epoch": 0.56, "learning_rate": 2.169166549170794e-06, "loss": 1.1922, "step": 29469 }, { "epoch": 0.56, "learning_rate": 2.169015127787009e-06, "loss": 1.0868, "step": 29470 }, { "epoch": 0.56, "learning_rate": 2.1688637076391108e-06, "loss": 0.9276, "step": 29471 }, { "epoch": 0.56, "learning_rate": 2.168712288727666e-06, "loss": 0.9268, "step": 29472 }, { "epoch": 0.56, "learning_rate": 2.1685608710532397e-06, "loss": 0.8956, "step": 29473 }, { "epoch": 0.56, "learning_rate": 2.1684094546163957e-06, "loss": 1.0372, "step": 29474 }, { "epoch": 0.56, "learning_rate": 2.1682580394177016e-06, "loss": 1.0475, "step": 29475 }, { "epoch": 0.56, "learning_rate": 2.168106625457722e-06, "loss": 0.8974, "step": 29476 }, { "epoch": 0.56, "learning_rate": 2.167955212737021e-06, "loss": 0.9568, "step": 29477 }, { "epoch": 0.56, "learning_rate": 2.1678038012561664e-06, "loss": 0.7009, "step": 29478 }, { "epoch": 0.56, "learning_rate": 2.1676523910157216e-06, "loss": 0.9245, "step": 29479 }, { "epoch": 0.56, "learning_rate": 2.167500982016252e-06, "loss": 1.0701, "step": 29480 }, { "epoch": 0.56, "learning_rate": 2.1673495742583243e-06, "loss": 1.1448, "step": 29481 }, { "epoch": 0.56, "learning_rate": 2.167198167742503e-06, "loss": 1.0156, "step": 29482 }, { "epoch": 0.56, "learning_rate": 2.167046762469353e-06, "loss": 0.9254, "step": 29483 }, { "epoch": 0.56, "learning_rate": 2.166895358439441e-06, "loss": 0.8127, "step": 29484 }, { "epoch": 0.56, "learning_rate": 2.166743955653331e-06, "loss": 0.9539, "step": 29485 }, { "epoch": 0.56, "learning_rate": 2.166592554111589e-06, "loss": 0.9781, "step": 29486 }, { "epoch": 0.56, "learning_rate": 2.16644115381478e-06, "loss": 0.9559, "step": 29487 }, { "epoch": 0.56, "learning_rate": 2.16628975476347e-06, "loss": 0.8932, "step": 29488 }, { "epoch": 0.56, "learning_rate": 2.1661383569582227e-06, "loss": 0.9082, "step": 29489 }, { "epoch": 0.56, "learning_rate": 2.165986960399606e-06, "loss": 0.9193, "step": 29490 }, { "epoch": 0.56, "learning_rate": 2.1658355650881836e-06, "loss": 0.7135, "step": 29491 }, { "epoch": 0.56, "learning_rate": 2.1656841710245196e-06, "loss": 0.8819, "step": 29492 }, { "epoch": 0.56, "learning_rate": 2.1655327782091815e-06, "loss": 0.9845, "step": 29493 }, { "epoch": 0.56, "learning_rate": 2.165381386642734e-06, "loss": 0.9229, "step": 29494 }, { "epoch": 0.56, "learning_rate": 2.1652299963257413e-06, "loss": 0.8457, "step": 29495 }, { "epoch": 0.56, "learning_rate": 2.1650786072587705e-06, "loss": 0.9119, "step": 29496 }, { "epoch": 0.56, "learning_rate": 2.164927219442386e-06, "loss": 0.8573, "step": 29497 }, { "epoch": 0.56, "learning_rate": 2.1647758328771518e-06, "loss": 0.9501, "step": 29498 }, { "epoch": 0.56, "learning_rate": 2.1646244475636355e-06, "loss": 0.7658, "step": 29499 }, { "epoch": 0.56, "learning_rate": 2.1644730635024007e-06, "loss": 1.1317, "step": 29500 }, { "epoch": 0.56, "learning_rate": 2.1643216806940127e-06, "loss": 1.1074, "step": 29501 }, { "epoch": 0.56, "learning_rate": 2.1641702991390382e-06, "loss": 0.9467, "step": 29502 }, { "epoch": 0.56, "learning_rate": 2.164018918838042e-06, "loss": 1.0206, "step": 29503 }, { "epoch": 0.56, "learning_rate": 2.163867539791587e-06, "loss": 0.6711, "step": 29504 }, { "epoch": 0.56, "learning_rate": 2.1637161620002415e-06, "loss": 0.6973, "step": 29505 }, { "epoch": 0.56, "learning_rate": 2.1635647854645696e-06, "loss": 0.9982, "step": 29506 }, { "epoch": 0.56, "learning_rate": 2.163413410185136e-06, "loss": 0.8772, "step": 29507 }, { "epoch": 0.56, "learning_rate": 2.1632620361625063e-06, "loss": 0.9146, "step": 29508 }, { "epoch": 0.56, "learning_rate": 2.163110663397247e-06, "loss": 0.8417, "step": 29509 }, { "epoch": 0.56, "learning_rate": 2.1629592918899205e-06, "loss": 0.8354, "step": 29510 }, { "epoch": 0.56, "learning_rate": 2.1628079216410948e-06, "loss": 1.0041, "step": 29511 }, { "epoch": 0.56, "learning_rate": 2.162656552651334e-06, "loss": 0.9711, "step": 29512 }, { "epoch": 0.56, "learning_rate": 2.1625051849212023e-06, "loss": 0.8831, "step": 29513 }, { "epoch": 0.56, "learning_rate": 2.1623538184512668e-06, "loss": 0.9397, "step": 29514 }, { "epoch": 0.56, "learning_rate": 2.1622024532420915e-06, "loss": 0.9214, "step": 29515 }, { "epoch": 0.56, "learning_rate": 2.1620510892942414e-06, "loss": 0.9035, "step": 29516 }, { "epoch": 0.56, "learning_rate": 2.1618997266082832e-06, "loss": 0.9342, "step": 29517 }, { "epoch": 0.56, "learning_rate": 2.161748365184781e-06, "loss": 0.9003, "step": 29518 }, { "epoch": 0.56, "learning_rate": 2.1615970050242995e-06, "loss": 0.9905, "step": 29519 }, { "epoch": 0.56, "learning_rate": 2.1614456461274043e-06, "loss": 1.0113, "step": 29520 }, { "epoch": 0.56, "learning_rate": 2.161294288494661e-06, "loss": 0.9947, "step": 29521 }, { "epoch": 0.56, "learning_rate": 2.1611429321266346e-06, "loss": 0.9459, "step": 29522 }, { "epoch": 0.56, "learning_rate": 2.160991577023889e-06, "loss": 0.7469, "step": 29523 }, { "epoch": 0.56, "learning_rate": 2.160840223186992e-06, "loss": 1.1404, "step": 29524 }, { "epoch": 0.56, "learning_rate": 2.1606888706165066e-06, "loss": 1.0836, "step": 29525 }, { "epoch": 0.56, "learning_rate": 2.1605375193129975e-06, "loss": 0.9606, "step": 29526 }, { "epoch": 0.56, "learning_rate": 2.160386169277032e-06, "loss": 0.7441, "step": 29527 }, { "epoch": 0.56, "learning_rate": 2.1602348205091746e-06, "loss": 1.0776, "step": 29528 }, { "epoch": 0.56, "learning_rate": 2.1600834730099886e-06, "loss": 0.8469, "step": 29529 }, { "epoch": 0.56, "learning_rate": 2.1599321267800412e-06, "loss": 1.2494, "step": 29530 }, { "epoch": 0.56, "learning_rate": 2.1597807818198975e-06, "loss": 1.1355, "step": 29531 }, { "epoch": 0.56, "learning_rate": 2.1596294381301207e-06, "loss": 1.043, "step": 29532 }, { "epoch": 0.56, "learning_rate": 2.159478095711278e-06, "loss": 0.7796, "step": 29533 }, { "epoch": 0.56, "learning_rate": 2.159326754563933e-06, "loss": 0.7908, "step": 29534 }, { "epoch": 0.56, "learning_rate": 2.1591754146886513e-06, "loss": 0.9457, "step": 29535 }, { "epoch": 0.56, "learning_rate": 2.159024076085999e-06, "loss": 0.7589, "step": 29536 }, { "epoch": 0.56, "learning_rate": 2.1588727387565404e-06, "loss": 0.8249, "step": 29537 }, { "epoch": 0.56, "learning_rate": 2.15872140270084e-06, "loss": 1.1992, "step": 29538 }, { "epoch": 0.56, "learning_rate": 2.1585700679194635e-06, "loss": 0.9443, "step": 29539 }, { "epoch": 0.56, "learning_rate": 2.158418734412976e-06, "loss": 0.9172, "step": 29540 }, { "epoch": 0.56, "learning_rate": 2.158267402181942e-06, "loss": 0.8583, "step": 29541 }, { "epoch": 0.56, "learning_rate": 2.1581160712269274e-06, "loss": 0.9253, "step": 29542 }, { "epoch": 0.56, "learning_rate": 2.1579647415484977e-06, "loss": 1.0749, "step": 29543 }, { "epoch": 0.56, "learning_rate": 2.1578134131472158e-06, "loss": 1.124, "step": 29544 }, { "epoch": 0.56, "learning_rate": 2.1576620860236487e-06, "loss": 0.9157, "step": 29545 }, { "epoch": 0.56, "learning_rate": 2.1575107601783616e-06, "loss": 0.8042, "step": 29546 }, { "epoch": 0.56, "learning_rate": 2.157359435611917e-06, "loss": 0.9137, "step": 29547 }, { "epoch": 0.56, "learning_rate": 2.1572081123248834e-06, "loss": 0.8343, "step": 29548 }, { "epoch": 0.56, "learning_rate": 2.157056790317824e-06, "loss": 0.9775, "step": 29549 }, { "epoch": 0.56, "learning_rate": 2.156905469591303e-06, "loss": 1.2362, "step": 29550 }, { "epoch": 0.56, "learning_rate": 2.1567541501458876e-06, "loss": 0.7655, "step": 29551 }, { "epoch": 0.56, "learning_rate": 2.1566028319821415e-06, "loss": 0.9775, "step": 29552 }, { "epoch": 0.56, "learning_rate": 2.1564515151006292e-06, "loss": 1.0705, "step": 29553 }, { "epoch": 0.56, "learning_rate": 2.1563001995019174e-06, "loss": 0.8105, "step": 29554 }, { "epoch": 0.56, "learning_rate": 2.1561488851865694e-06, "loss": 1.0374, "step": 29555 }, { "epoch": 0.56, "learning_rate": 2.1559975721551505e-06, "loss": 0.9455, "step": 29556 }, { "epoch": 0.56, "learning_rate": 2.1558462604082274e-06, "loss": 0.9162, "step": 29557 }, { "epoch": 0.56, "learning_rate": 2.1556949499463634e-06, "loss": 1.0103, "step": 29558 }, { "epoch": 0.56, "learning_rate": 2.155543640770123e-06, "loss": 0.9324, "step": 29559 }, { "epoch": 0.56, "learning_rate": 2.155392332880073e-06, "loss": 0.9562, "step": 29560 }, { "epoch": 0.56, "learning_rate": 2.155241026276777e-06, "loss": 0.9422, "step": 29561 }, { "epoch": 0.56, "learning_rate": 2.155089720960801e-06, "loss": 1.1054, "step": 29562 }, { "epoch": 0.56, "learning_rate": 2.1549384169327086e-06, "loss": 1.0444, "step": 29563 }, { "epoch": 0.56, "learning_rate": 2.1547871141930665e-06, "loss": 0.9272, "step": 29564 }, { "epoch": 0.56, "learning_rate": 2.1546358127424375e-06, "loss": 0.9033, "step": 29565 }, { "epoch": 0.56, "learning_rate": 2.154484512581389e-06, "loss": 0.7562, "step": 29566 }, { "epoch": 0.56, "learning_rate": 2.154333213710485e-06, "loss": 0.819, "step": 29567 }, { "epoch": 0.56, "learning_rate": 2.1541819161302886e-06, "loss": 0.9158, "step": 29568 }, { "epoch": 0.56, "learning_rate": 2.154030619841367e-06, "loss": 0.9565, "step": 29569 }, { "epoch": 0.56, "learning_rate": 2.153879324844285e-06, "loss": 0.711, "step": 29570 }, { "epoch": 0.56, "learning_rate": 2.153728031139606e-06, "loss": 0.9464, "step": 29571 }, { "epoch": 0.56, "learning_rate": 2.153576738727897e-06, "loss": 0.9478, "step": 29572 }, { "epoch": 0.56, "learning_rate": 2.1534254476097215e-06, "loss": 0.7997, "step": 29573 }, { "epoch": 0.56, "learning_rate": 2.153274157785644e-06, "loss": 0.9305, "step": 29574 }, { "epoch": 0.56, "learning_rate": 2.1531228692562313e-06, "loss": 0.9915, "step": 29575 }, { "epoch": 0.56, "learning_rate": 2.1529715820220466e-06, "loss": 1.0547, "step": 29576 }, { "epoch": 0.56, "learning_rate": 2.1528202960836546e-06, "loss": 1.0474, "step": 29577 }, { "epoch": 0.56, "learning_rate": 2.1526690114416223e-06, "loss": 0.8773, "step": 29578 }, { "epoch": 0.56, "learning_rate": 2.152517728096513e-06, "loss": 0.8762, "step": 29579 }, { "epoch": 0.56, "learning_rate": 2.152366446048891e-06, "loss": 0.8752, "step": 29580 }, { "epoch": 0.56, "learning_rate": 2.152215165299323e-06, "loss": 1.0631, "step": 29581 }, { "epoch": 0.56, "learning_rate": 2.152063885848373e-06, "loss": 0.9477, "step": 29582 }, { "epoch": 0.56, "learning_rate": 2.1519126076966048e-06, "loss": 1.0239, "step": 29583 }, { "epoch": 0.56, "learning_rate": 2.1517613308445846e-06, "loss": 0.8789, "step": 29584 }, { "epoch": 0.56, "learning_rate": 2.1516100552928778e-06, "loss": 0.8552, "step": 29585 }, { "epoch": 0.56, "learning_rate": 2.1514587810420467e-06, "loss": 0.9763, "step": 29586 }, { "epoch": 0.56, "learning_rate": 2.1513075080926592e-06, "loss": 0.9694, "step": 29587 }, { "epoch": 0.56, "learning_rate": 2.151156236445279e-06, "loss": 0.7696, "step": 29588 }, { "epoch": 0.56, "learning_rate": 2.1510049661004694e-06, "loss": 0.9037, "step": 29589 }, { "epoch": 0.56, "learning_rate": 2.150853697058797e-06, "loss": 0.9106, "step": 29590 }, { "epoch": 0.56, "learning_rate": 2.150702429320827e-06, "loss": 0.9023, "step": 29591 }, { "epoch": 0.56, "learning_rate": 2.150551162887122e-06, "loss": 0.7843, "step": 29592 }, { "epoch": 0.56, "learning_rate": 2.1503998977582496e-06, "loss": 1.1082, "step": 29593 }, { "epoch": 0.56, "learning_rate": 2.150248633934773e-06, "loss": 0.97, "step": 29594 }, { "epoch": 0.56, "learning_rate": 2.1500973714172567e-06, "loss": 1.0955, "step": 29595 }, { "epoch": 0.56, "learning_rate": 2.149946110206267e-06, "loss": 0.7902, "step": 29596 }, { "epoch": 0.56, "learning_rate": 2.149794850302367e-06, "loss": 0.7791, "step": 29597 }, { "epoch": 0.56, "learning_rate": 2.1496435917061214e-06, "loss": 0.7733, "step": 29598 }, { "epoch": 0.56, "learning_rate": 2.1494923344180974e-06, "loss": 0.862, "step": 29599 }, { "epoch": 0.56, "learning_rate": 2.1493410784388584e-06, "loss": 1.0633, "step": 29600 }, { "epoch": 0.56, "learning_rate": 2.149189823768968e-06, "loss": 0.8231, "step": 29601 }, { "epoch": 0.56, "learning_rate": 2.149038570408993e-06, "loss": 0.7423, "step": 29602 }, { "epoch": 0.56, "learning_rate": 2.1488873183594967e-06, "loss": 0.7097, "step": 29603 }, { "epoch": 0.56, "learning_rate": 2.1487360676210445e-06, "loss": 0.8321, "step": 29604 }, { "epoch": 0.56, "learning_rate": 2.1485848181942008e-06, "loss": 1.0032, "step": 29605 }, { "epoch": 0.56, "learning_rate": 2.148433570079531e-06, "loss": 1.2071, "step": 29606 }, { "epoch": 0.56, "learning_rate": 2.148282323277599e-06, "loss": 0.8552, "step": 29607 }, { "epoch": 0.56, "learning_rate": 2.1481310777889703e-06, "loss": 0.8404, "step": 29608 }, { "epoch": 0.56, "learning_rate": 2.1479798336142103e-06, "loss": 0.8913, "step": 29609 }, { "epoch": 0.56, "learning_rate": 2.147828590753881e-06, "loss": 0.7311, "step": 29610 }, { "epoch": 0.56, "learning_rate": 2.1476773492085498e-06, "loss": 1.05, "step": 29611 }, { "epoch": 0.56, "learning_rate": 2.147526108978781e-06, "loss": 1.0929, "step": 29612 }, { "epoch": 0.56, "learning_rate": 2.1473748700651378e-06, "loss": 0.9814, "step": 29613 }, { "epoch": 0.56, "learning_rate": 2.147223632468187e-06, "loss": 0.9371, "step": 29614 }, { "epoch": 0.56, "learning_rate": 2.1470723961884928e-06, "loss": 1.0634, "step": 29615 }, { "epoch": 0.56, "learning_rate": 2.146921161226618e-06, "loss": 0.8757, "step": 29616 }, { "epoch": 0.56, "learning_rate": 2.14676992758313e-06, "loss": 0.9084, "step": 29617 }, { "epoch": 0.56, "learning_rate": 2.1466186952585916e-06, "loss": 1.0735, "step": 29618 }, { "epoch": 0.56, "learning_rate": 2.1464674642535676e-06, "loss": 1.0782, "step": 29619 }, { "epoch": 0.56, "learning_rate": 2.1463162345686246e-06, "loss": 1.0079, "step": 29620 }, { "epoch": 0.56, "learning_rate": 2.1461650062043257e-06, "loss": 0.7665, "step": 29621 }, { "epoch": 0.56, "learning_rate": 2.1460137791612344e-06, "loss": 0.9147, "step": 29622 }, { "epoch": 0.56, "learning_rate": 2.1458625534399185e-06, "loss": 0.8353, "step": 29623 }, { "epoch": 0.56, "learning_rate": 2.1457113290409405e-06, "loss": 0.9225, "step": 29624 }, { "epoch": 0.56, "learning_rate": 2.145560105964865e-06, "loss": 0.8153, "step": 29625 }, { "epoch": 0.56, "learning_rate": 2.1454088842122574e-06, "loss": 0.8743, "step": 29626 }, { "epoch": 0.56, "learning_rate": 2.1452576637836824e-06, "loss": 0.9347, "step": 29627 }, { "epoch": 0.56, "learning_rate": 2.145106444679704e-06, "loss": 1.0297, "step": 29628 }, { "epoch": 0.56, "learning_rate": 2.144955226900888e-06, "loss": 0.7481, "step": 29629 }, { "epoch": 0.56, "learning_rate": 2.144804010447798e-06, "loss": 0.809, "step": 29630 }, { "epoch": 0.56, "learning_rate": 2.144652795320998e-06, "loss": 1.0582, "step": 29631 }, { "epoch": 0.56, "learning_rate": 2.144501581521054e-06, "loss": 1.0189, "step": 29632 }, { "epoch": 0.56, "learning_rate": 2.144350369048531e-06, "loss": 0.9089, "step": 29633 }, { "epoch": 0.56, "learning_rate": 2.144199157903992e-06, "loss": 0.7208, "step": 29634 }, { "epoch": 0.56, "learning_rate": 2.1440479480880033e-06, "loss": 1.0031, "step": 29635 }, { "epoch": 0.56, "learning_rate": 2.1438967396011283e-06, "loss": 1.0148, "step": 29636 }, { "epoch": 0.56, "learning_rate": 2.143745532443931e-06, "loss": 0.9342, "step": 29637 }, { "epoch": 0.56, "learning_rate": 2.1435943266169784e-06, "loss": 0.8842, "step": 29638 }, { "epoch": 0.56, "learning_rate": 2.143443122120833e-06, "loss": 0.8757, "step": 29639 }, { "epoch": 0.56, "learning_rate": 2.143291918956059e-06, "loss": 0.8054, "step": 29640 }, { "epoch": 0.56, "learning_rate": 2.143140717123224e-06, "loss": 0.9504, "step": 29641 }, { "epoch": 0.56, "learning_rate": 2.14298951662289e-06, "loss": 1.0474, "step": 29642 }, { "epoch": 0.56, "learning_rate": 2.142838317455621e-06, "loss": 1.0662, "step": 29643 }, { "epoch": 0.56, "learning_rate": 2.142687119621984e-06, "loss": 0.8783, "step": 29644 }, { "epoch": 0.56, "learning_rate": 2.142535923122542e-06, "loss": 0.6318, "step": 29645 }, { "epoch": 0.56, "learning_rate": 2.14238472795786e-06, "loss": 0.9453, "step": 29646 }, { "epoch": 0.56, "learning_rate": 2.1422335341285024e-06, "loss": 0.8727, "step": 29647 }, { "epoch": 0.56, "learning_rate": 2.1420823416350337e-06, "loss": 0.8223, "step": 29648 }, { "epoch": 0.56, "learning_rate": 2.1419311504780183e-06, "loss": 0.8405, "step": 29649 }, { "epoch": 0.56, "learning_rate": 2.141779960658022e-06, "loss": 1.0785, "step": 29650 }, { "epoch": 0.56, "learning_rate": 2.141628772175608e-06, "loss": 0.9596, "step": 29651 }, { "epoch": 0.56, "learning_rate": 2.1414775850313403e-06, "loss": 0.8602, "step": 29652 }, { "epoch": 0.56, "learning_rate": 2.1413263992257846e-06, "loss": 0.9616, "step": 29653 }, { "epoch": 0.56, "learning_rate": 2.1411752147595057e-06, "loss": 0.8204, "step": 29654 }, { "epoch": 0.56, "learning_rate": 2.1410240316330664e-06, "loss": 1.1239, "step": 29655 }, { "epoch": 0.56, "learning_rate": 2.140872849847034e-06, "loss": 1.1293, "step": 29656 }, { "epoch": 0.56, "learning_rate": 2.140721669401971e-06, "loss": 1.0489, "step": 29657 }, { "epoch": 0.56, "learning_rate": 2.1405704902984412e-06, "loss": 0.9366, "step": 29658 }, { "epoch": 0.56, "learning_rate": 2.1404193125370113e-06, "loss": 0.9837, "step": 29659 }, { "epoch": 0.56, "learning_rate": 2.140268136118244e-06, "loss": 0.8111, "step": 29660 }, { "epoch": 0.56, "learning_rate": 2.140116961042704e-06, "loss": 1.002, "step": 29661 }, { "epoch": 0.56, "learning_rate": 2.139965787310957e-06, "loss": 1.0513, "step": 29662 }, { "epoch": 0.56, "learning_rate": 2.1398146149235676e-06, "loss": 0.975, "step": 29663 }, { "epoch": 0.56, "learning_rate": 2.1396634438810977e-06, "loss": 0.7342, "step": 29664 }, { "epoch": 0.56, "learning_rate": 2.1395122741841143e-06, "loss": 0.9919, "step": 29665 }, { "epoch": 0.56, "learning_rate": 2.1393611058331806e-06, "loss": 0.8163, "step": 29666 }, { "epoch": 0.56, "learning_rate": 2.1392099388288616e-06, "loss": 0.8763, "step": 29667 }, { "epoch": 0.56, "learning_rate": 2.1390587731717218e-06, "loss": 1.0417, "step": 29668 }, { "epoch": 0.56, "learning_rate": 2.1389076088623257e-06, "loss": 0.8619, "step": 29669 }, { "epoch": 0.56, "learning_rate": 2.1387564459012367e-06, "loss": 1.0399, "step": 29670 }, { "epoch": 0.56, "learning_rate": 2.138605284289021e-06, "loss": 0.9092, "step": 29671 }, { "epoch": 0.56, "learning_rate": 2.138454124026242e-06, "loss": 0.9495, "step": 29672 }, { "epoch": 0.56, "learning_rate": 2.138302965113463e-06, "loss": 0.8254, "step": 29673 }, { "epoch": 0.56, "learning_rate": 2.1381518075512506e-06, "loss": 1.1423, "step": 29674 }, { "epoch": 0.56, "learning_rate": 2.1380006513401685e-06, "loss": 1.1075, "step": 29675 }, { "epoch": 0.56, "learning_rate": 2.1378494964807798e-06, "loss": 0.7533, "step": 29676 }, { "epoch": 0.56, "learning_rate": 2.1376983429736512e-06, "loss": 0.8467, "step": 29677 }, { "epoch": 0.56, "learning_rate": 2.137547190819346e-06, "loss": 0.9709, "step": 29678 }, { "epoch": 0.56, "learning_rate": 2.1373960400184273e-06, "loss": 0.8001, "step": 29679 }, { "epoch": 0.56, "learning_rate": 2.1372448905714614e-06, "loss": 0.921, "step": 29680 }, { "epoch": 0.56, "learning_rate": 2.137093742479012e-06, "loss": 1.1473, "step": 29681 }, { "epoch": 0.56, "learning_rate": 2.1369425957416424e-06, "loss": 1.0684, "step": 29682 }, { "epoch": 0.56, "learning_rate": 2.1367914503599193e-06, "loss": 0.9857, "step": 29683 }, { "epoch": 0.56, "learning_rate": 2.136640306334406e-06, "loss": 1.029, "step": 29684 }, { "epoch": 0.56, "learning_rate": 2.136489163665665e-06, "loss": 0.9176, "step": 29685 }, { "epoch": 0.56, "learning_rate": 2.136338022354264e-06, "loss": 0.7784, "step": 29686 }, { "epoch": 0.56, "learning_rate": 2.1361868824007648e-06, "loss": 1.1532, "step": 29687 }, { "epoch": 0.56, "learning_rate": 2.1360357438057326e-06, "loss": 1.109, "step": 29688 }, { "epoch": 0.56, "learning_rate": 2.135884606569732e-06, "loss": 1.0157, "step": 29689 }, { "epoch": 0.56, "learning_rate": 2.1357334706933276e-06, "loss": 0.8289, "step": 29690 }, { "epoch": 0.56, "learning_rate": 2.1355823361770818e-06, "loss": 0.9371, "step": 29691 }, { "epoch": 0.56, "learning_rate": 2.1354312030215618e-06, "loss": 0.5652, "step": 29692 }, { "epoch": 0.56, "learning_rate": 2.135280071227331e-06, "loss": 0.9839, "step": 29693 }, { "epoch": 0.56, "learning_rate": 2.1351289407949515e-06, "loss": 0.9299, "step": 29694 }, { "epoch": 0.56, "learning_rate": 2.13497781172499e-06, "loss": 0.8508, "step": 29695 }, { "epoch": 0.56, "learning_rate": 2.1348266840180106e-06, "loss": 0.8341, "step": 29696 }, { "epoch": 0.56, "learning_rate": 2.134675557674576e-06, "loss": 1.1055, "step": 29697 }, { "epoch": 0.56, "learning_rate": 2.134524432695253e-06, "loss": 0.9514, "step": 29698 }, { "epoch": 0.56, "learning_rate": 2.1343733090806044e-06, "loss": 0.7889, "step": 29699 }, { "epoch": 0.56, "learning_rate": 2.134222186831194e-06, "loss": 0.8544, "step": 29700 }, { "epoch": 0.56, "learning_rate": 2.1340710659475876e-06, "loss": 0.9725, "step": 29701 }, { "epoch": 0.56, "learning_rate": 2.133919946430348e-06, "loss": 0.9553, "step": 29702 }, { "epoch": 0.56, "learning_rate": 2.133768828280039e-06, "loss": 0.7655, "step": 29703 }, { "epoch": 0.56, "learning_rate": 2.133617711497228e-06, "loss": 0.8224, "step": 29704 }, { "epoch": 0.56, "learning_rate": 2.133466596082477e-06, "loss": 0.903, "step": 29705 }, { "epoch": 0.56, "learning_rate": 2.1333154820363487e-06, "loss": 1.0071, "step": 29706 }, { "epoch": 0.56, "learning_rate": 2.133164369359411e-06, "loss": 1.0763, "step": 29707 }, { "epoch": 0.56, "learning_rate": 2.1330132580522257e-06, "loss": 0.6689, "step": 29708 }, { "epoch": 0.56, "learning_rate": 2.1328621481153573e-06, "loss": 0.9438, "step": 29709 }, { "epoch": 0.56, "learning_rate": 2.1327110395493706e-06, "loss": 0.7916, "step": 29710 }, { "epoch": 0.56, "learning_rate": 2.13255993235483e-06, "loss": 1.0691, "step": 29711 }, { "epoch": 0.56, "learning_rate": 2.1324088265322985e-06, "loss": 1.0455, "step": 29712 }, { "epoch": 0.56, "learning_rate": 2.1322577220823422e-06, "loss": 0.7897, "step": 29713 }, { "epoch": 0.56, "learning_rate": 2.1321066190055238e-06, "loss": 0.937, "step": 29714 }, { "epoch": 0.56, "learning_rate": 2.1319555173024077e-06, "loss": 0.8568, "step": 29715 }, { "epoch": 0.56, "learning_rate": 2.1318044169735585e-06, "loss": 0.9752, "step": 29716 }, { "epoch": 0.56, "learning_rate": 2.1316533180195408e-06, "loss": 0.8578, "step": 29717 }, { "epoch": 0.56, "learning_rate": 2.1315022204409173e-06, "loss": 1.1592, "step": 29718 }, { "epoch": 0.56, "learning_rate": 2.1313511242382545e-06, "loss": 0.9562, "step": 29719 }, { "epoch": 0.56, "learning_rate": 2.131200029412115e-06, "loss": 0.9948, "step": 29720 }, { "epoch": 0.56, "learning_rate": 2.1310489359630627e-06, "loss": 1.0012, "step": 29721 }, { "epoch": 0.56, "learning_rate": 2.1308978438916632e-06, "loss": 1.0836, "step": 29722 }, { "epoch": 0.56, "learning_rate": 2.1307467531984787e-06, "loss": 0.8217, "step": 29723 }, { "epoch": 0.56, "learning_rate": 2.1305956638840746e-06, "loss": 0.7934, "step": 29724 }, { "epoch": 0.56, "learning_rate": 2.130444575949016e-06, "loss": 0.9843, "step": 29725 }, { "epoch": 0.56, "learning_rate": 2.130293489393866e-06, "loss": 0.9478, "step": 29726 }, { "epoch": 0.56, "learning_rate": 2.130142404219188e-06, "loss": 0.8799, "step": 29727 }, { "epoch": 0.56, "learning_rate": 2.1299913204255474e-06, "loss": 0.6934, "step": 29728 }, { "epoch": 0.56, "learning_rate": 2.1298402380135076e-06, "loss": 0.7943, "step": 29729 }, { "epoch": 0.56, "learning_rate": 2.129689156983633e-06, "loss": 0.8145, "step": 29730 }, { "epoch": 0.56, "learning_rate": 2.1295380773364873e-06, "loss": 1.1672, "step": 29731 }, { "epoch": 0.56, "learning_rate": 2.1293869990726363e-06, "loss": 0.9089, "step": 29732 }, { "epoch": 0.56, "learning_rate": 2.129235922192641e-06, "loss": 1.038, "step": 29733 }, { "epoch": 0.56, "learning_rate": 2.129084846697069e-06, "loss": 0.8226, "step": 29734 }, { "epoch": 0.56, "learning_rate": 2.1289337725864832e-06, "loss": 0.9977, "step": 29735 }, { "epoch": 0.56, "learning_rate": 2.128782699861446e-06, "loss": 0.7568, "step": 29736 }, { "epoch": 0.56, "learning_rate": 2.128631628522523e-06, "loss": 1.349, "step": 29737 }, { "epoch": 0.56, "learning_rate": 2.1284805585702785e-06, "loss": 1.2611, "step": 29738 }, { "epoch": 0.56, "learning_rate": 2.128329490005276e-06, "loss": 0.7748, "step": 29739 }, { "epoch": 0.56, "learning_rate": 2.12817842282808e-06, "loss": 0.9086, "step": 29740 }, { "epoch": 0.56, "learning_rate": 2.1280273570392547e-06, "loss": 0.5776, "step": 29741 }, { "epoch": 0.56, "learning_rate": 2.1278762926393625e-06, "loss": 0.8819, "step": 29742 }, { "epoch": 0.56, "learning_rate": 2.12772522962897e-06, "loss": 1.0496, "step": 29743 }, { "epoch": 0.56, "learning_rate": 2.1275741680086402e-06, "loss": 1.032, "step": 29744 }, { "epoch": 0.56, "learning_rate": 2.127423107778936e-06, "loss": 0.8598, "step": 29745 }, { "epoch": 0.56, "learning_rate": 2.127272048940423e-06, "loss": 0.8073, "step": 29746 }, { "epoch": 0.56, "learning_rate": 2.127120991493666e-06, "loss": 0.9863, "step": 29747 }, { "epoch": 0.56, "learning_rate": 2.1269699354392256e-06, "loss": 0.8425, "step": 29748 }, { "epoch": 0.56, "learning_rate": 2.1268188807776694e-06, "loss": 0.8361, "step": 29749 }, { "epoch": 0.56, "learning_rate": 2.12666782750956e-06, "loss": 1.0114, "step": 29750 }, { "epoch": 0.56, "learning_rate": 2.1265167756354618e-06, "loss": 0.8914, "step": 29751 }, { "epoch": 0.56, "learning_rate": 2.126365725155937e-06, "loss": 0.7556, "step": 29752 }, { "epoch": 0.56, "learning_rate": 2.126214676071552e-06, "loss": 0.9528, "step": 29753 }, { "epoch": 0.56, "learning_rate": 2.126063628382871e-06, "loss": 0.7703, "step": 29754 }, { "epoch": 0.56, "learning_rate": 2.1259125820904554e-06, "loss": 0.9861, "step": 29755 }, { "epoch": 0.56, "learning_rate": 2.1257615371948715e-06, "loss": 1.2556, "step": 29756 }, { "epoch": 0.56, "learning_rate": 2.125610493696682e-06, "loss": 0.8884, "step": 29757 }, { "epoch": 0.56, "learning_rate": 2.125459451596451e-06, "loss": 0.8325, "step": 29758 }, { "epoch": 0.56, "learning_rate": 2.1253084108947446e-06, "loss": 1.0253, "step": 29759 }, { "epoch": 0.56, "learning_rate": 2.1251573715921244e-06, "loss": 0.8817, "step": 29760 }, { "epoch": 0.56, "learning_rate": 2.1250063336891545e-06, "loss": 0.8132, "step": 29761 }, { "epoch": 0.56, "learning_rate": 2.1248552971864e-06, "loss": 1.1727, "step": 29762 }, { "epoch": 0.56, "learning_rate": 2.124704262084424e-06, "loss": 1.1431, "step": 29763 }, { "epoch": 0.56, "learning_rate": 2.124553228383791e-06, "loss": 1.0022, "step": 29764 }, { "epoch": 0.56, "learning_rate": 2.1244021960850644e-06, "loss": 0.9925, "step": 29765 }, { "epoch": 0.56, "learning_rate": 2.124251165188809e-06, "loss": 0.9659, "step": 29766 }, { "epoch": 0.56, "learning_rate": 2.1241001356955876e-06, "loss": 0.7193, "step": 29767 }, { "epoch": 0.56, "learning_rate": 2.1239491076059657e-06, "loss": 0.9628, "step": 29768 }, { "epoch": 0.56, "learning_rate": 2.123798080920506e-06, "loss": 1.0038, "step": 29769 }, { "epoch": 0.56, "learning_rate": 2.123647055639772e-06, "loss": 0.8994, "step": 29770 }, { "epoch": 0.56, "learning_rate": 2.1234960317643284e-06, "loss": 0.9981, "step": 29771 }, { "epoch": 0.56, "learning_rate": 2.12334500929474e-06, "loss": 0.8878, "step": 29772 }, { "epoch": 0.56, "learning_rate": 2.1231939882315687e-06, "loss": 0.7458, "step": 29773 }, { "epoch": 0.56, "learning_rate": 2.1230429685753804e-06, "loss": 0.9697, "step": 29774 }, { "epoch": 0.56, "learning_rate": 2.1228919503267386e-06, "loss": 0.767, "step": 29775 }, { "epoch": 0.56, "learning_rate": 2.122740933486205e-06, "loss": 0.98, "step": 29776 }, { "epoch": 0.56, "learning_rate": 2.1225899180543468e-06, "loss": 0.8243, "step": 29777 }, { "epoch": 0.56, "learning_rate": 2.1224389040317255e-06, "loss": 0.7693, "step": 29778 }, { "epoch": 0.56, "learning_rate": 2.122287891418905e-06, "loss": 0.9783, "step": 29779 }, { "epoch": 0.56, "learning_rate": 2.122136880216451e-06, "loss": 0.8299, "step": 29780 }, { "epoch": 0.56, "learning_rate": 2.1219858704249267e-06, "loss": 0.9272, "step": 29781 }, { "epoch": 0.56, "learning_rate": 2.1218348620448942e-06, "loss": 0.759, "step": 29782 }, { "epoch": 0.56, "learning_rate": 2.12168385507692e-06, "loss": 0.8455, "step": 29783 }, { "epoch": 0.56, "learning_rate": 2.1215328495215656e-06, "loss": 1.014, "step": 29784 }, { "epoch": 0.56, "learning_rate": 2.1213818453793965e-06, "loss": 1.0284, "step": 29785 }, { "epoch": 0.56, "learning_rate": 2.1212308426509757e-06, "loss": 0.853, "step": 29786 }, { "epoch": 0.56, "learning_rate": 2.121079841336868e-06, "loss": 1.082, "step": 29787 }, { "epoch": 0.56, "learning_rate": 2.1209288414376355e-06, "loss": 1.0516, "step": 29788 }, { "epoch": 0.56, "learning_rate": 2.120777842953844e-06, "loss": 1.0995, "step": 29789 }, { "epoch": 0.56, "learning_rate": 2.120626845886057e-06, "loss": 0.9516, "step": 29790 }, { "epoch": 0.56, "learning_rate": 2.120475850234836e-06, "loss": 0.8007, "step": 29791 }, { "epoch": 0.56, "learning_rate": 2.1203248560007473e-06, "loss": 1.1534, "step": 29792 }, { "epoch": 0.56, "learning_rate": 2.1201738631843544e-06, "loss": 1.1102, "step": 29793 }, { "epoch": 0.56, "learning_rate": 2.1200228717862195e-06, "loss": 1.0328, "step": 29794 }, { "epoch": 0.56, "learning_rate": 2.1198718818069088e-06, "loss": 1.0157, "step": 29795 }, { "epoch": 0.56, "learning_rate": 2.1197208932469847e-06, "loss": 0.9257, "step": 29796 }, { "epoch": 0.56, "learning_rate": 2.1195699061070102e-06, "loss": 1.0814, "step": 29797 }, { "epoch": 0.56, "learning_rate": 2.119418920387551e-06, "loss": 0.7357, "step": 29798 }, { "epoch": 0.56, "learning_rate": 2.119267936089169e-06, "loss": 1.2585, "step": 29799 }, { "epoch": 0.56, "learning_rate": 2.119116953212429e-06, "loss": 1.1331, "step": 29800 }, { "epoch": 0.56, "learning_rate": 2.1189659717578953e-06, "loss": 0.841, "step": 29801 }, { "epoch": 0.56, "learning_rate": 2.118814991726131e-06, "loss": 0.8856, "step": 29802 }, { "epoch": 0.56, "learning_rate": 2.118664013117699e-06, "loss": 1.0072, "step": 29803 }, { "epoch": 0.56, "learning_rate": 2.1185130359331644e-06, "loss": 0.7886, "step": 29804 }, { "epoch": 0.56, "learning_rate": 2.1183620601730907e-06, "loss": 0.9667, "step": 29805 }, { "epoch": 0.56, "learning_rate": 2.1182110858380406e-06, "loss": 0.9193, "step": 29806 }, { "epoch": 0.56, "learning_rate": 2.118060112928579e-06, "loss": 0.923, "step": 29807 }, { "epoch": 0.56, "learning_rate": 2.1179091414452697e-06, "loss": 0.7945, "step": 29808 }, { "epoch": 0.56, "learning_rate": 2.1177581713886745e-06, "loss": 0.8583, "step": 29809 }, { "epoch": 0.56, "learning_rate": 2.1176072027593603e-06, "loss": 0.8285, "step": 29810 }, { "epoch": 0.56, "learning_rate": 2.1174562355578887e-06, "loss": 0.8453, "step": 29811 }, { "epoch": 0.56, "learning_rate": 2.117305269784823e-06, "loss": 1.0722, "step": 29812 }, { "epoch": 0.56, "learning_rate": 2.1171543054407277e-06, "loss": 1.0593, "step": 29813 }, { "epoch": 0.56, "learning_rate": 2.117003342526168e-06, "loss": 0.9052, "step": 29814 }, { "epoch": 0.56, "learning_rate": 2.1168523810417036e-06, "loss": 0.8312, "step": 29815 }, { "epoch": 0.56, "learning_rate": 2.1167014209879026e-06, "loss": 0.8439, "step": 29816 }, { "epoch": 0.56, "learning_rate": 2.116550462365327e-06, "loss": 0.932, "step": 29817 }, { "epoch": 0.56, "learning_rate": 2.1163995051745383e-06, "loss": 0.9798, "step": 29818 }, { "epoch": 0.56, "learning_rate": 2.116248549416104e-06, "loss": 1.0697, "step": 29819 }, { "epoch": 0.56, "learning_rate": 2.116097595090585e-06, "loss": 0.7522, "step": 29820 }, { "epoch": 0.56, "learning_rate": 2.115946642198545e-06, "loss": 0.9992, "step": 29821 }, { "epoch": 0.56, "learning_rate": 2.11579569074055e-06, "loss": 0.9653, "step": 29822 }, { "epoch": 0.56, "learning_rate": 2.1156447407171614e-06, "loss": 0.7506, "step": 29823 }, { "epoch": 0.56, "learning_rate": 2.1154937921289432e-06, "loss": 0.9847, "step": 29824 }, { "epoch": 0.56, "learning_rate": 2.1153428449764603e-06, "loss": 1.0942, "step": 29825 }, { "epoch": 0.56, "learning_rate": 2.1151918992602746e-06, "loss": 0.7821, "step": 29826 }, { "epoch": 0.56, "learning_rate": 2.1150409549809507e-06, "loss": 0.7495, "step": 29827 }, { "epoch": 0.56, "learning_rate": 2.1148900121390524e-06, "loss": 1.0793, "step": 29828 }, { "epoch": 0.56, "learning_rate": 2.114739070735143e-06, "loss": 0.8773, "step": 29829 }, { "epoch": 0.56, "learning_rate": 2.1145881307697852e-06, "loss": 0.9982, "step": 29830 }, { "epoch": 0.56, "learning_rate": 2.1144371922435447e-06, "loss": 1.0001, "step": 29831 }, { "epoch": 0.56, "learning_rate": 2.1142862551569836e-06, "loss": 0.9241, "step": 29832 }, { "epoch": 0.56, "learning_rate": 2.1141353195106653e-06, "loss": 0.8944, "step": 29833 }, { "epoch": 0.56, "learning_rate": 2.113984385305154e-06, "loss": 0.9, "step": 29834 }, { "epoch": 0.56, "learning_rate": 2.1138334525410137e-06, "loss": 0.6645, "step": 29835 }, { "epoch": 0.56, "learning_rate": 2.1136825212188066e-06, "loss": 0.8799, "step": 29836 }, { "epoch": 0.56, "learning_rate": 2.113531591339098e-06, "loss": 1.0328, "step": 29837 }, { "epoch": 0.56, "learning_rate": 2.1133806629024504e-06, "loss": 1.0321, "step": 29838 }, { "epoch": 0.56, "learning_rate": 2.113229735909427e-06, "loss": 0.8699, "step": 29839 }, { "epoch": 0.56, "learning_rate": 2.1130788103605927e-06, "loss": 0.8985, "step": 29840 }, { "epoch": 0.56, "learning_rate": 2.11292788625651e-06, "loss": 0.8658, "step": 29841 }, { "epoch": 0.56, "learning_rate": 2.1127769635977417e-06, "loss": 0.7558, "step": 29842 }, { "epoch": 0.56, "learning_rate": 2.1126260423848534e-06, "loss": 1.176, "step": 29843 }, { "epoch": 0.56, "learning_rate": 2.112475122618408e-06, "loss": 1.0074, "step": 29844 }, { "epoch": 0.56, "learning_rate": 2.1123242042989673e-06, "loss": 0.8154, "step": 29845 }, { "epoch": 0.56, "learning_rate": 2.1121732874270974e-06, "loss": 0.897, "step": 29846 }, { "epoch": 0.56, "learning_rate": 2.1120223720033594e-06, "loss": 0.6532, "step": 29847 }, { "epoch": 0.56, "learning_rate": 2.1118714580283185e-06, "loss": 0.9709, "step": 29848 }, { "epoch": 0.56, "learning_rate": 2.111720545502538e-06, "loss": 1.115, "step": 29849 }, { "epoch": 0.56, "learning_rate": 2.111569634426581e-06, "loss": 1.2101, "step": 29850 }, { "epoch": 0.56, "learning_rate": 2.1114187248010102e-06, "loss": 0.8704, "step": 29851 }, { "epoch": 0.56, "learning_rate": 2.1112678166263908e-06, "loss": 1.0649, "step": 29852 }, { "epoch": 0.56, "learning_rate": 2.111116909903286e-06, "loss": 0.8633, "step": 29853 }, { "epoch": 0.56, "learning_rate": 2.1109660046322573e-06, "loss": 1.0528, "step": 29854 }, { "epoch": 0.56, "learning_rate": 2.11081510081387e-06, "loss": 1.0386, "step": 29855 }, { "epoch": 0.56, "learning_rate": 2.110664198448688e-06, "loss": 1.0482, "step": 29856 }, { "epoch": 0.56, "learning_rate": 2.110513297537273e-06, "loss": 1.1523, "step": 29857 }, { "epoch": 0.56, "learning_rate": 2.1103623980801902e-06, "loss": 0.7605, "step": 29858 }, { "epoch": 0.56, "learning_rate": 2.1102115000780023e-06, "loss": 0.7679, "step": 29859 }, { "epoch": 0.56, "learning_rate": 2.1100606035312716e-06, "loss": 0.8193, "step": 29860 }, { "epoch": 0.56, "learning_rate": 2.109909708440564e-06, "loss": 1.1019, "step": 29861 }, { "epoch": 0.56, "learning_rate": 2.1097588148064406e-06, "loss": 1.1176, "step": 29862 }, { "epoch": 0.56, "learning_rate": 2.1096079226294656e-06, "loss": 0.9809, "step": 29863 }, { "epoch": 0.56, "learning_rate": 2.1094570319102038e-06, "loss": 0.7594, "step": 29864 }, { "epoch": 0.56, "learning_rate": 2.109306142649217e-06, "loss": 0.7909, "step": 29865 }, { "epoch": 0.56, "learning_rate": 2.1091552548470687e-06, "loss": 0.6902, "step": 29866 }, { "epoch": 0.56, "learning_rate": 2.1090043685043232e-06, "loss": 0.9767, "step": 29867 }, { "epoch": 0.56, "learning_rate": 2.1088534836215432e-06, "loss": 1.1609, "step": 29868 }, { "epoch": 0.56, "learning_rate": 2.1087026001992924e-06, "loss": 0.9491, "step": 29869 }, { "epoch": 0.56, "learning_rate": 2.1085517182381336e-06, "loss": 0.8641, "step": 29870 }, { "epoch": 0.56, "learning_rate": 2.1084008377386313e-06, "loss": 0.7701, "step": 29871 }, { "epoch": 0.56, "learning_rate": 2.1082499587013477e-06, "loss": 1.083, "step": 29872 }, { "epoch": 0.56, "learning_rate": 2.108099081126847e-06, "loss": 0.9464, "step": 29873 }, { "epoch": 0.56, "learning_rate": 2.107948205015693e-06, "loss": 0.8881, "step": 29874 }, { "epoch": 0.56, "learning_rate": 2.1077973303684473e-06, "loss": 0.989, "step": 29875 }, { "epoch": 0.56, "learning_rate": 2.107646457185675e-06, "loss": 1.0438, "step": 29876 }, { "epoch": 0.56, "learning_rate": 2.1074955854679384e-06, "loss": 0.8116, "step": 29877 }, { "epoch": 0.56, "learning_rate": 2.107344715215801e-06, "loss": 0.7526, "step": 29878 }, { "epoch": 0.56, "learning_rate": 2.1071938464298275e-06, "loss": 0.9796, "step": 29879 }, { "epoch": 0.56, "learning_rate": 2.1070429791105798e-06, "loss": 0.9859, "step": 29880 }, { "epoch": 0.56, "learning_rate": 2.1068921132586205e-06, "loss": 1.1083, "step": 29881 }, { "epoch": 0.56, "learning_rate": 2.1067412488745156e-06, "loss": 1.1951, "step": 29882 }, { "epoch": 0.56, "learning_rate": 2.1065903859588257e-06, "loss": 0.9924, "step": 29883 }, { "epoch": 0.56, "learning_rate": 2.1064395245121145e-06, "loss": 1.0584, "step": 29884 }, { "epoch": 0.56, "learning_rate": 2.1062886645349475e-06, "loss": 0.8183, "step": 29885 }, { "epoch": 0.56, "learning_rate": 2.1061378060278866e-06, "loss": 0.9105, "step": 29886 }, { "epoch": 0.56, "learning_rate": 2.105986948991494e-06, "loss": 1.0453, "step": 29887 }, { "epoch": 0.56, "learning_rate": 2.105836093426335e-06, "loss": 0.9878, "step": 29888 }, { "epoch": 0.56, "learning_rate": 2.105685239332971e-06, "loss": 0.7775, "step": 29889 }, { "epoch": 0.56, "learning_rate": 2.105534386711967e-06, "loss": 1.1059, "step": 29890 }, { "epoch": 0.56, "learning_rate": 2.1053835355638854e-06, "loss": 1.0167, "step": 29891 }, { "epoch": 0.56, "learning_rate": 2.10523268588929e-06, "loss": 0.8468, "step": 29892 }, { "epoch": 0.56, "learning_rate": 2.105081837688742e-06, "loss": 0.786, "step": 29893 }, { "epoch": 0.56, "learning_rate": 2.104930990962808e-06, "loss": 1.0446, "step": 29894 }, { "epoch": 0.56, "learning_rate": 2.1047801457120494e-06, "loss": 0.8758, "step": 29895 }, { "epoch": 0.56, "learning_rate": 2.1046293019370285e-06, "loss": 0.7435, "step": 29896 }, { "epoch": 0.56, "learning_rate": 2.1044784596383103e-06, "loss": 0.8676, "step": 29897 }, { "epoch": 0.56, "learning_rate": 2.104327618816458e-06, "loss": 0.8897, "step": 29898 }, { "epoch": 0.56, "learning_rate": 2.104176779472033e-06, "loss": 1.0465, "step": 29899 }, { "epoch": 0.56, "learning_rate": 2.1040259416056007e-06, "loss": 0.9031, "step": 29900 }, { "epoch": 0.56, "learning_rate": 2.103875105217724e-06, "loss": 0.8023, "step": 29901 }, { "epoch": 0.56, "learning_rate": 2.1037242703089638e-06, "loss": 0.7177, "step": 29902 }, { "epoch": 0.56, "learning_rate": 2.1035734368798867e-06, "loss": 0.927, "step": 29903 }, { "epoch": 0.56, "learning_rate": 2.103422604931053e-06, "loss": 0.9377, "step": 29904 }, { "epoch": 0.56, "learning_rate": 2.103271774463027e-06, "loss": 0.7665, "step": 29905 }, { "epoch": 0.56, "learning_rate": 2.103120945476373e-06, "loss": 1.1845, "step": 29906 }, { "epoch": 0.56, "learning_rate": 2.1029701179716535e-06, "loss": 0.979, "step": 29907 }, { "epoch": 0.56, "learning_rate": 2.10281929194943e-06, "loss": 0.8728, "step": 29908 }, { "epoch": 0.56, "learning_rate": 2.1026684674102683e-06, "loss": 0.9997, "step": 29909 }, { "epoch": 0.56, "learning_rate": 2.1025176443547296e-06, "loss": 0.9053, "step": 29910 }, { "epoch": 0.56, "learning_rate": 2.102366822783378e-06, "loss": 0.9233, "step": 29911 }, { "epoch": 0.56, "learning_rate": 2.1022160026967763e-06, "loss": 1.0076, "step": 29912 }, { "epoch": 0.56, "learning_rate": 2.1020651840954886e-06, "loss": 0.9435, "step": 29913 }, { "epoch": 0.56, "learning_rate": 2.1019143669800764e-06, "loss": 0.9053, "step": 29914 }, { "epoch": 0.56, "learning_rate": 2.1017635513511044e-06, "loss": 0.9634, "step": 29915 }, { "epoch": 0.56, "learning_rate": 2.1016127372091357e-06, "loss": 0.8128, "step": 29916 }, { "epoch": 0.56, "learning_rate": 2.1014619245547313e-06, "loss": 0.7947, "step": 29917 }, { "epoch": 0.56, "learning_rate": 2.101311113388456e-06, "loss": 1.015, "step": 29918 }, { "epoch": 0.56, "learning_rate": 2.101160303710874e-06, "loss": 0.6995, "step": 29919 }, { "epoch": 0.56, "learning_rate": 2.101009495522546e-06, "loss": 1.1108, "step": 29920 }, { "epoch": 0.56, "learning_rate": 2.1008586888240374e-06, "loss": 0.668, "step": 29921 }, { "epoch": 0.56, "learning_rate": 2.1007078836159102e-06, "loss": 0.9562, "step": 29922 }, { "epoch": 0.56, "learning_rate": 2.100557079898726e-06, "loss": 0.7743, "step": 29923 }, { "epoch": 0.56, "learning_rate": 2.100406277673051e-06, "loss": 1.0626, "step": 29924 }, { "epoch": 0.56, "learning_rate": 2.100255476939446e-06, "loss": 1.0674, "step": 29925 }, { "epoch": 0.56, "learning_rate": 2.1001046776984743e-06, "loss": 0.8813, "step": 29926 }, { "epoch": 0.56, "learning_rate": 2.0999538799507004e-06, "loss": 0.8998, "step": 29927 }, { "epoch": 0.56, "learning_rate": 2.0998030836966864e-06, "loss": 0.9173, "step": 29928 }, { "epoch": 0.56, "learning_rate": 2.0996522889369948e-06, "loss": 0.7482, "step": 29929 }, { "epoch": 0.56, "learning_rate": 2.0995014956721897e-06, "loss": 0.972, "step": 29930 }, { "epoch": 0.56, "learning_rate": 2.099350703902834e-06, "loss": 0.8992, "step": 29931 }, { "epoch": 0.56, "learning_rate": 2.09919991362949e-06, "loss": 1.0284, "step": 29932 }, { "epoch": 0.56, "learning_rate": 2.0990491248527212e-06, "loss": 0.8743, "step": 29933 }, { "epoch": 0.56, "learning_rate": 2.098898337573091e-06, "loss": 0.9279, "step": 29934 }, { "epoch": 0.56, "learning_rate": 2.0987475517911615e-06, "loss": 0.5807, "step": 29935 }, { "epoch": 0.56, "learning_rate": 2.098596767507497e-06, "loss": 0.9648, "step": 29936 }, { "epoch": 0.56, "learning_rate": 2.09844598472266e-06, "loss": 0.9242, "step": 29937 }, { "epoch": 0.56, "learning_rate": 2.098295203437213e-06, "loss": 0.9632, "step": 29938 }, { "epoch": 0.56, "learning_rate": 2.098144423651719e-06, "loss": 0.9978, "step": 29939 }, { "epoch": 0.56, "learning_rate": 2.097993645366742e-06, "loss": 1.0275, "step": 29940 }, { "epoch": 0.56, "learning_rate": 2.097842868582844e-06, "loss": 0.8717, "step": 29941 }, { "epoch": 0.56, "learning_rate": 2.097692093300589e-06, "loss": 0.7808, "step": 29942 }, { "epoch": 0.56, "learning_rate": 2.0975413195205393e-06, "loss": 1.0091, "step": 29943 }, { "epoch": 0.56, "learning_rate": 2.097390547243257e-06, "loss": 0.9765, "step": 29944 }, { "epoch": 0.56, "learning_rate": 2.0972397764693074e-06, "loss": 0.999, "step": 29945 }, { "epoch": 0.56, "learning_rate": 2.097089007199251e-06, "loss": 0.7597, "step": 29946 }, { "epoch": 0.57, "learning_rate": 2.096938239433652e-06, "loss": 0.9146, "step": 29947 }, { "epoch": 0.57, "learning_rate": 2.096787473173074e-06, "loss": 0.9186, "step": 29948 }, { "epoch": 0.57, "learning_rate": 2.0966367084180795e-06, "loss": 1.1498, "step": 29949 }, { "epoch": 0.57, "learning_rate": 2.09648594516923e-06, "loss": 1.0261, "step": 29950 }, { "epoch": 0.57, "learning_rate": 2.0963351834270905e-06, "loss": 0.8428, "step": 29951 }, { "epoch": 0.57, "learning_rate": 2.0961844231922226e-06, "loss": 0.974, "step": 29952 }, { "epoch": 0.57, "learning_rate": 2.0960336644651893e-06, "loss": 0.9894, "step": 29953 }, { "epoch": 0.57, "learning_rate": 2.095882907246554e-06, "loss": 0.889, "step": 29954 }, { "epoch": 0.57, "learning_rate": 2.0957321515368808e-06, "loss": 0.7548, "step": 29955 }, { "epoch": 0.57, "learning_rate": 2.0955813973367295e-06, "loss": 0.9405, "step": 29956 }, { "epoch": 0.57, "learning_rate": 2.095430644646666e-06, "loss": 0.9591, "step": 29957 }, { "epoch": 0.57, "learning_rate": 2.095279893467253e-06, "loss": 0.7714, "step": 29958 }, { "epoch": 0.57, "learning_rate": 2.0951291437990502e-06, "loss": 0.8955, "step": 29959 }, { "epoch": 0.57, "learning_rate": 2.094978395642624e-06, "loss": 0.8268, "step": 29960 }, { "epoch": 0.57, "learning_rate": 2.0948276489985364e-06, "loss": 1.1588, "step": 29961 }, { "epoch": 0.57, "learning_rate": 2.094676903867349e-06, "loss": 1.1148, "step": 29962 }, { "epoch": 0.57, "learning_rate": 2.0945261602496266e-06, "loss": 1.0158, "step": 29963 }, { "epoch": 0.57, "learning_rate": 2.094375418145931e-06, "loss": 0.9174, "step": 29964 }, { "epoch": 0.57, "learning_rate": 2.0942246775568236e-06, "loss": 1.0186, "step": 29965 }, { "epoch": 0.57, "learning_rate": 2.0940739384828707e-06, "loss": 0.8417, "step": 29966 }, { "epoch": 0.57, "learning_rate": 2.0939232009246325e-06, "loss": 0.9058, "step": 29967 }, { "epoch": 0.57, "learning_rate": 2.0937724648826717e-06, "loss": 1.1058, "step": 29968 }, { "epoch": 0.57, "learning_rate": 2.0936217303575534e-06, "loss": 0.949, "step": 29969 }, { "epoch": 0.57, "learning_rate": 2.0934709973498395e-06, "loss": 1.0067, "step": 29970 }, { "epoch": 0.57, "learning_rate": 2.093320265860091e-06, "loss": 0.791, "step": 29971 }, { "epoch": 0.57, "learning_rate": 2.093169535888873e-06, "loss": 0.9213, "step": 29972 }, { "epoch": 0.57, "learning_rate": 2.0930188074367474e-06, "loss": 0.7335, "step": 29973 }, { "epoch": 0.57, "learning_rate": 2.0928680805042766e-06, "loss": 0.9407, "step": 29974 }, { "epoch": 0.57, "learning_rate": 2.092717355092024e-06, "loss": 0.9534, "step": 29975 }, { "epoch": 0.57, "learning_rate": 2.092566631200553e-06, "loss": 0.9495, "step": 29976 }, { "epoch": 0.57, "learning_rate": 2.0924159088304245e-06, "loss": 0.8807, "step": 29977 }, { "epoch": 0.57, "learning_rate": 2.092265187982204e-06, "loss": 0.6741, "step": 29978 }, { "epoch": 0.57, "learning_rate": 2.0921144686564525e-06, "loss": 0.9229, "step": 29979 }, { "epoch": 0.57, "learning_rate": 2.091963750853732e-06, "loss": 0.9155, "step": 29980 }, { "epoch": 0.57, "learning_rate": 2.091813034574607e-06, "loss": 0.8989, "step": 29981 }, { "epoch": 0.57, "learning_rate": 2.09166231981964e-06, "loss": 0.8607, "step": 29982 }, { "epoch": 0.57, "learning_rate": 2.0915116065893924e-06, "loss": 0.8966, "step": 29983 }, { "epoch": 0.57, "learning_rate": 2.091360894884429e-06, "loss": 0.7961, "step": 29984 }, { "epoch": 0.57, "learning_rate": 2.0912101847053113e-06, "loss": 0.7938, "step": 29985 }, { "epoch": 0.57, "learning_rate": 2.0910594760526017e-06, "loss": 0.8426, "step": 29986 }, { "epoch": 0.57, "learning_rate": 2.0909087689268635e-06, "loss": 1.0485, "step": 29987 }, { "epoch": 0.57, "learning_rate": 2.0907580633286593e-06, "loss": 1.1171, "step": 29988 }, { "epoch": 0.57, "learning_rate": 2.090607359258553e-06, "loss": 0.9575, "step": 29989 }, { "epoch": 0.57, "learning_rate": 2.090456656717105e-06, "loss": 0.8815, "step": 29990 }, { "epoch": 0.57, "learning_rate": 2.0903059557048803e-06, "loss": 1.003, "step": 29991 }, { "epoch": 0.57, "learning_rate": 2.0901552562224404e-06, "loss": 0.93, "step": 29992 }, { "epoch": 0.57, "learning_rate": 2.090004558270347e-06, "loss": 0.96, "step": 29993 }, { "epoch": 0.57, "learning_rate": 2.0898538618491653e-06, "loss": 1.0334, "step": 29994 }, { "epoch": 0.57, "learning_rate": 2.0897031669594566e-06, "loss": 0.8207, "step": 29995 }, { "epoch": 0.57, "learning_rate": 2.0895524736017828e-06, "loss": 0.9037, "step": 29996 }, { "epoch": 0.57, "learning_rate": 2.0894017817767087e-06, "loss": 0.9948, "step": 29997 }, { "epoch": 0.57, "learning_rate": 2.0892510914847957e-06, "loss": 0.9053, "step": 29998 }, { "epoch": 0.57, "learning_rate": 2.089100402726605e-06, "loss": 0.9088, "step": 29999 }, { "epoch": 0.57, "learning_rate": 2.0889497155027027e-06, "loss": 1.0005, "step": 30000 }, { "epoch": 0.57, "learning_rate": 2.088799029813648e-06, "loss": 0.7721, "step": 30001 }, { "epoch": 0.57, "learning_rate": 2.0886483456600053e-06, "loss": 1.0354, "step": 30002 }, { "epoch": 0.57, "learning_rate": 2.088497663042338e-06, "loss": 0.9319, "step": 30003 }, { "epoch": 0.57, "learning_rate": 2.088346981961208e-06, "loss": 0.8377, "step": 30004 }, { "epoch": 0.57, "learning_rate": 2.0881963024171765e-06, "loss": 1.0607, "step": 30005 }, { "epoch": 0.57, "learning_rate": 2.088045624410808e-06, "loss": 0.9976, "step": 30006 }, { "epoch": 0.57, "learning_rate": 2.0878949479426646e-06, "loss": 0.9333, "step": 30007 }, { "epoch": 0.57, "learning_rate": 2.0877442730133085e-06, "loss": 0.7159, "step": 30008 }, { "epoch": 0.57, "learning_rate": 2.087593599623303e-06, "loss": 0.8221, "step": 30009 }, { "epoch": 0.57, "learning_rate": 2.0874429277732107e-06, "loss": 0.7939, "step": 30010 }, { "epoch": 0.57, "learning_rate": 2.0872922574635927e-06, "loss": 0.918, "step": 30011 }, { "epoch": 0.57, "learning_rate": 2.087141588695014e-06, "loss": 1.1382, "step": 30012 }, { "epoch": 0.57, "learning_rate": 2.0869909214680358e-06, "loss": 1.0049, "step": 30013 }, { "epoch": 0.57, "learning_rate": 2.0868402557832197e-06, "loss": 0.8312, "step": 30014 }, { "epoch": 0.57, "learning_rate": 2.0866895916411297e-06, "loss": 0.9357, "step": 30015 }, { "epoch": 0.57, "learning_rate": 2.086538929042329e-06, "loss": 0.87, "step": 30016 }, { "epoch": 0.57, "learning_rate": 2.086388267987378e-06, "loss": 0.9658, "step": 30017 }, { "epoch": 0.57, "learning_rate": 2.086237608476842e-06, "loss": 0.7644, "step": 30018 }, { "epoch": 0.57, "learning_rate": 2.086086950511282e-06, "loss": 1.0307, "step": 30019 }, { "epoch": 0.57, "learning_rate": 2.0859362940912593e-06, "loss": 0.9397, "step": 30020 }, { "epoch": 0.57, "learning_rate": 2.0857856392173386e-06, "loss": 0.9965, "step": 30021 }, { "epoch": 0.57, "learning_rate": 2.0856349858900814e-06, "loss": 0.7611, "step": 30022 }, { "epoch": 0.57, "learning_rate": 2.0854843341100502e-06, "loss": 0.8091, "step": 30023 }, { "epoch": 0.57, "learning_rate": 2.0853336838778087e-06, "loss": 1.0125, "step": 30024 }, { "epoch": 0.57, "learning_rate": 2.0851830351939184e-06, "loss": 0.9656, "step": 30025 }, { "epoch": 0.57, "learning_rate": 2.085032388058941e-06, "loss": 0.6474, "step": 30026 }, { "epoch": 0.57, "learning_rate": 2.084881742473441e-06, "loss": 0.9534, "step": 30027 }, { "epoch": 0.57, "learning_rate": 2.0847310984379788e-06, "loss": 0.8817, "step": 30028 }, { "epoch": 0.57, "learning_rate": 2.0845804559531186e-06, "loss": 0.8244, "step": 30029 }, { "epoch": 0.57, "learning_rate": 2.0844298150194218e-06, "loss": 0.9935, "step": 30030 }, { "epoch": 0.57, "learning_rate": 2.084279175637452e-06, "loss": 0.8599, "step": 30031 }, { "epoch": 0.57, "learning_rate": 2.08412853780777e-06, "loss": 0.88, "step": 30032 }, { "epoch": 0.57, "learning_rate": 2.0839779015309406e-06, "loss": 0.8606, "step": 30033 }, { "epoch": 0.57, "learning_rate": 2.0838272668075247e-06, "loss": 0.8704, "step": 30034 }, { "epoch": 0.57, "learning_rate": 2.0836766336380838e-06, "loss": 0.9574, "step": 30035 }, { "epoch": 0.57, "learning_rate": 2.083526002023182e-06, "loss": 0.8382, "step": 30036 }, { "epoch": 0.57, "learning_rate": 2.0833753719633826e-06, "loss": 0.7994, "step": 30037 }, { "epoch": 0.57, "learning_rate": 2.083224743459245e-06, "loss": 0.9971, "step": 30038 }, { "epoch": 0.57, "learning_rate": 2.083074116511335e-06, "loss": 0.9924, "step": 30039 }, { "epoch": 0.57, "learning_rate": 2.0829234911202132e-06, "loss": 0.7952, "step": 30040 }, { "epoch": 0.57, "learning_rate": 2.0827728672864413e-06, "loss": 0.8557, "step": 30041 }, { "epoch": 0.57, "learning_rate": 2.0826222450105836e-06, "loss": 0.7723, "step": 30042 }, { "epoch": 0.57, "learning_rate": 2.0824716242932012e-06, "loss": 1.0917, "step": 30043 }, { "epoch": 0.57, "learning_rate": 2.0823210051348568e-06, "loss": 0.9616, "step": 30044 }, { "epoch": 0.57, "learning_rate": 2.082170387536114e-06, "loss": 0.9491, "step": 30045 }, { "epoch": 0.57, "learning_rate": 2.0820197714975336e-06, "loss": 1.0029, "step": 30046 }, { "epoch": 0.57, "learning_rate": 2.0818691570196776e-06, "loss": 0.9853, "step": 30047 }, { "epoch": 0.57, "learning_rate": 2.081718544103111e-06, "loss": 0.7745, "step": 30048 }, { "epoch": 0.57, "learning_rate": 2.0815679327483932e-06, "loss": 0.93, "step": 30049 }, { "epoch": 0.57, "learning_rate": 2.0814173229560885e-06, "loss": 1.0684, "step": 30050 }, { "epoch": 0.57, "learning_rate": 2.0812667147267585e-06, "loss": 0.7611, "step": 30051 }, { "epoch": 0.57, "learning_rate": 2.081116108060966e-06, "loss": 0.9657, "step": 30052 }, { "epoch": 0.57, "learning_rate": 2.0809655029592725e-06, "loss": 1.002, "step": 30053 }, { "epoch": 0.57, "learning_rate": 2.0808148994222417e-06, "loss": 0.7573, "step": 30054 }, { "epoch": 0.57, "learning_rate": 2.080664297450435e-06, "loss": 0.7842, "step": 30055 }, { "epoch": 0.57, "learning_rate": 2.0805136970444144e-06, "loss": 1.019, "step": 30056 }, { "epoch": 0.57, "learning_rate": 2.0803630982047433e-06, "loss": 0.8941, "step": 30057 }, { "epoch": 0.57, "learning_rate": 2.080212500931984e-06, "loss": 0.8849, "step": 30058 }, { "epoch": 0.57, "learning_rate": 2.080061905226697e-06, "loss": 0.9253, "step": 30059 }, { "epoch": 0.57, "learning_rate": 2.0799113110894474e-06, "loss": 0.8116, "step": 30060 }, { "epoch": 0.57, "learning_rate": 2.0797607185207957e-06, "loss": 0.9538, "step": 30061 }, { "epoch": 0.57, "learning_rate": 2.079610127521304e-06, "loss": 0.9725, "step": 30062 }, { "epoch": 0.57, "learning_rate": 2.0794595380915356e-06, "loss": 1.0701, "step": 30063 }, { "epoch": 0.57, "learning_rate": 2.0793089502320525e-06, "loss": 0.8789, "step": 30064 }, { "epoch": 0.57, "learning_rate": 2.079158363943416e-06, "loss": 0.978, "step": 30065 }, { "epoch": 0.57, "learning_rate": 2.0790077792261907e-06, "loss": 0.8152, "step": 30066 }, { "epoch": 0.57, "learning_rate": 2.0788571960809372e-06, "loss": 1.1753, "step": 30067 }, { "epoch": 0.57, "learning_rate": 2.078706614508217e-06, "loss": 0.9651, "step": 30068 }, { "epoch": 0.57, "learning_rate": 2.0785560345085944e-06, "loss": 1.0496, "step": 30069 }, { "epoch": 0.57, "learning_rate": 2.07840545608263e-06, "loss": 0.9618, "step": 30070 }, { "epoch": 0.57, "learning_rate": 2.0782548792308863e-06, "loss": 0.8895, "step": 30071 }, { "epoch": 0.57, "learning_rate": 2.078104303953927e-06, "loss": 0.8645, "step": 30072 }, { "epoch": 0.57, "learning_rate": 2.0779537302523132e-06, "loss": 0.9031, "step": 30073 }, { "epoch": 0.57, "learning_rate": 2.077803158126606e-06, "loss": 0.9515, "step": 30074 }, { "epoch": 0.57, "learning_rate": 2.0776525875773704e-06, "loss": 0.8466, "step": 30075 }, { "epoch": 0.57, "learning_rate": 2.0775020186051664e-06, "loss": 0.9105, "step": 30076 }, { "epoch": 0.57, "learning_rate": 2.077351451210557e-06, "loss": 0.9742, "step": 30077 }, { "epoch": 0.57, "learning_rate": 2.077200885394104e-06, "loss": 0.7421, "step": 30078 }, { "epoch": 0.57, "learning_rate": 2.0770503211563704e-06, "loss": 1.0031, "step": 30079 }, { "epoch": 0.57, "learning_rate": 2.0768997584979175e-06, "loss": 0.9596, "step": 30080 }, { "epoch": 0.57, "learning_rate": 2.0767491974193084e-06, "loss": 0.9609, "step": 30081 }, { "epoch": 0.57, "learning_rate": 2.076598637921105e-06, "loss": 0.7502, "step": 30082 }, { "epoch": 0.57, "learning_rate": 2.0764480800038685e-06, "loss": 0.5975, "step": 30083 }, { "epoch": 0.57, "learning_rate": 2.076297523668162e-06, "loss": 0.8231, "step": 30084 }, { "epoch": 0.57, "learning_rate": 2.076146968914548e-06, "loss": 0.9203, "step": 30085 }, { "epoch": 0.57, "learning_rate": 2.0759964157435873e-06, "loss": 0.6793, "step": 30086 }, { "epoch": 0.57, "learning_rate": 2.0758458641558443e-06, "loss": 1.0374, "step": 30087 }, { "epoch": 0.57, "learning_rate": 2.07569531415188e-06, "loss": 0.8261, "step": 30088 }, { "epoch": 0.57, "learning_rate": 2.075544765732255e-06, "loss": 0.7097, "step": 30089 }, { "epoch": 0.57, "learning_rate": 2.0753942188975335e-06, "loss": 0.8802, "step": 30090 }, { "epoch": 0.57, "learning_rate": 2.075243673648277e-06, "loss": 1.1774, "step": 30091 }, { "epoch": 0.57, "learning_rate": 2.075093129985047e-06, "loss": 0.8913, "step": 30092 }, { "epoch": 0.57, "learning_rate": 2.0749425879084075e-06, "loss": 0.9907, "step": 30093 }, { "epoch": 0.57, "learning_rate": 2.074792047418919e-06, "loss": 0.9205, "step": 30094 }, { "epoch": 0.57, "learning_rate": 2.0746415085171426e-06, "loss": 0.9244, "step": 30095 }, { "epoch": 0.57, "learning_rate": 2.074490971203643e-06, "loss": 1.0901, "step": 30096 }, { "epoch": 0.57, "learning_rate": 2.074340435478981e-06, "loss": 0.9566, "step": 30097 }, { "epoch": 0.57, "learning_rate": 2.0741899013437184e-06, "loss": 0.8422, "step": 30098 }, { "epoch": 0.57, "learning_rate": 2.074039368798418e-06, "loss": 1.1676, "step": 30099 }, { "epoch": 0.57, "learning_rate": 2.0738888378436417e-06, "loss": 1.1561, "step": 30100 }, { "epoch": 0.57, "learning_rate": 2.0737383084799502e-06, "loss": 0.9241, "step": 30101 }, { "epoch": 0.57, "learning_rate": 2.073587780707908e-06, "loss": 0.9609, "step": 30102 }, { "epoch": 0.57, "learning_rate": 2.073437254528076e-06, "loss": 0.9605, "step": 30103 }, { "epoch": 0.57, "learning_rate": 2.0732867299410152e-06, "loss": 0.7202, "step": 30104 }, { "epoch": 0.57, "learning_rate": 2.0731362069472894e-06, "loss": 1.025, "step": 30105 }, { "epoch": 0.57, "learning_rate": 2.07298568554746e-06, "loss": 1.0681, "step": 30106 }, { "epoch": 0.57, "learning_rate": 2.0728351657420884e-06, "loss": 0.911, "step": 30107 }, { "epoch": 0.57, "learning_rate": 2.072684647531738e-06, "loss": 0.8746, "step": 30108 }, { "epoch": 0.57, "learning_rate": 2.07253413091697e-06, "loss": 0.8588, "step": 30109 }, { "epoch": 0.57, "learning_rate": 2.0723836158983456e-06, "loss": 0.7535, "step": 30110 }, { "epoch": 0.57, "learning_rate": 2.0722331024764283e-06, "loss": 1.1769, "step": 30111 }, { "epoch": 0.57, "learning_rate": 2.0720825906517793e-06, "loss": 1.0418, "step": 30112 }, { "epoch": 0.57, "learning_rate": 2.0719320804249597e-06, "loss": 0.9539, "step": 30113 }, { "epoch": 0.57, "learning_rate": 2.0717815717965345e-06, "loss": 0.7802, "step": 30114 }, { "epoch": 0.57, "learning_rate": 2.0716310647670635e-06, "loss": 0.7423, "step": 30115 }, { "epoch": 0.57, "learning_rate": 2.0714805593371076e-06, "loss": 0.8284, "step": 30116 }, { "epoch": 0.57, "learning_rate": 2.071330055507231e-06, "loss": 0.9784, "step": 30117 }, { "epoch": 0.57, "learning_rate": 2.071179553277995e-06, "loss": 0.9957, "step": 30118 }, { "epoch": 0.57, "learning_rate": 2.071029052649961e-06, "loss": 0.8971, "step": 30119 }, { "epoch": 0.57, "learning_rate": 2.0708785536236915e-06, "loss": 1.0391, "step": 30120 }, { "epoch": 0.57, "learning_rate": 2.070728056199749e-06, "loss": 0.9303, "step": 30121 }, { "epoch": 0.57, "learning_rate": 2.0705775603786937e-06, "loss": 0.8185, "step": 30122 }, { "epoch": 0.57, "learning_rate": 2.0704270661610894e-06, "loss": 0.8089, "step": 30123 }, { "epoch": 0.57, "learning_rate": 2.070276573547497e-06, "loss": 0.9131, "step": 30124 }, { "epoch": 0.57, "learning_rate": 2.070126082538478e-06, "loss": 0.9535, "step": 30125 }, { "epoch": 0.57, "learning_rate": 2.0699755931345956e-06, "loss": 0.9018, "step": 30126 }, { "epoch": 0.57, "learning_rate": 2.069825105336412e-06, "loss": 0.7997, "step": 30127 }, { "epoch": 0.57, "learning_rate": 2.0696746191444867e-06, "loss": 0.8352, "step": 30128 }, { "epoch": 0.57, "learning_rate": 2.0695241345593843e-06, "loss": 0.7806, "step": 30129 }, { "epoch": 0.57, "learning_rate": 2.069373651581666e-06, "loss": 1.2375, "step": 30130 }, { "epoch": 0.57, "learning_rate": 2.0692231702118917e-06, "loss": 1.0815, "step": 30131 }, { "epoch": 0.57, "learning_rate": 2.069072690450626e-06, "loss": 0.9607, "step": 30132 }, { "epoch": 0.57, "learning_rate": 2.068922212298429e-06, "loss": 0.6869, "step": 30133 }, { "epoch": 0.57, "learning_rate": 2.068771735755863e-06, "loss": 0.8332, "step": 30134 }, { "epoch": 0.57, "learning_rate": 2.0686212608234914e-06, "loss": 1.0663, "step": 30135 }, { "epoch": 0.57, "learning_rate": 2.0684707875018744e-06, "loss": 1.1404, "step": 30136 }, { "epoch": 0.57, "learning_rate": 2.0683203157915733e-06, "loss": 0.9877, "step": 30137 }, { "epoch": 0.57, "learning_rate": 2.068169845693152e-06, "loss": 0.7917, "step": 30138 }, { "epoch": 0.57, "learning_rate": 2.068019377207171e-06, "loss": 0.8746, "step": 30139 }, { "epoch": 0.57, "learning_rate": 2.067868910334192e-06, "loss": 0.7925, "step": 30140 }, { "epoch": 0.57, "learning_rate": 2.0677184450747774e-06, "loss": 0.9088, "step": 30141 }, { "epoch": 0.57, "learning_rate": 2.067567981429489e-06, "loss": 0.7798, "step": 30142 }, { "epoch": 0.57, "learning_rate": 2.067417519398888e-06, "loss": 1.0718, "step": 30143 }, { "epoch": 0.57, "learning_rate": 2.0672670589835376e-06, "loss": 1.0705, "step": 30144 }, { "epoch": 0.57, "learning_rate": 2.0671166001839986e-06, "loss": 0.8099, "step": 30145 }, { "epoch": 0.57, "learning_rate": 2.066966143000832e-06, "loss": 0.7792, "step": 30146 }, { "epoch": 0.57, "learning_rate": 2.0668156874346013e-06, "loss": 0.8213, "step": 30147 }, { "epoch": 0.57, "learning_rate": 2.066665233485868e-06, "loss": 0.838, "step": 30148 }, { "epoch": 0.57, "learning_rate": 2.066514781155192e-06, "loss": 0.7273, "step": 30149 }, { "epoch": 0.57, "learning_rate": 2.066364330443138e-06, "loss": 1.0651, "step": 30150 }, { "epoch": 0.57, "learning_rate": 2.066213881350266e-06, "loss": 1.0006, "step": 30151 }, { "epoch": 0.57, "learning_rate": 2.0660634338771367e-06, "loss": 0.8032, "step": 30152 }, { "epoch": 0.57, "learning_rate": 2.065912988024315e-06, "loss": 0.9087, "step": 30153 }, { "epoch": 0.57, "learning_rate": 2.06576254379236e-06, "loss": 0.8522, "step": 30154 }, { "epoch": 0.57, "learning_rate": 2.0656121011818338e-06, "loss": 1.0494, "step": 30155 }, { "epoch": 0.57, "learning_rate": 2.0654616601933e-06, "loss": 1.1277, "step": 30156 }, { "epoch": 0.57, "learning_rate": 2.0653112208273187e-06, "loss": 0.9803, "step": 30157 }, { "epoch": 0.57, "learning_rate": 2.065160783084451e-06, "loss": 0.6312, "step": 30158 }, { "epoch": 0.57, "learning_rate": 2.0650103469652607e-06, "loss": 0.8654, "step": 30159 }, { "epoch": 0.57, "learning_rate": 2.0648599124703076e-06, "loss": 0.854, "step": 30160 }, { "epoch": 0.57, "learning_rate": 2.0647094796001547e-06, "loss": 0.9263, "step": 30161 }, { "epoch": 0.57, "learning_rate": 2.0645590483553636e-06, "loss": 1.0168, "step": 30162 }, { "epoch": 0.57, "learning_rate": 2.064408618736496e-06, "loss": 0.992, "step": 30163 }, { "epoch": 0.57, "learning_rate": 2.0642581907441113e-06, "loss": 0.6482, "step": 30164 }, { "epoch": 0.57, "learning_rate": 2.064107764378775e-06, "loss": 0.9789, "step": 30165 }, { "epoch": 0.57, "learning_rate": 2.063957339641047e-06, "loss": 0.6619, "step": 30166 }, { "epoch": 0.57, "learning_rate": 2.063806916531487e-06, "loss": 0.8105, "step": 30167 }, { "epoch": 0.57, "learning_rate": 2.0636564950506603e-06, "loss": 0.8832, "step": 30168 }, { "epoch": 0.57, "learning_rate": 2.0635060751991268e-06, "loss": 1.0691, "step": 30169 }, { "epoch": 0.57, "learning_rate": 2.0633556569774473e-06, "loss": 0.8977, "step": 30170 }, { "epoch": 0.57, "learning_rate": 2.063205240386185e-06, "loss": 0.7719, "step": 30171 }, { "epoch": 0.57, "learning_rate": 2.063054825425902e-06, "loss": 0.8041, "step": 30172 }, { "epoch": 0.57, "learning_rate": 2.062904412097157e-06, "loss": 1.0521, "step": 30173 }, { "epoch": 0.57, "learning_rate": 2.0627540004005144e-06, "loss": 1.0035, "step": 30174 }, { "epoch": 0.57, "learning_rate": 2.0626035903365347e-06, "loss": 1.112, "step": 30175 }, { "epoch": 0.57, "learning_rate": 2.06245318190578e-06, "loss": 0.6681, "step": 30176 }, { "epoch": 0.57, "learning_rate": 2.0623027751088117e-06, "loss": 0.7821, "step": 30177 }, { "epoch": 0.57, "learning_rate": 2.062152369946192e-06, "loss": 0.9084, "step": 30178 }, { "epoch": 0.57, "learning_rate": 2.0620019664184805e-06, "loss": 0.7979, "step": 30179 }, { "epoch": 0.57, "learning_rate": 2.0618515645262414e-06, "loss": 0.82, "step": 30180 }, { "epoch": 0.57, "learning_rate": 2.0617011642700346e-06, "loss": 1.2498, "step": 30181 }, { "epoch": 0.57, "learning_rate": 2.0615507656504225e-06, "loss": 0.8422, "step": 30182 }, { "epoch": 0.57, "learning_rate": 2.061400368667966e-06, "loss": 0.715, "step": 30183 }, { "epoch": 0.57, "learning_rate": 2.0612499733232275e-06, "loss": 0.9791, "step": 30184 }, { "epoch": 0.57, "learning_rate": 2.061099579616768e-06, "loss": 0.8307, "step": 30185 }, { "epoch": 0.57, "learning_rate": 2.0609491875491495e-06, "loss": 0.8994, "step": 30186 }, { "epoch": 0.57, "learning_rate": 2.060798797120933e-06, "loss": 1.0903, "step": 30187 }, { "epoch": 0.57, "learning_rate": 2.06064840833268e-06, "loss": 1.1038, "step": 30188 }, { "epoch": 0.57, "learning_rate": 2.0604980211849525e-06, "loss": 0.912, "step": 30189 }, { "epoch": 0.57, "learning_rate": 2.0603476356783126e-06, "loss": 0.9739, "step": 30190 }, { "epoch": 0.57, "learning_rate": 2.06019725181332e-06, "loss": 0.99, "step": 30191 }, { "epoch": 0.57, "learning_rate": 2.060046869590538e-06, "loss": 0.9341, "step": 30192 }, { "epoch": 0.57, "learning_rate": 2.0598964890105284e-06, "loss": 1.068, "step": 30193 }, { "epoch": 0.57, "learning_rate": 2.05974611007385e-06, "loss": 1.1724, "step": 30194 }, { "epoch": 0.57, "learning_rate": 2.0595957327810676e-06, "loss": 0.7961, "step": 30195 }, { "epoch": 0.57, "learning_rate": 2.0594453571327405e-06, "loss": 0.8867, "step": 30196 }, { "epoch": 0.57, "learning_rate": 2.0592949831294305e-06, "loss": 1.0615, "step": 30197 }, { "epoch": 0.57, "learning_rate": 2.0591446107717005e-06, "loss": 0.7899, "step": 30198 }, { "epoch": 0.57, "learning_rate": 2.0589942400601114e-06, "loss": 1.0701, "step": 30199 }, { "epoch": 0.57, "learning_rate": 2.058843870995223e-06, "loss": 1.1607, "step": 30200 }, { "epoch": 0.57, "learning_rate": 2.0586935035775987e-06, "loss": 0.8446, "step": 30201 }, { "epoch": 0.57, "learning_rate": 2.058543137807799e-06, "loss": 0.8432, "step": 30202 }, { "epoch": 0.57, "learning_rate": 2.058392773686386e-06, "loss": 1.1547, "step": 30203 }, { "epoch": 0.57, "learning_rate": 2.0582424112139206e-06, "loss": 0.77, "step": 30204 }, { "epoch": 0.57, "learning_rate": 2.058092050390965e-06, "loss": 0.9237, "step": 30205 }, { "epoch": 0.57, "learning_rate": 2.057941691218079e-06, "loss": 0.9131, "step": 30206 }, { "epoch": 0.57, "learning_rate": 2.057791333695827e-06, "loss": 0.827, "step": 30207 }, { "epoch": 0.57, "learning_rate": 2.0576409778247673e-06, "loss": 0.9675, "step": 30208 }, { "epoch": 0.57, "learning_rate": 2.0574906236054627e-06, "loss": 0.8698, "step": 30209 }, { "epoch": 0.57, "learning_rate": 2.057340271038474e-06, "loss": 0.9456, "step": 30210 }, { "epoch": 0.57, "learning_rate": 2.0571899201243646e-06, "loss": 0.7692, "step": 30211 }, { "epoch": 0.57, "learning_rate": 2.057039570863693e-06, "loss": 1.0565, "step": 30212 }, { "epoch": 0.57, "learning_rate": 2.0568892232570234e-06, "loss": 1.0316, "step": 30213 }, { "epoch": 0.57, "learning_rate": 2.056738877304916e-06, "loss": 0.9953, "step": 30214 }, { "epoch": 0.57, "learning_rate": 2.05658853300793e-06, "loss": 0.734, "step": 30215 }, { "epoch": 0.57, "learning_rate": 2.0564381903666308e-06, "loss": 0.8457, "step": 30216 }, { "epoch": 0.57, "learning_rate": 2.056287849381577e-06, "loss": 0.6843, "step": 30217 }, { "epoch": 0.57, "learning_rate": 2.0561375100533305e-06, "loss": 1.2033, "step": 30218 }, { "epoch": 0.57, "learning_rate": 2.0559871723824535e-06, "loss": 0.9869, "step": 30219 }, { "epoch": 0.57, "learning_rate": 2.0558368363695068e-06, "loss": 0.8352, "step": 30220 }, { "epoch": 0.57, "learning_rate": 2.0556865020150522e-06, "loss": 0.7005, "step": 30221 }, { "epoch": 0.57, "learning_rate": 2.0555361693196493e-06, "loss": 0.9091, "step": 30222 }, { "epoch": 0.57, "learning_rate": 2.0553858382838614e-06, "loss": 0.7717, "step": 30223 }, { "epoch": 0.57, "learning_rate": 2.055235508908249e-06, "loss": 1.1727, "step": 30224 }, { "epoch": 0.57, "learning_rate": 2.055085181193373e-06, "loss": 1.3772, "step": 30225 }, { "epoch": 0.57, "learning_rate": 2.0549348551397968e-06, "loss": 0.9483, "step": 30226 }, { "epoch": 0.57, "learning_rate": 2.05478453074808e-06, "loss": 0.973, "step": 30227 }, { "epoch": 0.57, "learning_rate": 2.0546342080187827e-06, "loss": 0.9044, "step": 30228 }, { "epoch": 0.57, "learning_rate": 2.0544838869524684e-06, "loss": 0.7867, "step": 30229 }, { "epoch": 0.57, "learning_rate": 2.0543335675496976e-06, "loss": 1.0326, "step": 30230 }, { "epoch": 0.57, "learning_rate": 2.054183249811031e-06, "loss": 1.102, "step": 30231 }, { "epoch": 0.57, "learning_rate": 2.0540329337370314e-06, "loss": 1.1637, "step": 30232 }, { "epoch": 0.57, "learning_rate": 2.0538826193282592e-06, "loss": 0.9583, "step": 30233 }, { "epoch": 0.57, "learning_rate": 2.0537323065852748e-06, "loss": 0.7168, "step": 30234 }, { "epoch": 0.57, "learning_rate": 2.053581995508641e-06, "loss": 0.9509, "step": 30235 }, { "epoch": 0.57, "learning_rate": 2.053431686098918e-06, "loss": 0.7702, "step": 30236 }, { "epoch": 0.57, "learning_rate": 2.0532813783566673e-06, "loss": 0.9984, "step": 30237 }, { "epoch": 0.57, "learning_rate": 2.05313107228245e-06, "loss": 0.915, "step": 30238 }, { "epoch": 0.57, "learning_rate": 2.0529807678768285e-06, "loss": 0.8981, "step": 30239 }, { "epoch": 0.57, "learning_rate": 2.0528304651403618e-06, "loss": 0.7836, "step": 30240 }, { "epoch": 0.57, "learning_rate": 2.052680164073614e-06, "loss": 0.9995, "step": 30241 }, { "epoch": 0.57, "learning_rate": 2.052529864677144e-06, "loss": 1.0236, "step": 30242 }, { "epoch": 0.57, "learning_rate": 2.052379566951513e-06, "loss": 1.0769, "step": 30243 }, { "epoch": 0.57, "learning_rate": 2.0522292708972837e-06, "loss": 0.799, "step": 30244 }, { "epoch": 0.57, "learning_rate": 2.0520789765150166e-06, "loss": 0.9018, "step": 30245 }, { "epoch": 0.57, "learning_rate": 2.0519286838052723e-06, "loss": 0.9428, "step": 30246 }, { "epoch": 0.57, "learning_rate": 2.0517783927686137e-06, "loss": 0.8006, "step": 30247 }, { "epoch": 0.57, "learning_rate": 2.051628103405601e-06, "loss": 0.8622, "step": 30248 }, { "epoch": 0.57, "learning_rate": 2.0514778157167934e-06, "loss": 0.9255, "step": 30249 }, { "epoch": 0.57, "learning_rate": 2.0513275297027553e-06, "loss": 1.1285, "step": 30250 }, { "epoch": 0.57, "learning_rate": 2.051177245364046e-06, "loss": 1.0662, "step": 30251 }, { "epoch": 0.57, "learning_rate": 2.0510269627012265e-06, "loss": 0.8235, "step": 30252 }, { "epoch": 0.57, "learning_rate": 2.0508766817148595e-06, "loss": 0.8683, "step": 30253 }, { "epoch": 0.57, "learning_rate": 2.0507264024055056e-06, "loss": 0.855, "step": 30254 }, { "epoch": 0.57, "learning_rate": 2.050576124773724e-06, "loss": 0.8321, "step": 30255 }, { "epoch": 0.57, "learning_rate": 2.0504258488200787e-06, "loss": 0.9781, "step": 30256 }, { "epoch": 0.57, "learning_rate": 2.050275574545129e-06, "loss": 0.959, "step": 30257 }, { "epoch": 0.57, "learning_rate": 2.050125301949436e-06, "loss": 0.897, "step": 30258 }, { "epoch": 0.57, "learning_rate": 2.049975031033562e-06, "loss": 0.8543, "step": 30259 }, { "epoch": 0.57, "learning_rate": 2.049824761798068e-06, "loss": 0.8712, "step": 30260 }, { "epoch": 0.57, "learning_rate": 2.049674494243513e-06, "loss": 1.0498, "step": 30261 }, { "epoch": 0.57, "learning_rate": 2.0495242283704607e-06, "loss": 1.1246, "step": 30262 }, { "epoch": 0.57, "learning_rate": 2.0493739641794717e-06, "loss": 0.9236, "step": 30263 }, { "epoch": 0.57, "learning_rate": 2.0492237016711047e-06, "loss": 0.8541, "step": 30264 }, { "epoch": 0.57, "learning_rate": 2.0490734408459235e-06, "loss": 0.8532, "step": 30265 }, { "epoch": 0.57, "learning_rate": 2.048923181704489e-06, "loss": 0.8661, "step": 30266 }, { "epoch": 0.57, "learning_rate": 2.04877292424736e-06, "loss": 1.1719, "step": 30267 }, { "epoch": 0.57, "learning_rate": 2.0486226684751006e-06, "loss": 1.0862, "step": 30268 }, { "epoch": 0.57, "learning_rate": 2.0484724143882698e-06, "loss": 1.1264, "step": 30269 }, { "epoch": 0.57, "learning_rate": 2.0483221619874284e-06, "loss": 1.0488, "step": 30270 }, { "epoch": 0.57, "learning_rate": 2.048171911273139e-06, "loss": 0.9928, "step": 30271 }, { "epoch": 0.57, "learning_rate": 2.0480216622459616e-06, "loss": 0.8625, "step": 30272 }, { "epoch": 0.57, "learning_rate": 2.0478714149064567e-06, "loss": 0.863, "step": 30273 }, { "epoch": 0.57, "learning_rate": 2.0477211692551872e-06, "loss": 1.0779, "step": 30274 }, { "epoch": 0.57, "learning_rate": 2.047570925292713e-06, "loss": 0.839, "step": 30275 }, { "epoch": 0.57, "learning_rate": 2.0474206830195942e-06, "loss": 1.1539, "step": 30276 }, { "epoch": 0.57, "learning_rate": 2.047270442436394e-06, "loss": 0.8476, "step": 30277 }, { "epoch": 0.57, "learning_rate": 2.0471202035436706e-06, "loss": 1.0651, "step": 30278 }, { "epoch": 0.57, "learning_rate": 2.046969966341987e-06, "loss": 0.6536, "step": 30279 }, { "epoch": 0.57, "learning_rate": 2.046819730831904e-06, "loss": 0.9102, "step": 30280 }, { "epoch": 0.57, "learning_rate": 2.0466694970139824e-06, "loss": 1.1528, "step": 30281 }, { "epoch": 0.57, "learning_rate": 2.046519264888782e-06, "loss": 0.7544, "step": 30282 }, { "epoch": 0.57, "learning_rate": 2.046369034456866e-06, "loss": 0.8345, "step": 30283 }, { "epoch": 0.57, "learning_rate": 2.0462188057187938e-06, "loss": 1.1104, "step": 30284 }, { "epoch": 0.57, "learning_rate": 2.046068578675126e-06, "loss": 0.8245, "step": 30285 }, { "epoch": 0.57, "learning_rate": 2.045918353326424e-06, "loss": 0.7901, "step": 30286 }, { "epoch": 0.57, "learning_rate": 2.04576812967325e-06, "loss": 1.06, "step": 30287 }, { "epoch": 0.57, "learning_rate": 2.045617907716163e-06, "loss": 1.165, "step": 30288 }, { "epoch": 0.57, "learning_rate": 2.0454676874557257e-06, "loss": 0.955, "step": 30289 }, { "epoch": 0.57, "learning_rate": 2.0453174688924983e-06, "loss": 0.7984, "step": 30290 }, { "epoch": 0.57, "learning_rate": 2.04516725202704e-06, "loss": 0.8375, "step": 30291 }, { "epoch": 0.57, "learning_rate": 2.0450170368599145e-06, "loss": 0.876, "step": 30292 }, { "epoch": 0.57, "learning_rate": 2.044866823391681e-06, "loss": 0.9175, "step": 30293 }, { "epoch": 0.57, "learning_rate": 2.0447166116229e-06, "loss": 0.774, "step": 30294 }, { "epoch": 0.57, "learning_rate": 2.0445664015541347e-06, "loss": 0.9124, "step": 30295 }, { "epoch": 0.57, "learning_rate": 2.044416193185944e-06, "loss": 0.8137, "step": 30296 }, { "epoch": 0.57, "learning_rate": 2.0442659865188887e-06, "loss": 0.8281, "step": 30297 }, { "epoch": 0.57, "learning_rate": 2.0441157815535314e-06, "loss": 0.7624, "step": 30298 }, { "epoch": 0.57, "learning_rate": 2.0439655782904303e-06, "loss": 1.0026, "step": 30299 }, { "epoch": 0.57, "learning_rate": 2.043815376730149e-06, "loss": 1.1407, "step": 30300 }, { "epoch": 0.57, "learning_rate": 2.0436651768732464e-06, "loss": 1.0396, "step": 30301 }, { "epoch": 0.57, "learning_rate": 2.0435149787202845e-06, "loss": 0.7816, "step": 30302 }, { "epoch": 0.57, "learning_rate": 2.0433647822718228e-06, "loss": 0.8781, "step": 30303 }, { "epoch": 0.57, "learning_rate": 2.043214587528424e-06, "loss": 0.8198, "step": 30304 }, { "epoch": 0.57, "learning_rate": 2.0430643944906483e-06, "loss": 0.9357, "step": 30305 }, { "epoch": 0.57, "learning_rate": 2.0429142031590545e-06, "loss": 1.2089, "step": 30306 }, { "epoch": 0.57, "learning_rate": 2.042764013534206e-06, "loss": 0.9598, "step": 30307 }, { "epoch": 0.57, "learning_rate": 2.0426138256166626e-06, "loss": 0.6857, "step": 30308 }, { "epoch": 0.57, "learning_rate": 2.0424636394069848e-06, "loss": 0.7082, "step": 30309 }, { "epoch": 0.57, "learning_rate": 2.0423134549057342e-06, "loss": 0.8983, "step": 30310 }, { "epoch": 0.57, "learning_rate": 2.0421632721134714e-06, "loss": 0.6754, "step": 30311 }, { "epoch": 0.57, "learning_rate": 2.042013091030756e-06, "loss": 1.0237, "step": 30312 }, { "epoch": 0.57, "learning_rate": 2.0418629116581507e-06, "loss": 0.9502, "step": 30313 }, { "epoch": 0.57, "learning_rate": 2.0417127339962147e-06, "loss": 0.9652, "step": 30314 }, { "epoch": 0.57, "learning_rate": 2.0415625580455085e-06, "loss": 0.8568, "step": 30315 }, { "epoch": 0.57, "learning_rate": 2.0414123838065954e-06, "loss": 0.888, "step": 30316 }, { "epoch": 0.57, "learning_rate": 2.041262211280034e-06, "loss": 0.8156, "step": 30317 }, { "epoch": 0.57, "learning_rate": 2.041112040466384e-06, "loss": 1.0072, "step": 30318 }, { "epoch": 0.57, "learning_rate": 2.0409618713662087e-06, "loss": 1.0246, "step": 30319 }, { "epoch": 0.57, "learning_rate": 2.0408117039800673e-06, "loss": 0.9359, "step": 30320 }, { "epoch": 0.57, "learning_rate": 2.0406615383085214e-06, "loss": 0.7975, "step": 30321 }, { "epoch": 0.57, "learning_rate": 2.040511374352131e-06, "loss": 0.8597, "step": 30322 }, { "epoch": 0.57, "learning_rate": 2.0403612121114567e-06, "loss": 0.8435, "step": 30323 }, { "epoch": 0.57, "learning_rate": 2.0402110515870594e-06, "loss": 0.9153, "step": 30324 }, { "epoch": 0.57, "learning_rate": 2.040060892779501e-06, "loss": 0.936, "step": 30325 }, { "epoch": 0.57, "learning_rate": 2.0399107356893406e-06, "loss": 1.0018, "step": 30326 }, { "epoch": 0.57, "learning_rate": 2.039760580317139e-06, "loss": 0.7332, "step": 30327 }, { "epoch": 0.57, "learning_rate": 2.0396104266634574e-06, "loss": 1.0843, "step": 30328 }, { "epoch": 0.57, "learning_rate": 2.039460274728857e-06, "loss": 1.03, "step": 30329 }, { "epoch": 0.57, "learning_rate": 2.0393101245138966e-06, "loss": 0.9286, "step": 30330 }, { "epoch": 0.57, "learning_rate": 2.039159976019139e-06, "loss": 1.2092, "step": 30331 }, { "epoch": 0.57, "learning_rate": 2.0390098292451443e-06, "loss": 0.9797, "step": 30332 }, { "epoch": 0.57, "learning_rate": 2.0388596841924717e-06, "loss": 0.9132, "step": 30333 }, { "epoch": 0.57, "learning_rate": 2.0387095408616836e-06, "loss": 0.8892, "step": 30334 }, { "epoch": 0.57, "learning_rate": 2.03855939925334e-06, "loss": 0.88, "step": 30335 }, { "epoch": 0.57, "learning_rate": 2.0384092593680003e-06, "loss": 1.0037, "step": 30336 }, { "epoch": 0.57, "learning_rate": 2.0382591212062274e-06, "loss": 1.058, "step": 30337 }, { "epoch": 0.57, "learning_rate": 2.038108984768581e-06, "loss": 0.9164, "step": 30338 }, { "epoch": 0.57, "learning_rate": 2.0379588500556207e-06, "loss": 0.8892, "step": 30339 }, { "epoch": 0.57, "learning_rate": 2.0378087170679083e-06, "loss": 0.9208, "step": 30340 }, { "epoch": 0.57, "learning_rate": 2.037658585806004e-06, "loss": 0.7089, "step": 30341 }, { "epoch": 0.57, "learning_rate": 2.037508456270468e-06, "loss": 0.8426, "step": 30342 }, { "epoch": 0.57, "learning_rate": 2.0373583284618614e-06, "loss": 0.9612, "step": 30343 }, { "epoch": 0.57, "learning_rate": 2.037208202380745e-06, "loss": 1.0348, "step": 30344 }, { "epoch": 0.57, "learning_rate": 2.037058078027678e-06, "loss": 0.9972, "step": 30345 }, { "epoch": 0.57, "learning_rate": 2.0369079554032234e-06, "loss": 0.8574, "step": 30346 }, { "epoch": 0.57, "learning_rate": 2.0367578345079397e-06, "loss": 0.7764, "step": 30347 }, { "epoch": 0.57, "learning_rate": 2.0366077153423875e-06, "loss": 0.8463, "step": 30348 }, { "epoch": 0.57, "learning_rate": 2.036457597907128e-06, "loss": 0.9623, "step": 30349 }, { "epoch": 0.57, "learning_rate": 2.0363074822027222e-06, "loss": 1.2043, "step": 30350 }, { "epoch": 0.57, "learning_rate": 2.0361573682297293e-06, "loss": 0.9776, "step": 30351 }, { "epoch": 0.57, "learning_rate": 2.0360072559887113e-06, "loss": 0.9828, "step": 30352 }, { "epoch": 0.57, "learning_rate": 2.035857145480228e-06, "loss": 0.7839, "step": 30353 }, { "epoch": 0.57, "learning_rate": 2.035707036704839e-06, "loss": 0.7195, "step": 30354 }, { "epoch": 0.57, "learning_rate": 2.0355569296631065e-06, "loss": 0.9766, "step": 30355 }, { "epoch": 0.57, "learning_rate": 2.03540682435559e-06, "loss": 0.8761, "step": 30356 }, { "epoch": 0.57, "learning_rate": 2.0352567207828494e-06, "loss": 0.9538, "step": 30357 }, { "epoch": 0.57, "learning_rate": 2.035106618945447e-06, "loss": 0.79, "step": 30358 }, { "epoch": 0.57, "learning_rate": 2.0349565188439426e-06, "loss": 0.8678, "step": 30359 }, { "epoch": 0.57, "learning_rate": 2.0348064204788946e-06, "loss": 0.9081, "step": 30360 }, { "epoch": 0.57, "learning_rate": 2.034656323850867e-06, "loss": 0.9904, "step": 30361 }, { "epoch": 0.57, "learning_rate": 2.034506228960417e-06, "loss": 0.998, "step": 30362 }, { "epoch": 0.57, "learning_rate": 2.034356135808107e-06, "loss": 1.0553, "step": 30363 }, { "epoch": 0.57, "learning_rate": 2.034206044394497e-06, "loss": 1.0019, "step": 30364 }, { "epoch": 0.57, "learning_rate": 2.0340559547201477e-06, "loss": 0.9341, "step": 30365 }, { "epoch": 0.57, "learning_rate": 2.033905866785618e-06, "loss": 0.9084, "step": 30366 }, { "epoch": 0.57, "learning_rate": 2.033755780591471e-06, "loss": 0.7034, "step": 30367 }, { "epoch": 0.57, "learning_rate": 2.0336056961382652e-06, "loss": 1.0175, "step": 30368 }, { "epoch": 0.57, "learning_rate": 2.03345561342656e-06, "loss": 1.1115, "step": 30369 }, { "epoch": 0.57, "learning_rate": 2.0333055324569186e-06, "loss": 0.8631, "step": 30370 }, { "epoch": 0.57, "learning_rate": 2.0331554532299004e-06, "loss": 0.83, "step": 30371 }, { "epoch": 0.57, "learning_rate": 2.033005375746064e-06, "loss": 0.9307, "step": 30372 }, { "epoch": 0.57, "learning_rate": 2.0328553000059725e-06, "loss": 0.8417, "step": 30373 }, { "epoch": 0.57, "learning_rate": 2.0327052260101853e-06, "loss": 0.9713, "step": 30374 }, { "epoch": 0.57, "learning_rate": 2.032555153759261e-06, "loss": 1.0637, "step": 30375 }, { "epoch": 0.57, "learning_rate": 2.0324050832537623e-06, "loss": 1.0235, "step": 30376 }, { "epoch": 0.57, "learning_rate": 2.0322550144942485e-06, "loss": 1.0005, "step": 30377 }, { "epoch": 0.57, "learning_rate": 2.0321049474812793e-06, "loss": 0.8594, "step": 30378 }, { "epoch": 0.57, "learning_rate": 2.0319548822154172e-06, "loss": 0.7059, "step": 30379 }, { "epoch": 0.57, "learning_rate": 2.0318048186972213e-06, "loss": 1.0095, "step": 30380 }, { "epoch": 0.57, "learning_rate": 2.0316547569272505e-06, "loss": 0.9167, "step": 30381 }, { "epoch": 0.57, "learning_rate": 2.0315046969060674e-06, "loss": 1.0617, "step": 30382 }, { "epoch": 0.57, "learning_rate": 2.0313546386342313e-06, "loss": 0.934, "step": 30383 }, { "epoch": 0.57, "learning_rate": 2.0312045821123026e-06, "loss": 0.7864, "step": 30384 }, { "epoch": 0.57, "learning_rate": 2.0310545273408412e-06, "loss": 0.929, "step": 30385 }, { "epoch": 0.57, "learning_rate": 2.0309044743204087e-06, "loss": 1.0499, "step": 30386 }, { "epoch": 0.57, "learning_rate": 2.0307544230515636e-06, "loss": 1.2539, "step": 30387 }, { "epoch": 0.57, "learning_rate": 2.0306043735348676e-06, "loss": 0.9072, "step": 30388 }, { "epoch": 0.57, "learning_rate": 2.030454325770881e-06, "loss": 0.93, "step": 30389 }, { "epoch": 0.57, "learning_rate": 2.0303042797601623e-06, "loss": 1.066, "step": 30390 }, { "epoch": 0.57, "learning_rate": 2.0301542355032737e-06, "loss": 0.762, "step": 30391 }, { "epoch": 0.57, "learning_rate": 2.030004193000775e-06, "loss": 1.0852, "step": 30392 }, { "epoch": 0.57, "learning_rate": 2.029854152253225e-06, "loss": 1.0177, "step": 30393 }, { "epoch": 0.57, "learning_rate": 2.0297041132611866e-06, "loss": 1.0023, "step": 30394 }, { "epoch": 0.57, "learning_rate": 2.029554076025219e-06, "loss": 0.8418, "step": 30395 }, { "epoch": 0.57, "learning_rate": 2.0294040405458804e-06, "loss": 0.9306, "step": 30396 }, { "epoch": 0.57, "learning_rate": 2.0292540068237336e-06, "loss": 0.8728, "step": 30397 }, { "epoch": 0.57, "learning_rate": 2.0291039748593382e-06, "loss": 0.8535, "step": 30398 }, { "epoch": 0.57, "learning_rate": 2.0289539446532528e-06, "loss": 0.9292, "step": 30399 }, { "epoch": 0.57, "learning_rate": 2.02880391620604e-06, "loss": 1.2115, "step": 30400 }, { "epoch": 0.57, "learning_rate": 2.0286538895182593e-06, "loss": 0.7807, "step": 30401 }, { "epoch": 0.57, "learning_rate": 2.0285038645904694e-06, "loss": 0.8559, "step": 30402 }, { "epoch": 0.57, "learning_rate": 2.028353841423233e-06, "loss": 0.8719, "step": 30403 }, { "epoch": 0.57, "learning_rate": 2.0282038200171077e-06, "loss": 0.6193, "step": 30404 }, { "epoch": 0.57, "learning_rate": 2.0280538003726553e-06, "loss": 0.8844, "step": 30405 }, { "epoch": 0.57, "learning_rate": 2.0279037824904355e-06, "loss": 1.1451, "step": 30406 }, { "epoch": 0.57, "learning_rate": 2.027753766371009e-06, "loss": 0.8645, "step": 30407 }, { "epoch": 0.57, "learning_rate": 2.027603752014934e-06, "loss": 0.8733, "step": 30408 }, { "epoch": 0.57, "learning_rate": 2.0274537394227737e-06, "loss": 0.8993, "step": 30409 }, { "epoch": 0.57, "learning_rate": 2.0273037285950864e-06, "loss": 0.7079, "step": 30410 }, { "epoch": 0.57, "learning_rate": 2.0271537195324316e-06, "loss": 0.9201, "step": 30411 }, { "epoch": 0.57, "learning_rate": 2.0270037122353707e-06, "loss": 1.2246, "step": 30412 }, { "epoch": 0.57, "learning_rate": 2.0268537067044638e-06, "loss": 0.9226, "step": 30413 }, { "epoch": 0.57, "learning_rate": 2.0267037029402698e-06, "loss": 0.9561, "step": 30414 }, { "epoch": 0.57, "learning_rate": 2.0265537009433507e-06, "loss": 0.8366, "step": 30415 }, { "epoch": 0.57, "learning_rate": 2.0264037007142657e-06, "loss": 0.9004, "step": 30416 }, { "epoch": 0.57, "learning_rate": 2.0262537022535737e-06, "loss": 0.6516, "step": 30417 }, { "epoch": 0.57, "learning_rate": 2.0261037055618367e-06, "loss": 0.929, "step": 30418 }, { "epoch": 0.57, "learning_rate": 2.0259537106396134e-06, "loss": 1.0478, "step": 30419 }, { "epoch": 0.57, "learning_rate": 2.025803717487464e-06, "loss": 0.9505, "step": 30420 }, { "epoch": 0.57, "learning_rate": 2.02565372610595e-06, "loss": 0.6891, "step": 30421 }, { "epoch": 0.57, "learning_rate": 2.0255037364956302e-06, "loss": 0.8871, "step": 30422 }, { "epoch": 0.57, "learning_rate": 2.0253537486570643e-06, "loss": 0.8171, "step": 30423 }, { "epoch": 0.57, "learning_rate": 2.025203762590814e-06, "loss": 1.0007, "step": 30424 }, { "epoch": 0.57, "learning_rate": 2.025053778297437e-06, "loss": 0.9972, "step": 30425 }, { "epoch": 0.57, "learning_rate": 2.0249037957774955e-06, "loss": 0.852, "step": 30426 }, { "epoch": 0.57, "learning_rate": 2.024753815031548e-06, "loss": 0.9111, "step": 30427 }, { "epoch": 0.57, "learning_rate": 2.0246038360601563e-06, "loss": 0.8569, "step": 30428 }, { "epoch": 0.57, "learning_rate": 2.0244538588638783e-06, "loss": 0.7387, "step": 30429 }, { "epoch": 0.57, "learning_rate": 2.0243038834432757e-06, "loss": 0.9549, "step": 30430 }, { "epoch": 0.57, "learning_rate": 2.0241539097989075e-06, "loss": 1.024, "step": 30431 }, { "epoch": 0.57, "learning_rate": 2.0240039379313337e-06, "loss": 1.1041, "step": 30432 }, { "epoch": 0.57, "learning_rate": 2.0238539678411145e-06, "loss": 1.0635, "step": 30433 }, { "epoch": 0.57, "learning_rate": 2.023703999528811e-06, "loss": 0.8539, "step": 30434 }, { "epoch": 0.57, "learning_rate": 2.023554032994981e-06, "loss": 1.0587, "step": 30435 }, { "epoch": 0.57, "learning_rate": 2.0234040682401867e-06, "loss": 0.8069, "step": 30436 }, { "epoch": 0.57, "learning_rate": 2.0232541052649867e-06, "loss": 0.9299, "step": 30437 }, { "epoch": 0.57, "learning_rate": 2.0231041440699403e-06, "loss": 1.0872, "step": 30438 }, { "epoch": 0.57, "learning_rate": 2.0229541846556096e-06, "loss": 0.895, "step": 30439 }, { "epoch": 0.57, "learning_rate": 2.0228042270225524e-06, "loss": 0.7937, "step": 30440 }, { "epoch": 0.57, "learning_rate": 2.0226542711713297e-06, "loss": 0.8591, "step": 30441 }, { "epoch": 0.57, "learning_rate": 2.022504317102502e-06, "loss": 0.9711, "step": 30442 }, { "epoch": 0.57, "learning_rate": 2.0223543648166286e-06, "loss": 1.0719, "step": 30443 }, { "epoch": 0.57, "learning_rate": 2.0222044143142683e-06, "loss": 1.0905, "step": 30444 }, { "epoch": 0.57, "learning_rate": 2.0220544655959834e-06, "loss": 1.0414, "step": 30445 }, { "epoch": 0.57, "learning_rate": 2.0219045186623316e-06, "loss": 0.8175, "step": 30446 }, { "epoch": 0.57, "learning_rate": 2.021754573513874e-06, "loss": 0.7707, "step": 30447 }, { "epoch": 0.57, "learning_rate": 2.0216046301511695e-06, "loss": 0.9953, "step": 30448 }, { "epoch": 0.57, "learning_rate": 2.0214546885747796e-06, "loss": 1.0341, "step": 30449 }, { "epoch": 0.57, "learning_rate": 2.021304748785262e-06, "loss": 1.1949, "step": 30450 }, { "epoch": 0.57, "learning_rate": 2.021154810783179e-06, "loss": 0.8364, "step": 30451 }, { "epoch": 0.57, "learning_rate": 2.0210048745690896e-06, "loss": 0.8499, "step": 30452 }, { "epoch": 0.57, "learning_rate": 2.020854940143552e-06, "loss": 0.7974, "step": 30453 }, { "epoch": 0.57, "learning_rate": 2.0207050075071276e-06, "loss": 0.9001, "step": 30454 }, { "epoch": 0.57, "learning_rate": 2.0205550766603764e-06, "loss": 0.9328, "step": 30455 }, { "epoch": 0.57, "learning_rate": 2.0204051476038586e-06, "loss": 1.0957, "step": 30456 }, { "epoch": 0.57, "learning_rate": 2.020255220338132e-06, "loss": 0.9649, "step": 30457 }, { "epoch": 0.57, "learning_rate": 2.0201052948637583e-06, "loss": 0.8261, "step": 30458 }, { "epoch": 0.57, "learning_rate": 2.0199553711812965e-06, "loss": 0.9887, "step": 30459 }, { "epoch": 0.57, "learning_rate": 2.0198054492913064e-06, "loss": 0.7042, "step": 30460 }, { "epoch": 0.57, "learning_rate": 2.019655529194348e-06, "loss": 0.9013, "step": 30461 }, { "epoch": 0.57, "learning_rate": 2.0195056108909822e-06, "loss": 1.0907, "step": 30462 }, { "epoch": 0.57, "learning_rate": 2.019355694381766e-06, "loss": 0.9622, "step": 30463 }, { "epoch": 0.57, "learning_rate": 2.0192057796672625e-06, "loss": 0.778, "step": 30464 }, { "epoch": 0.57, "learning_rate": 2.0190558667480297e-06, "loss": 1.0453, "step": 30465 }, { "epoch": 0.57, "learning_rate": 2.018905955624626e-06, "loss": 0.8357, "step": 30466 }, { "epoch": 0.57, "learning_rate": 2.018756046297614e-06, "loss": 1.1327, "step": 30467 }, { "epoch": 0.57, "learning_rate": 2.0186061387675525e-06, "loss": 1.0073, "step": 30468 }, { "epoch": 0.57, "learning_rate": 2.0184562330349996e-06, "loss": 1.0034, "step": 30469 }, { "epoch": 0.57, "learning_rate": 2.0183063291005176e-06, "loss": 1.0125, "step": 30470 }, { "epoch": 0.57, "learning_rate": 2.0181564269646648e-06, "loss": 0.837, "step": 30471 }, { "epoch": 0.57, "learning_rate": 2.018006526628e-06, "loss": 0.8501, "step": 30472 }, { "epoch": 0.57, "learning_rate": 2.0178566280910857e-06, "loss": 0.8948, "step": 30473 }, { "epoch": 0.57, "learning_rate": 2.017706731354479e-06, "loss": 0.9208, "step": 30474 }, { "epoch": 0.57, "learning_rate": 2.01755683641874e-06, "loss": 1.136, "step": 30475 }, { "epoch": 0.57, "learning_rate": 2.01740694328443e-06, "loss": 0.8979, "step": 30476 }, { "epoch": 0.58, "learning_rate": 2.0172570519521077e-06, "loss": 1.0006, "step": 30477 }, { "epoch": 0.58, "learning_rate": 2.017107162422332e-06, "loss": 0.9242, "step": 30478 }, { "epoch": 0.58, "learning_rate": 2.0169572746956645e-06, "loss": 0.8887, "step": 30479 }, { "epoch": 0.58, "learning_rate": 2.0168073887726626e-06, "loss": 0.8864, "step": 30480 }, { "epoch": 0.58, "learning_rate": 2.016657504653888e-06, "loss": 0.9616, "step": 30481 }, { "epoch": 0.58, "learning_rate": 2.0165076223398987e-06, "loss": 1.0473, "step": 30482 }, { "epoch": 0.58, "learning_rate": 2.016357741831256e-06, "loss": 1.0657, "step": 30483 }, { "epoch": 0.58, "learning_rate": 2.016207863128517e-06, "loss": 0.9747, "step": 30484 }, { "epoch": 0.58, "learning_rate": 2.0160579862322445e-06, "loss": 0.825, "step": 30485 }, { "epoch": 0.58, "learning_rate": 2.015908111142997e-06, "loss": 0.9034, "step": 30486 }, { "epoch": 0.58, "learning_rate": 2.015758237861332e-06, "loss": 1.0963, "step": 30487 }, { "epoch": 0.58, "learning_rate": 2.015608366387812e-06, "loss": 0.8434, "step": 30488 }, { "epoch": 0.58, "learning_rate": 2.015458496722996e-06, "loss": 0.8531, "step": 30489 }, { "epoch": 0.58, "learning_rate": 2.0153086288674417e-06, "loss": 0.9233, "step": 30490 }, { "epoch": 0.58, "learning_rate": 2.0151587628217112e-06, "loss": 1.0432, "step": 30491 }, { "epoch": 0.58, "learning_rate": 2.015008898586363e-06, "loss": 0.7287, "step": 30492 }, { "epoch": 0.58, "learning_rate": 2.014859036161956e-06, "loss": 1.0399, "step": 30493 }, { "epoch": 0.58, "learning_rate": 2.0147091755490513e-06, "loss": 0.9602, "step": 30494 }, { "epoch": 0.58, "learning_rate": 2.014559316748207e-06, "loss": 0.9549, "step": 30495 }, { "epoch": 0.58, "learning_rate": 2.014409459759983e-06, "loss": 0.7998, "step": 30496 }, { "epoch": 0.58, "learning_rate": 2.0142596045849406e-06, "loss": 1.0156, "step": 30497 }, { "epoch": 0.58, "learning_rate": 2.0141097512236373e-06, "loss": 0.7946, "step": 30498 }, { "epoch": 0.58, "learning_rate": 2.013959899676633e-06, "loss": 0.9102, "step": 30499 }, { "epoch": 0.58, "learning_rate": 2.0138100499444875e-06, "loss": 1.1743, "step": 30500 }, { "epoch": 0.58, "learning_rate": 2.013660202027761e-06, "loss": 0.9706, "step": 30501 }, { "epoch": 0.58, "learning_rate": 2.0135103559270113e-06, "loss": 0.792, "step": 30502 }, { "epoch": 0.58, "learning_rate": 2.0133605116427994e-06, "loss": 1.1131, "step": 30503 }, { "epoch": 0.58, "learning_rate": 2.0132106691756853e-06, "loss": 0.8809, "step": 30504 }, { "epoch": 0.58, "learning_rate": 2.0130608285262265e-06, "loss": 0.8465, "step": 30505 }, { "epoch": 0.58, "learning_rate": 2.0129109896949844e-06, "loss": 0.9119, "step": 30506 }, { "epoch": 0.58, "learning_rate": 2.012761152682518e-06, "loss": 0.7918, "step": 30507 }, { "epoch": 0.58, "learning_rate": 2.0126113174893854e-06, "loss": 1.0405, "step": 30508 }, { "epoch": 0.58, "learning_rate": 2.0124614841161475e-06, "loss": 0.7984, "step": 30509 }, { "epoch": 0.58, "learning_rate": 2.0123116525633647e-06, "loss": 0.8041, "step": 30510 }, { "epoch": 0.58, "learning_rate": 2.0121618228315934e-06, "loss": 0.8961, "step": 30511 }, { "epoch": 0.58, "learning_rate": 2.012011994921396e-06, "loss": 1.1727, "step": 30512 }, { "epoch": 0.58, "learning_rate": 2.011862168833331e-06, "loss": 0.9935, "step": 30513 }, { "epoch": 0.58, "learning_rate": 2.0117123445679572e-06, "loss": 0.9969, "step": 30514 }, { "epoch": 0.58, "learning_rate": 2.011562522125835e-06, "loss": 0.9915, "step": 30515 }, { "epoch": 0.58, "learning_rate": 2.011412701507523e-06, "loss": 0.8118, "step": 30516 }, { "epoch": 0.58, "learning_rate": 2.0112628827135803e-06, "loss": 0.9428, "step": 30517 }, { "epoch": 0.58, "learning_rate": 2.011113065744568e-06, "loss": 1.0745, "step": 30518 }, { "epoch": 0.58, "learning_rate": 2.010963250601045e-06, "loss": 0.864, "step": 30519 }, { "epoch": 0.58, "learning_rate": 2.0108134372835686e-06, "loss": 0.7986, "step": 30520 }, { "epoch": 0.58, "learning_rate": 2.010663625792701e-06, "loss": 1.0614, "step": 30521 }, { "epoch": 0.58, "learning_rate": 2.0105138161290004e-06, "loss": 1.0718, "step": 30522 }, { "epoch": 0.58, "learning_rate": 2.0103640082930257e-06, "loss": 0.922, "step": 30523 }, { "epoch": 0.58, "learning_rate": 2.010214202285337e-06, "loss": 0.967, "step": 30524 }, { "epoch": 0.58, "learning_rate": 2.010064398106494e-06, "loss": 1.1518, "step": 30525 }, { "epoch": 0.58, "learning_rate": 2.009914595757054e-06, "loss": 0.7897, "step": 30526 }, { "epoch": 0.58, "learning_rate": 2.0097647952375793e-06, "loss": 1.0787, "step": 30527 }, { "epoch": 0.58, "learning_rate": 2.009614996548628e-06, "loss": 0.8391, "step": 30528 }, { "epoch": 0.58, "learning_rate": 2.009465199690758e-06, "loss": 0.9216, "step": 30529 }, { "epoch": 0.58, "learning_rate": 2.0093154046645303e-06, "loss": 0.9116, "step": 30530 }, { "epoch": 0.58, "learning_rate": 2.009165611470505e-06, "loss": 1.0281, "step": 30531 }, { "epoch": 0.58, "learning_rate": 2.0090158201092384e-06, "loss": 0.9626, "step": 30532 }, { "epoch": 0.58, "learning_rate": 2.008866030581293e-06, "loss": 0.7718, "step": 30533 }, { "epoch": 0.58, "learning_rate": 2.0087162428872265e-06, "loss": 0.9391, "step": 30534 }, { "epoch": 0.58, "learning_rate": 2.008566457027598e-06, "loss": 0.8066, "step": 30535 }, { "epoch": 0.58, "learning_rate": 2.008416673002968e-06, "loss": 0.7138, "step": 30536 }, { "epoch": 0.58, "learning_rate": 2.0082668908138948e-06, "loss": 1.028, "step": 30537 }, { "epoch": 0.58, "learning_rate": 2.008117110460937e-06, "loss": 1.107, "step": 30538 }, { "epoch": 0.58, "learning_rate": 2.0079673319446563e-06, "loss": 0.9083, "step": 30539 }, { "epoch": 0.58, "learning_rate": 2.0078175552656104e-06, "loss": 0.8302, "step": 30540 }, { "epoch": 0.58, "learning_rate": 2.0076677804243574e-06, "loss": 0.8233, "step": 30541 }, { "epoch": 0.58, "learning_rate": 2.007518007421459e-06, "loss": 0.9182, "step": 30542 }, { "epoch": 0.58, "learning_rate": 2.007368236257473e-06, "loss": 1.1262, "step": 30543 }, { "epoch": 0.58, "learning_rate": 2.007218466932959e-06, "loss": 1.0309, "step": 30544 }, { "epoch": 0.58, "learning_rate": 2.0070686994484754e-06, "loss": 1.0663, "step": 30545 }, { "epoch": 0.58, "learning_rate": 2.0069189338045832e-06, "loss": 0.731, "step": 30546 }, { "epoch": 0.58, "learning_rate": 2.0067691700018395e-06, "loss": 0.7682, "step": 30547 }, { "epoch": 0.58, "learning_rate": 2.006619408040805e-06, "loss": 0.8025, "step": 30548 }, { "epoch": 0.58, "learning_rate": 2.0064696479220393e-06, "loss": 1.0138, "step": 30549 }, { "epoch": 0.58, "learning_rate": 2.0063198896460996e-06, "loss": 1.1678, "step": 30550 }, { "epoch": 0.58, "learning_rate": 2.0061701332135467e-06, "loss": 0.9156, "step": 30551 }, { "epoch": 0.58, "learning_rate": 2.00602037862494e-06, "loss": 0.937, "step": 30552 }, { "epoch": 0.58, "learning_rate": 2.005870625880837e-06, "loss": 0.8318, "step": 30553 }, { "epoch": 0.58, "learning_rate": 2.0057208749817987e-06, "loss": 0.685, "step": 30554 }, { "epoch": 0.58, "learning_rate": 2.0055711259283838e-06, "loss": 1.0355, "step": 30555 }, { "epoch": 0.58, "learning_rate": 2.00542137872115e-06, "loss": 1.0239, "step": 30556 }, { "epoch": 0.58, "learning_rate": 2.0052716333606586e-06, "loss": 1.0185, "step": 30557 }, { "epoch": 0.58, "learning_rate": 2.0051218898474672e-06, "loss": 1.0607, "step": 30558 }, { "epoch": 0.58, "learning_rate": 2.004972148182135e-06, "loss": 1.0671, "step": 30559 }, { "epoch": 0.58, "learning_rate": 2.004822408365223e-06, "loss": 0.67, "step": 30560 }, { "epoch": 0.58, "learning_rate": 2.0046726703972887e-06, "loss": 0.8978, "step": 30561 }, { "epoch": 0.58, "learning_rate": 2.0045229342788907e-06, "loss": 1.1596, "step": 30562 }, { "epoch": 0.58, "learning_rate": 2.004373200010589e-06, "loss": 1.0627, "step": 30563 }, { "epoch": 0.58, "learning_rate": 2.0042234675929433e-06, "loss": 0.9357, "step": 30564 }, { "epoch": 0.58, "learning_rate": 2.004073737026511e-06, "loss": 0.8088, "step": 30565 }, { "epoch": 0.58, "learning_rate": 2.003924008311853e-06, "loss": 0.8878, "step": 30566 }, { "epoch": 0.58, "learning_rate": 2.003774281449527e-06, "loss": 0.9884, "step": 30567 }, { "epoch": 0.58, "learning_rate": 2.0036245564400924e-06, "loss": 0.9305, "step": 30568 }, { "epoch": 0.58, "learning_rate": 2.0034748332841093e-06, "loss": 1.0657, "step": 30569 }, { "epoch": 0.58, "learning_rate": 2.003325111982136e-06, "loss": 0.9897, "step": 30570 }, { "epoch": 0.58, "learning_rate": 2.0031753925347305e-06, "loss": 0.9122, "step": 30571 }, { "epoch": 0.58, "learning_rate": 2.003025674942453e-06, "loss": 0.8637, "step": 30572 }, { "epoch": 0.58, "learning_rate": 2.0028759592058634e-06, "loss": 0.8369, "step": 30573 }, { "epoch": 0.58, "learning_rate": 2.0027262453255183e-06, "loss": 1.0473, "step": 30574 }, { "epoch": 0.58, "learning_rate": 2.002576533301979e-06, "loss": 1.3323, "step": 30575 }, { "epoch": 0.58, "learning_rate": 2.0024268231358045e-06, "loss": 1.028, "step": 30576 }, { "epoch": 0.58, "learning_rate": 2.0022771148275513e-06, "loss": 0.8854, "step": 30577 }, { "epoch": 0.58, "learning_rate": 2.0021274083777815e-06, "loss": 0.9126, "step": 30578 }, { "epoch": 0.58, "learning_rate": 2.0019777037870518e-06, "loss": 1.0353, "step": 30579 }, { "epoch": 0.58, "learning_rate": 2.0018280010559214e-06, "loss": 0.8314, "step": 30580 }, { "epoch": 0.58, "learning_rate": 2.0016783001849516e-06, "loss": 1.0217, "step": 30581 }, { "epoch": 0.58, "learning_rate": 2.0015286011746994e-06, "loss": 0.8203, "step": 30582 }, { "epoch": 0.58, "learning_rate": 2.0013789040257233e-06, "loss": 0.9388, "step": 30583 }, { "epoch": 0.58, "learning_rate": 2.001229208738584e-06, "loss": 0.9351, "step": 30584 }, { "epoch": 0.58, "learning_rate": 2.001079515313839e-06, "loss": 0.8397, "step": 30585 }, { "epoch": 0.58, "learning_rate": 2.000929823752048e-06, "loss": 0.9376, "step": 30586 }, { "epoch": 0.58, "learning_rate": 2.0007801340537693e-06, "loss": 1.0544, "step": 30587 }, { "epoch": 0.58, "learning_rate": 2.0006304462195633e-06, "loss": 0.9208, "step": 30588 }, { "epoch": 0.58, "learning_rate": 2.0004807602499864e-06, "loss": 0.7426, "step": 30589 }, { "epoch": 0.58, "learning_rate": 2.0003310761456005e-06, "loss": 0.8954, "step": 30590 }, { "epoch": 0.58, "learning_rate": 2.0001813939069627e-06, "loss": 0.8456, "step": 30591 }, { "epoch": 0.58, "learning_rate": 2.0000317135346316e-06, "loss": 0.9805, "step": 30592 }, { "epoch": 0.58, "learning_rate": 1.9998820350291666e-06, "loss": 1.1041, "step": 30593 }, { "epoch": 0.58, "learning_rate": 1.999732358391128e-06, "loss": 1.1304, "step": 30594 }, { "epoch": 0.58, "learning_rate": 1.999582683621072e-06, "loss": 0.9047, "step": 30595 }, { "epoch": 0.58, "learning_rate": 1.99943301071956e-06, "loss": 0.8477, "step": 30596 }, { "epoch": 0.58, "learning_rate": 1.99928333968715e-06, "loss": 0.8739, "step": 30597 }, { "epoch": 0.58, "learning_rate": 1.999133670524399e-06, "loss": 0.6768, "step": 30598 }, { "epoch": 0.58, "learning_rate": 1.9989840032318693e-06, "loss": 0.8237, "step": 30599 }, { "epoch": 0.58, "learning_rate": 1.9988343378101173e-06, "loss": 0.926, "step": 30600 }, { "epoch": 0.58, "learning_rate": 1.9986846742597017e-06, "loss": 1.072, "step": 30601 }, { "epoch": 0.58, "learning_rate": 1.998535012581183e-06, "loss": 0.8141, "step": 30602 }, { "epoch": 0.58, "learning_rate": 1.9983853527751194e-06, "loss": 0.8007, "step": 30603 }, { "epoch": 0.58, "learning_rate": 1.9982356948420688e-06, "loss": 0.7548, "step": 30604 }, { "epoch": 0.58, "learning_rate": 1.998086038782592e-06, "loss": 0.9362, "step": 30605 }, { "epoch": 0.58, "learning_rate": 1.9979363845972453e-06, "loss": 1.0044, "step": 30606 }, { "epoch": 0.58, "learning_rate": 1.997786732286589e-06, "loss": 1.102, "step": 30607 }, { "epoch": 0.58, "learning_rate": 1.9976370818511816e-06, "loss": 0.9342, "step": 30608 }, { "epoch": 0.58, "learning_rate": 1.9974874332915826e-06, "loss": 0.7532, "step": 30609 }, { "epoch": 0.58, "learning_rate": 1.997337786608349e-06, "loss": 0.9864, "step": 30610 }, { "epoch": 0.58, "learning_rate": 1.9971881418020417e-06, "loss": 0.7853, "step": 30611 }, { "epoch": 0.58, "learning_rate": 1.9970384988732188e-06, "loss": 1.1074, "step": 30612 }, { "epoch": 0.58, "learning_rate": 1.9968888578224372e-06, "loss": 1.0043, "step": 30613 }, { "epoch": 0.58, "learning_rate": 1.9967392186502575e-06, "loss": 0.8783, "step": 30614 }, { "epoch": 0.58, "learning_rate": 1.9965895813572394e-06, "loss": 0.8252, "step": 30615 }, { "epoch": 0.58, "learning_rate": 1.9964399459439386e-06, "loss": 0.8706, "step": 30616 }, { "epoch": 0.58, "learning_rate": 1.996290312410917e-06, "loss": 1.0613, "step": 30617 }, { "epoch": 0.58, "learning_rate": 1.9961406807587323e-06, "loss": 1.1066, "step": 30618 }, { "epoch": 0.58, "learning_rate": 1.995991050987941e-06, "loss": 1.0968, "step": 30619 }, { "epoch": 0.58, "learning_rate": 1.9958414230991054e-06, "loss": 0.9839, "step": 30620 }, { "epoch": 0.58, "learning_rate": 1.995691797092782e-06, "loss": 0.8424, "step": 30621 }, { "epoch": 0.58, "learning_rate": 1.995542172969529e-06, "loss": 1.0108, "step": 30622 }, { "epoch": 0.58, "learning_rate": 1.995392550729907e-06, "loss": 0.8866, "step": 30623 }, { "epoch": 0.58, "learning_rate": 1.995242930374474e-06, "loss": 0.888, "step": 30624 }, { "epoch": 0.58, "learning_rate": 1.9950933119037873e-06, "loss": 0.9652, "step": 30625 }, { "epoch": 0.58, "learning_rate": 1.994943695318408e-06, "loss": 0.7875, "step": 30626 }, { "epoch": 0.58, "learning_rate": 1.9947940806188927e-06, "loss": 0.9523, "step": 30627 }, { "epoch": 0.58, "learning_rate": 1.9946444678058006e-06, "loss": 0.8861, "step": 30628 }, { "epoch": 0.58, "learning_rate": 1.994494856879691e-06, "loss": 0.8986, "step": 30629 }, { "epoch": 0.58, "learning_rate": 1.9943452478411224e-06, "loss": 0.9642, "step": 30630 }, { "epoch": 0.58, "learning_rate": 1.994195640690652e-06, "loss": 1.0483, "step": 30631 }, { "epoch": 0.58, "learning_rate": 1.994046035428841e-06, "loss": 0.8537, "step": 30632 }, { "epoch": 0.58, "learning_rate": 1.9938964320562462e-06, "loss": 0.9317, "step": 30633 }, { "epoch": 0.58, "learning_rate": 1.993746830573426e-06, "loss": 0.9661, "step": 30634 }, { "epoch": 0.58, "learning_rate": 1.9935972309809397e-06, "loss": 0.8927, "step": 30635 }, { "epoch": 0.58, "learning_rate": 1.9934476332793465e-06, "loss": 0.6743, "step": 30636 }, { "epoch": 0.58, "learning_rate": 1.9932980374692033e-06, "loss": 1.0362, "step": 30637 }, { "epoch": 0.58, "learning_rate": 1.9931484435510704e-06, "loss": 1.0133, "step": 30638 }, { "epoch": 0.58, "learning_rate": 1.992998851525506e-06, "loss": 0.9048, "step": 30639 }, { "epoch": 0.58, "learning_rate": 1.9928492613930674e-06, "loss": 0.9291, "step": 30640 }, { "epoch": 0.58, "learning_rate": 1.9926996731543146e-06, "loss": 1.0369, "step": 30641 }, { "epoch": 0.58, "learning_rate": 1.9925500868098056e-06, "loss": 0.8255, "step": 30642 }, { "epoch": 0.58, "learning_rate": 1.9924005023600984e-06, "loss": 1.2258, "step": 30643 }, { "epoch": 0.58, "learning_rate": 1.992250919805753e-06, "loss": 0.9936, "step": 30644 }, { "epoch": 0.58, "learning_rate": 1.9921013391473277e-06, "loss": 0.6526, "step": 30645 }, { "epoch": 0.58, "learning_rate": 1.9919517603853793e-06, "loss": 1.0331, "step": 30646 }, { "epoch": 0.58, "learning_rate": 1.991802183520468e-06, "loss": 1.0912, "step": 30647 }, { "epoch": 0.58, "learning_rate": 1.9916526085531514e-06, "loss": 0.8256, "step": 30648 }, { "epoch": 0.58, "learning_rate": 1.9915030354839883e-06, "loss": 0.8326, "step": 30649 }, { "epoch": 0.58, "learning_rate": 1.9913534643135376e-06, "loss": 0.9272, "step": 30650 }, { "epoch": 0.58, "learning_rate": 1.9912038950423575e-06, "loss": 0.8919, "step": 30651 }, { "epoch": 0.58, "learning_rate": 1.991054327671006e-06, "loss": 0.9078, "step": 30652 }, { "epoch": 0.58, "learning_rate": 1.990904762200043e-06, "loss": 0.8886, "step": 30653 }, { "epoch": 0.58, "learning_rate": 1.9907551986300256e-06, "loss": 0.8943, "step": 30654 }, { "epoch": 0.58, "learning_rate": 1.9906056369615117e-06, "loss": 1.0389, "step": 30655 }, { "epoch": 0.58, "learning_rate": 1.9904560771950616e-06, "loss": 1.0668, "step": 30656 }, { "epoch": 0.58, "learning_rate": 1.990306519331233e-06, "loss": 0.894, "step": 30657 }, { "epoch": 0.58, "learning_rate": 1.990156963370583e-06, "loss": 0.9841, "step": 30658 }, { "epoch": 0.58, "learning_rate": 1.990007409313673e-06, "loss": 0.8521, "step": 30659 }, { "epoch": 0.58, "learning_rate": 1.989857857161059e-06, "loss": 0.7372, "step": 30660 }, { "epoch": 0.58, "learning_rate": 1.9897083069132998e-06, "loss": 0.9527, "step": 30661 }, { "epoch": 0.58, "learning_rate": 1.9895587585709545e-06, "loss": 0.9671, "step": 30662 }, { "epoch": 0.58, "learning_rate": 1.989409212134581e-06, "loss": 0.9427, "step": 30663 }, { "epoch": 0.58, "learning_rate": 1.9892596676047376e-06, "loss": 1.0454, "step": 30664 }, { "epoch": 0.58, "learning_rate": 1.9891101249819835e-06, "loss": 0.9367, "step": 30665 }, { "epoch": 0.58, "learning_rate": 1.988960584266877e-06, "loss": 0.9971, "step": 30666 }, { "epoch": 0.58, "learning_rate": 1.9888110454599745e-06, "loss": 0.8606, "step": 30667 }, { "epoch": 0.58, "learning_rate": 1.988661508561837e-06, "loss": 1.0097, "step": 30668 }, { "epoch": 0.58, "learning_rate": 1.9885119735730214e-06, "loss": 1.2507, "step": 30669 }, { "epoch": 0.58, "learning_rate": 1.9883624404940858e-06, "loss": 0.9063, "step": 30670 }, { "epoch": 0.58, "learning_rate": 1.98821290932559e-06, "loss": 1.1106, "step": 30671 }, { "epoch": 0.58, "learning_rate": 1.988063380068092e-06, "loss": 0.9, "step": 30672 }, { "epoch": 0.58, "learning_rate": 1.987913852722148e-06, "loss": 0.8443, "step": 30673 }, { "epoch": 0.58, "learning_rate": 1.9877643272883196e-06, "loss": 1.0942, "step": 30674 }, { "epoch": 0.58, "learning_rate": 1.9876148037671627e-06, "loss": 1.1787, "step": 30675 }, { "epoch": 0.58, "learning_rate": 1.9874652821592364e-06, "loss": 1.0474, "step": 30676 }, { "epoch": 0.58, "learning_rate": 1.9873157624650992e-06, "loss": 0.942, "step": 30677 }, { "epoch": 0.58, "learning_rate": 1.9871662446853095e-06, "loss": 0.8667, "step": 30678 }, { "epoch": 0.58, "learning_rate": 1.987016728820424e-06, "loss": 0.811, "step": 30679 }, { "epoch": 0.58, "learning_rate": 1.986867214871004e-06, "loss": 0.9906, "step": 30680 }, { "epoch": 0.58, "learning_rate": 1.9867177028376055e-06, "loss": 0.8916, "step": 30681 }, { "epoch": 0.58, "learning_rate": 1.9865681927207865e-06, "loss": 1.0377, "step": 30682 }, { "epoch": 0.58, "learning_rate": 1.986418684521107e-06, "loss": 0.7223, "step": 30683 }, { "epoch": 0.58, "learning_rate": 1.9862691782391248e-06, "loss": 0.9802, "step": 30684 }, { "epoch": 0.58, "learning_rate": 1.9861196738753963e-06, "loss": 0.7882, "step": 30685 }, { "epoch": 0.58, "learning_rate": 1.9859701714304825e-06, "loss": 0.8995, "step": 30686 }, { "epoch": 0.58, "learning_rate": 1.9858206709049403e-06, "loss": 1.063, "step": 30687 }, { "epoch": 0.58, "learning_rate": 1.9856711722993274e-06, "loss": 0.8097, "step": 30688 }, { "epoch": 0.58, "learning_rate": 1.9855216756142025e-06, "loss": 0.8563, "step": 30689 }, { "epoch": 0.58, "learning_rate": 1.985372180850124e-06, "loss": 0.9403, "step": 30690 }, { "epoch": 0.58, "learning_rate": 1.985222688007651e-06, "loss": 0.7711, "step": 30691 }, { "epoch": 0.58, "learning_rate": 1.9850731970873388e-06, "loss": 0.9095, "step": 30692 }, { "epoch": 0.58, "learning_rate": 1.984923708089749e-06, "loss": 1.1334, "step": 30693 }, { "epoch": 0.58, "learning_rate": 1.984774221015438e-06, "loss": 0.9663, "step": 30694 }, { "epoch": 0.58, "learning_rate": 1.9846247358649634e-06, "loss": 0.9322, "step": 30695 }, { "epoch": 0.58, "learning_rate": 1.984475252638885e-06, "loss": 0.8312, "step": 30696 }, { "epoch": 0.58, "learning_rate": 1.9843257713377605e-06, "loss": 0.8212, "step": 30697 }, { "epoch": 0.58, "learning_rate": 1.9841762919621465e-06, "loss": 0.714, "step": 30698 }, { "epoch": 0.58, "learning_rate": 1.9840268145126036e-06, "loss": 1.0894, "step": 30699 }, { "epoch": 0.58, "learning_rate": 1.983877338989689e-06, "loss": 1.0818, "step": 30700 }, { "epoch": 0.58, "learning_rate": 1.983727865393959e-06, "loss": 0.8763, "step": 30701 }, { "epoch": 0.58, "learning_rate": 1.9835783937259752e-06, "loss": 1.0094, "step": 30702 }, { "epoch": 0.58, "learning_rate": 1.9834289239862923e-06, "loss": 0.787, "step": 30703 }, { "epoch": 0.58, "learning_rate": 1.9832794561754702e-06, "loss": 0.7509, "step": 30704 }, { "epoch": 0.58, "learning_rate": 1.9831299902940677e-06, "loss": 0.97, "step": 30705 }, { "epoch": 0.58, "learning_rate": 1.982980526342642e-06, "loss": 0.9986, "step": 30706 }, { "epoch": 0.58, "learning_rate": 1.9828310643217496e-06, "loss": 1.0092, "step": 30707 }, { "epoch": 0.58, "learning_rate": 1.9826816042319518e-06, "loss": 0.9116, "step": 30708 }, { "epoch": 0.58, "learning_rate": 1.982532146073804e-06, "loss": 0.8616, "step": 30709 }, { "epoch": 0.58, "learning_rate": 1.982382689847866e-06, "loss": 0.9618, "step": 30710 }, { "epoch": 0.58, "learning_rate": 1.9822332355546946e-06, "loss": 0.8403, "step": 30711 }, { "epoch": 0.58, "learning_rate": 1.982083783194849e-06, "loss": 1.1411, "step": 30712 }, { "epoch": 0.58, "learning_rate": 1.9819343327688857e-06, "loss": 0.8843, "step": 30713 }, { "epoch": 0.58, "learning_rate": 1.9817848842773648e-06, "loss": 0.7917, "step": 30714 }, { "epoch": 0.58, "learning_rate": 1.981635437720843e-06, "loss": 0.8212, "step": 30715 }, { "epoch": 0.58, "learning_rate": 1.9814859930998782e-06, "loss": 1.0861, "step": 30716 }, { "epoch": 0.58, "learning_rate": 1.9813365504150286e-06, "loss": 0.8376, "step": 30717 }, { "epoch": 0.58, "learning_rate": 1.9811871096668533e-06, "loss": 0.9199, "step": 30718 }, { "epoch": 0.58, "learning_rate": 1.9810376708559084e-06, "loss": 0.852, "step": 30719 }, { "epoch": 0.58, "learning_rate": 1.980888233982754e-06, "loss": 1.0091, "step": 30720 }, { "epoch": 0.58, "learning_rate": 1.980738799047947e-06, "loss": 0.8124, "step": 30721 }, { "epoch": 0.58, "learning_rate": 1.980589366052044e-06, "loss": 0.9088, "step": 30722 }, { "epoch": 0.58, "learning_rate": 1.980439934995606e-06, "loss": 0.8899, "step": 30723 }, { "epoch": 0.58, "learning_rate": 1.980290505879188e-06, "loss": 0.9803, "step": 30724 }, { "epoch": 0.58, "learning_rate": 1.9801410787033495e-06, "loss": 1.0377, "step": 30725 }, { "epoch": 0.58, "learning_rate": 1.979991653468649e-06, "loss": 0.7961, "step": 30726 }, { "epoch": 0.58, "learning_rate": 1.979842230175644e-06, "loss": 0.986, "step": 30727 }, { "epoch": 0.58, "learning_rate": 1.979692808824891e-06, "loss": 0.8056, "step": 30728 }, { "epoch": 0.58, "learning_rate": 1.9795433894169503e-06, "loss": 0.8154, "step": 30729 }, { "epoch": 0.58, "learning_rate": 1.979393971952378e-06, "loss": 0.8829, "step": 30730 }, { "epoch": 0.58, "learning_rate": 1.979244556431732e-06, "loss": 1.0617, "step": 30731 }, { "epoch": 0.58, "learning_rate": 1.9790951428555717e-06, "loss": 0.7419, "step": 30732 }, { "epoch": 0.58, "learning_rate": 1.9789457312244546e-06, "loss": 0.8237, "step": 30733 }, { "epoch": 0.58, "learning_rate": 1.9787963215389367e-06, "loss": 0.9186, "step": 30734 }, { "epoch": 0.58, "learning_rate": 1.9786469137995786e-06, "loss": 0.8817, "step": 30735 }, { "epoch": 0.58, "learning_rate": 1.9784975080069373e-06, "loss": 0.8773, "step": 30736 }, { "epoch": 0.58, "learning_rate": 1.9783481041615688e-06, "loss": 1.0508, "step": 30737 }, { "epoch": 0.58, "learning_rate": 1.978198702264033e-06, "loss": 0.9236, "step": 30738 }, { "epoch": 0.58, "learning_rate": 1.9780493023148877e-06, "loss": 0.9361, "step": 30739 }, { "epoch": 0.58, "learning_rate": 1.9778999043146895e-06, "loss": 0.9846, "step": 30740 }, { "epoch": 0.58, "learning_rate": 1.9777505082639985e-06, "loss": 0.7986, "step": 30741 }, { "epoch": 0.58, "learning_rate": 1.9776011141633706e-06, "loss": 0.8886, "step": 30742 }, { "epoch": 0.58, "learning_rate": 1.977451722013363e-06, "loss": 1.0276, "step": 30743 }, { "epoch": 0.58, "learning_rate": 1.977302331814536e-06, "loss": 1.0068, "step": 30744 }, { "epoch": 0.58, "learning_rate": 1.977152943567445e-06, "loss": 0.7104, "step": 30745 }, { "epoch": 0.58, "learning_rate": 1.977003557272649e-06, "loss": 0.9465, "step": 30746 }, { "epoch": 0.58, "learning_rate": 1.9768541729307065e-06, "loss": 1.0667, "step": 30747 }, { "epoch": 0.58, "learning_rate": 1.9767047905421742e-06, "loss": 1.0706, "step": 30748 }, { "epoch": 0.58, "learning_rate": 1.9765554101076097e-06, "loss": 1.0593, "step": 30749 }, { "epoch": 0.58, "learning_rate": 1.976406031627572e-06, "loss": 1.1517, "step": 30750 }, { "epoch": 0.58, "learning_rate": 1.9762566551026172e-06, "loss": 0.8998, "step": 30751 }, { "epoch": 0.58, "learning_rate": 1.9761072805333044e-06, "loss": 0.8961, "step": 30752 }, { "epoch": 0.58, "learning_rate": 1.975957907920191e-06, "loss": 0.7806, "step": 30753 }, { "epoch": 0.58, "learning_rate": 1.975808537263835e-06, "loss": 1.0274, "step": 30754 }, { "epoch": 0.58, "learning_rate": 1.975659168564793e-06, "loss": 1.1113, "step": 30755 }, { "epoch": 0.58, "learning_rate": 1.9755098018236246e-06, "loss": 0.9115, "step": 30756 }, { "epoch": 0.58, "learning_rate": 1.9753604370408864e-06, "loss": 1.1658, "step": 30757 }, { "epoch": 0.58, "learning_rate": 1.975211074217135e-06, "loss": 0.6848, "step": 30758 }, { "epoch": 0.58, "learning_rate": 1.9750617133529305e-06, "loss": 0.8562, "step": 30759 }, { "epoch": 0.58, "learning_rate": 1.9749123544488297e-06, "loss": 0.8276, "step": 30760 }, { "epoch": 0.58, "learning_rate": 1.974762997505389e-06, "loss": 1.0002, "step": 30761 }, { "epoch": 0.58, "learning_rate": 1.974613642523168e-06, "loss": 1.1771, "step": 30762 }, { "epoch": 0.58, "learning_rate": 1.9744642895027236e-06, "loss": 0.9481, "step": 30763 }, { "epoch": 0.58, "learning_rate": 1.9743149384446123e-06, "loss": 0.7843, "step": 30764 }, { "epoch": 0.58, "learning_rate": 1.9741655893493944e-06, "loss": 0.7527, "step": 30765 }, { "epoch": 0.58, "learning_rate": 1.9740162422176255e-06, "loss": 0.9171, "step": 30766 }, { "epoch": 0.58, "learning_rate": 1.973866897049863e-06, "loss": 0.9421, "step": 30767 }, { "epoch": 0.58, "learning_rate": 1.9737175538466665e-06, "loss": 1.0133, "step": 30768 }, { "epoch": 0.58, "learning_rate": 1.9735682126085927e-06, "loss": 1.0316, "step": 30769 }, { "epoch": 0.58, "learning_rate": 1.9734188733361977e-06, "loss": 0.848, "step": 30770 }, { "epoch": 0.58, "learning_rate": 1.9732695360300416e-06, "loss": 0.7946, "step": 30771 }, { "epoch": 0.58, "learning_rate": 1.9731202006906806e-06, "loss": 0.9032, "step": 30772 }, { "epoch": 0.58, "learning_rate": 1.9729708673186727e-06, "loss": 0.6787, "step": 30773 }, { "epoch": 0.58, "learning_rate": 1.9728215359145748e-06, "loss": 0.8658, "step": 30774 }, { "epoch": 0.58, "learning_rate": 1.9726722064789463e-06, "loss": 1.181, "step": 30775 }, { "epoch": 0.58, "learning_rate": 1.972522879012342e-06, "loss": 0.7539, "step": 30776 }, { "epoch": 0.58, "learning_rate": 1.9723735535153226e-06, "loss": 0.9647, "step": 30777 }, { "epoch": 0.58, "learning_rate": 1.9722242299884443e-06, "loss": 0.8975, "step": 30778 }, { "epoch": 0.58, "learning_rate": 1.972074908432263e-06, "loss": 0.8338, "step": 30779 }, { "epoch": 0.58, "learning_rate": 1.9719255888473385e-06, "loss": 1.1161, "step": 30780 }, { "epoch": 0.58, "learning_rate": 1.9717762712342282e-06, "loss": 1.1577, "step": 30781 }, { "epoch": 0.58, "learning_rate": 1.971626955593488e-06, "loss": 0.8961, "step": 30782 }, { "epoch": 0.58, "learning_rate": 1.971477641925678e-06, "loss": 0.7621, "step": 30783 }, { "epoch": 0.58, "learning_rate": 1.9713283302313536e-06, "loss": 0.8608, "step": 30784 }, { "epoch": 0.58, "learning_rate": 1.9711790205110726e-06, "loss": 0.9218, "step": 30785 }, { "epoch": 0.58, "learning_rate": 1.971029712765394e-06, "loss": 0.9704, "step": 30786 }, { "epoch": 0.58, "learning_rate": 1.970880406994873e-06, "loss": 1.0904, "step": 30787 }, { "epoch": 0.58, "learning_rate": 1.9707311032000682e-06, "loss": 1.0074, "step": 30788 }, { "epoch": 0.58, "learning_rate": 1.9705818013815386e-06, "loss": 0.8763, "step": 30789 }, { "epoch": 0.58, "learning_rate": 1.97043250153984e-06, "loss": 0.8677, "step": 30790 }, { "epoch": 0.58, "learning_rate": 1.970283203675529e-06, "loss": 0.8438, "step": 30791 }, { "epoch": 0.58, "learning_rate": 1.970133907789165e-06, "loss": 1.0554, "step": 30792 }, { "epoch": 0.58, "learning_rate": 1.9699846138813053e-06, "loss": 1.0491, "step": 30793 }, { "epoch": 0.58, "learning_rate": 1.9698353219525062e-06, "loss": 1.0188, "step": 30794 }, { "epoch": 0.58, "learning_rate": 1.9696860320033256e-06, "loss": 1.0262, "step": 30795 }, { "epoch": 0.58, "learning_rate": 1.969536744034322e-06, "loss": 0.809, "step": 30796 }, { "epoch": 0.58, "learning_rate": 1.969387458046051e-06, "loss": 0.9856, "step": 30797 }, { "epoch": 0.58, "learning_rate": 1.969238174039071e-06, "loss": 0.8549, "step": 30798 }, { "epoch": 0.58, "learning_rate": 1.9690888920139403e-06, "loss": 0.8559, "step": 30799 }, { "epoch": 0.58, "learning_rate": 1.9689396119712145e-06, "loss": 1.3096, "step": 30800 }, { "epoch": 0.58, "learning_rate": 1.9687903339114516e-06, "loss": 0.7068, "step": 30801 }, { "epoch": 0.58, "learning_rate": 1.9686410578352103e-06, "loss": 0.8843, "step": 30802 }, { "epoch": 0.58, "learning_rate": 1.9684917837430463e-06, "loss": 0.9223, "step": 30803 }, { "epoch": 0.58, "learning_rate": 1.9683425116355182e-06, "loss": 0.7383, "step": 30804 }, { "epoch": 0.58, "learning_rate": 1.968193241513183e-06, "loss": 0.6998, "step": 30805 }, { "epoch": 0.58, "learning_rate": 1.968043973376597e-06, "loss": 1.0524, "step": 30806 }, { "epoch": 0.58, "learning_rate": 1.9678947072263194e-06, "loss": 0.9833, "step": 30807 }, { "epoch": 0.58, "learning_rate": 1.967745443062906e-06, "loss": 0.8644, "step": 30808 }, { "epoch": 0.58, "learning_rate": 1.9675961808869144e-06, "loss": 0.9351, "step": 30809 }, { "epoch": 0.58, "learning_rate": 1.9674469206989038e-06, "loss": 0.9012, "step": 30810 }, { "epoch": 0.58, "learning_rate": 1.9672976624994292e-06, "loss": 0.845, "step": 30811 }, { "epoch": 0.58, "learning_rate": 1.9671484062890485e-06, "loss": 1.0672, "step": 30812 }, { "epoch": 0.58, "learning_rate": 1.9669991520683203e-06, "loss": 0.9284, "step": 30813 }, { "epoch": 0.58, "learning_rate": 1.9668498998378e-06, "loss": 0.8651, "step": 30814 }, { "epoch": 0.58, "learning_rate": 1.966700649598046e-06, "loss": 0.8877, "step": 30815 }, { "epoch": 0.58, "learning_rate": 1.9665514013496155e-06, "loss": 0.8245, "step": 30816 }, { "epoch": 0.58, "learning_rate": 1.9664021550930663e-06, "loss": 0.8219, "step": 30817 }, { "epoch": 0.58, "learning_rate": 1.9662529108289537e-06, "loss": 1.0128, "step": 30818 }, { "epoch": 0.58, "learning_rate": 1.9661036685578376e-06, "loss": 1.0698, "step": 30819 }, { "epoch": 0.58, "learning_rate": 1.9659544282802745e-06, "loss": 0.9176, "step": 30820 }, { "epoch": 0.58, "learning_rate": 1.9658051899968193e-06, "loss": 1.019, "step": 30821 }, { "epoch": 0.58, "learning_rate": 1.9656559537080326e-06, "loss": 0.9001, "step": 30822 }, { "epoch": 0.58, "learning_rate": 1.96550671941447e-06, "loss": 0.7297, "step": 30823 }, { "epoch": 0.58, "learning_rate": 1.965357487116688e-06, "loss": 1.1895, "step": 30824 }, { "epoch": 0.58, "learning_rate": 1.965208256815246e-06, "loss": 1.2362, "step": 30825 }, { "epoch": 0.58, "learning_rate": 1.9650590285107e-06, "loss": 0.9553, "step": 30826 }, { "epoch": 0.58, "learning_rate": 1.9649098022036058e-06, "loss": 1.0596, "step": 30827 }, { "epoch": 0.58, "learning_rate": 1.9647605778945234e-06, "loss": 0.9333, "step": 30828 }, { "epoch": 0.58, "learning_rate": 1.9646113555840076e-06, "loss": 0.7681, "step": 30829 }, { "epoch": 0.58, "learning_rate": 1.9644621352726167e-06, "loss": 0.8583, "step": 30830 }, { "epoch": 0.58, "learning_rate": 1.9643129169609083e-06, "loss": 1.097, "step": 30831 }, { "epoch": 0.58, "learning_rate": 1.964163700649439e-06, "loss": 1.0274, "step": 30832 }, { "epoch": 0.58, "learning_rate": 1.9640144863387653e-06, "loss": 0.8833, "step": 30833 }, { "epoch": 0.58, "learning_rate": 1.9638652740294462e-06, "loss": 0.9854, "step": 30834 }, { "epoch": 0.58, "learning_rate": 1.9637160637220366e-06, "loss": 1.1226, "step": 30835 }, { "epoch": 0.58, "learning_rate": 1.9635668554170954e-06, "loss": 0.8479, "step": 30836 }, { "epoch": 0.58, "learning_rate": 1.963417649115179e-06, "loss": 1.2788, "step": 30837 }, { "epoch": 0.58, "learning_rate": 1.963268444816845e-06, "loss": 0.9297, "step": 30838 }, { "epoch": 0.58, "learning_rate": 1.963119242522649e-06, "loss": 1.0663, "step": 30839 }, { "epoch": 0.58, "learning_rate": 1.9629700422331505e-06, "loss": 0.8435, "step": 30840 }, { "epoch": 0.58, "learning_rate": 1.9628208439489056e-06, "loss": 0.8638, "step": 30841 }, { "epoch": 0.58, "learning_rate": 1.96267164767047e-06, "loss": 1.0239, "step": 30842 }, { "epoch": 0.58, "learning_rate": 1.9625224533984027e-06, "loss": 0.9779, "step": 30843 }, { "epoch": 0.58, "learning_rate": 1.9623732611332602e-06, "loss": 1.1224, "step": 30844 }, { "epoch": 0.58, "learning_rate": 1.9622240708755986e-06, "loss": 0.8641, "step": 30845 }, { "epoch": 0.58, "learning_rate": 1.962074882625977e-06, "loss": 0.7654, "step": 30846 }, { "epoch": 0.58, "learning_rate": 1.961925696384951e-06, "loss": 0.9778, "step": 30847 }, { "epoch": 0.58, "learning_rate": 1.961776512153077e-06, "loss": 0.8156, "step": 30848 }, { "epoch": 0.58, "learning_rate": 1.9616273299309145e-06, "loss": 0.7978, "step": 30849 }, { "epoch": 0.58, "learning_rate": 1.961478149719018e-06, "loss": 1.0523, "step": 30850 }, { "epoch": 0.58, "learning_rate": 1.961328971517945e-06, "loss": 0.9909, "step": 30851 }, { "epoch": 0.58, "learning_rate": 1.9611797953282545e-06, "loss": 1.0646, "step": 30852 }, { "epoch": 0.58, "learning_rate": 1.961030621150502e-06, "loss": 0.7839, "step": 30853 }, { "epoch": 0.58, "learning_rate": 1.9608814489852435e-06, "loss": 0.8087, "step": 30854 }, { "epoch": 0.58, "learning_rate": 1.9607322788330384e-06, "loss": 0.9904, "step": 30855 }, { "epoch": 0.58, "learning_rate": 1.960583110694442e-06, "loss": 0.9544, "step": 30856 }, { "epoch": 0.58, "learning_rate": 1.960433944570011e-06, "loss": 0.9457, "step": 30857 }, { "epoch": 0.58, "learning_rate": 1.9602847804603035e-06, "loss": 0.8055, "step": 30858 }, { "epoch": 0.58, "learning_rate": 1.960135618365877e-06, "loss": 0.9199, "step": 30859 }, { "epoch": 0.58, "learning_rate": 1.959986458287286e-06, "loss": 0.8035, "step": 30860 }, { "epoch": 0.58, "learning_rate": 1.95983730022509e-06, "loss": 0.8835, "step": 30861 }, { "epoch": 0.58, "learning_rate": 1.9596881441798457e-06, "loss": 1.0493, "step": 30862 }, { "epoch": 0.58, "learning_rate": 1.959538990152108e-06, "loss": 0.9827, "step": 30863 }, { "epoch": 0.58, "learning_rate": 1.959389838142435e-06, "loss": 0.7866, "step": 30864 }, { "epoch": 0.58, "learning_rate": 1.9592406881513847e-06, "loss": 0.9297, "step": 30865 }, { "epoch": 0.58, "learning_rate": 1.959091540179512e-06, "loss": 0.9109, "step": 30866 }, { "epoch": 0.58, "learning_rate": 1.9589423942273765e-06, "loss": 0.821, "step": 30867 }, { "epoch": 0.58, "learning_rate": 1.958793250295533e-06, "loss": 0.9933, "step": 30868 }, { "epoch": 0.58, "learning_rate": 1.9586441083845374e-06, "loss": 1.082, "step": 30869 }, { "epoch": 0.58, "learning_rate": 1.95849496849495e-06, "loss": 0.8065, "step": 30870 }, { "epoch": 0.58, "learning_rate": 1.958345830627325e-06, "loss": 0.8576, "step": 30871 }, { "epoch": 0.58, "learning_rate": 1.958196694782219e-06, "loss": 0.9264, "step": 30872 }, { "epoch": 0.58, "learning_rate": 1.9580475609601918e-06, "loss": 0.9428, "step": 30873 }, { "epoch": 0.58, "learning_rate": 1.957898429161798e-06, "loss": 0.9022, "step": 30874 }, { "epoch": 0.58, "learning_rate": 1.957749299387594e-06, "loss": 1.0353, "step": 30875 }, { "epoch": 0.58, "learning_rate": 1.957600171638138e-06, "loss": 1.0001, "step": 30876 }, { "epoch": 0.58, "learning_rate": 1.9574510459139863e-06, "loss": 0.8102, "step": 30877 }, { "epoch": 0.58, "learning_rate": 1.9573019222156955e-06, "loss": 0.7566, "step": 30878 }, { "epoch": 0.58, "learning_rate": 1.9571528005438226e-06, "loss": 0.8483, "step": 30879 }, { "epoch": 0.58, "learning_rate": 1.9570036808989254e-06, "loss": 0.8965, "step": 30880 }, { "epoch": 0.58, "learning_rate": 1.9568545632815587e-06, "loss": 0.9802, "step": 30881 }, { "epoch": 0.58, "learning_rate": 1.9567054476922815e-06, "loss": 0.943, "step": 30882 }, { "epoch": 0.58, "learning_rate": 1.956556334131649e-06, "loss": 0.8252, "step": 30883 }, { "epoch": 0.58, "learning_rate": 1.956407222600218e-06, "loss": 0.9621, "step": 30884 }, { "epoch": 0.58, "learning_rate": 1.9562581130985457e-06, "loss": 0.952, "step": 30885 }, { "epoch": 0.58, "learning_rate": 1.95610900562719e-06, "loss": 0.924, "step": 30886 }, { "epoch": 0.58, "learning_rate": 1.9559599001867053e-06, "loss": 0.9982, "step": 30887 }, { "epoch": 0.58, "learning_rate": 1.955810796777651e-06, "loss": 1.1729, "step": 30888 }, { "epoch": 0.58, "learning_rate": 1.955661695400582e-06, "loss": 0.9601, "step": 30889 }, { "epoch": 0.58, "learning_rate": 1.955512596056055e-06, "loss": 0.8852, "step": 30890 }, { "epoch": 0.58, "learning_rate": 1.955363498744628e-06, "loss": 0.8338, "step": 30891 }, { "epoch": 0.58, "learning_rate": 1.955214403466857e-06, "loss": 0.8471, "step": 30892 }, { "epoch": 0.58, "learning_rate": 1.9550653102232972e-06, "loss": 0.9915, "step": 30893 }, { "epoch": 0.58, "learning_rate": 1.9549162190145086e-06, "loss": 1.039, "step": 30894 }, { "epoch": 0.58, "learning_rate": 1.9547671298410457e-06, "loss": 0.9124, "step": 30895 }, { "epoch": 0.58, "learning_rate": 1.954618042703465e-06, "loss": 0.8839, "step": 30896 }, { "epoch": 0.58, "learning_rate": 1.9544689576023247e-06, "loss": 0.7982, "step": 30897 }, { "epoch": 0.58, "learning_rate": 1.95431987453818e-06, "loss": 0.872, "step": 30898 }, { "epoch": 0.58, "learning_rate": 1.954170793511588e-06, "loss": 0.8816, "step": 30899 }, { "epoch": 0.58, "learning_rate": 1.954021714523106e-06, "loss": 1.081, "step": 30900 }, { "epoch": 0.58, "learning_rate": 1.9538726375732903e-06, "loss": 0.9207, "step": 30901 }, { "epoch": 0.58, "learning_rate": 1.9537235626626967e-06, "loss": 0.9058, "step": 30902 }, { "epoch": 0.58, "learning_rate": 1.9535744897918834e-06, "loss": 1.1179, "step": 30903 }, { "epoch": 0.58, "learning_rate": 1.953425418961406e-06, "loss": 0.9811, "step": 30904 }, { "epoch": 0.58, "learning_rate": 1.9532763501718206e-06, "loss": 0.777, "step": 30905 }, { "epoch": 0.58, "learning_rate": 1.9531272834236846e-06, "loss": 0.7762, "step": 30906 }, { "epoch": 0.58, "learning_rate": 1.9529782187175557e-06, "loss": 0.8906, "step": 30907 }, { "epoch": 0.58, "learning_rate": 1.9528291560539882e-06, "loss": 0.9722, "step": 30908 }, { "epoch": 0.58, "learning_rate": 1.9526800954335405e-06, "loss": 0.9447, "step": 30909 }, { "epoch": 0.58, "learning_rate": 1.9525310368567686e-06, "loss": 0.674, "step": 30910 }, { "epoch": 0.58, "learning_rate": 1.952381980324228e-06, "loss": 0.7852, "step": 30911 }, { "epoch": 0.58, "learning_rate": 1.952232925836478e-06, "loss": 0.9006, "step": 30912 }, { "epoch": 0.58, "learning_rate": 1.952083873394072e-06, "loss": 0.9376, "step": 30913 }, { "epoch": 0.58, "learning_rate": 1.9519348229975683e-06, "loss": 0.782, "step": 30914 }, { "epoch": 0.58, "learning_rate": 1.951785774647524e-06, "loss": 1.0206, "step": 30915 }, { "epoch": 0.58, "learning_rate": 1.9516367283444946e-06, "loss": 0.9924, "step": 30916 }, { "epoch": 0.58, "learning_rate": 1.9514876840890355e-06, "loss": 0.7137, "step": 30917 }, { "epoch": 0.58, "learning_rate": 1.9513386418817064e-06, "loss": 1.0537, "step": 30918 }, { "epoch": 0.58, "learning_rate": 1.9511896017230607e-06, "loss": 1.0823, "step": 30919 }, { "epoch": 0.58, "learning_rate": 1.9510405636136575e-06, "loss": 1.0246, "step": 30920 }, { "epoch": 0.58, "learning_rate": 1.9508915275540503e-06, "loss": 0.9259, "step": 30921 }, { "epoch": 0.58, "learning_rate": 1.9507424935447986e-06, "loss": 0.8812, "step": 30922 }, { "epoch": 0.58, "learning_rate": 1.9505934615864576e-06, "loss": 0.7302, "step": 30923 }, { "epoch": 0.58, "learning_rate": 1.9504444316795825e-06, "loss": 1.0289, "step": 30924 }, { "epoch": 0.58, "learning_rate": 1.9502954038247324e-06, "loss": 1.0693, "step": 30925 }, { "epoch": 0.58, "learning_rate": 1.9501463780224617e-06, "loss": 0.9539, "step": 30926 }, { "epoch": 0.58, "learning_rate": 1.949997354273327e-06, "loss": 0.6533, "step": 30927 }, { "epoch": 0.58, "learning_rate": 1.9498483325778865e-06, "loss": 0.7743, "step": 30928 }, { "epoch": 0.58, "learning_rate": 1.9496993129366954e-06, "loss": 0.9267, "step": 30929 }, { "epoch": 0.58, "learning_rate": 1.9495502953503093e-06, "loss": 0.9525, "step": 30930 }, { "epoch": 0.58, "learning_rate": 1.9494012798192863e-06, "loss": 1.0097, "step": 30931 }, { "epoch": 0.58, "learning_rate": 1.9492522663441816e-06, "loss": 0.8886, "step": 30932 }, { "epoch": 0.58, "learning_rate": 1.9491032549255523e-06, "loss": 0.9795, "step": 30933 }, { "epoch": 0.58, "learning_rate": 1.9489542455639544e-06, "loss": 0.8986, "step": 30934 }, { "epoch": 0.58, "learning_rate": 1.9488052382599447e-06, "loss": 0.7549, "step": 30935 }, { "epoch": 0.58, "learning_rate": 1.9486562330140786e-06, "loss": 0.8136, "step": 30936 }, { "epoch": 0.58, "learning_rate": 1.948507229826914e-06, "loss": 1.0189, "step": 30937 }, { "epoch": 0.58, "learning_rate": 1.9483582286990067e-06, "loss": 0.9059, "step": 30938 }, { "epoch": 0.58, "learning_rate": 1.948209229630912e-06, "loss": 1.031, "step": 30939 }, { "epoch": 0.58, "learning_rate": 1.9480602326231873e-06, "loss": 0.9719, "step": 30940 }, { "epoch": 0.58, "learning_rate": 1.9479112376763897e-06, "loss": 0.9045, "step": 30941 }, { "epoch": 0.58, "learning_rate": 1.947762244791073e-06, "loss": 0.6922, "step": 30942 }, { "epoch": 0.58, "learning_rate": 1.9476132539677964e-06, "loss": 1.1494, "step": 30943 }, { "epoch": 0.58, "learning_rate": 1.947464265207115e-06, "loss": 1.0728, "step": 30944 }, { "epoch": 0.58, "learning_rate": 1.947315278509584e-06, "loss": 0.9273, "step": 30945 }, { "epoch": 0.58, "learning_rate": 1.9471662938757624e-06, "loss": 0.8901, "step": 30946 }, { "epoch": 0.58, "learning_rate": 1.9470173113062036e-06, "loss": 0.8719, "step": 30947 }, { "epoch": 0.58, "learning_rate": 1.946868330801465e-06, "loss": 0.9262, "step": 30948 }, { "epoch": 0.58, "learning_rate": 1.9467193523621043e-06, "loss": 1.0242, "step": 30949 }, { "epoch": 0.58, "learning_rate": 1.9465703759886763e-06, "loss": 0.9194, "step": 30950 }, { "epoch": 0.58, "learning_rate": 1.9464214016817367e-06, "loss": 1.1491, "step": 30951 }, { "epoch": 0.58, "learning_rate": 1.9462724294418435e-06, "loss": 0.9729, "step": 30952 }, { "epoch": 0.58, "learning_rate": 1.9461234592695517e-06, "loss": 0.9119, "step": 30953 }, { "epoch": 0.58, "learning_rate": 1.945974491165418e-06, "loss": 0.8667, "step": 30954 }, { "epoch": 0.58, "learning_rate": 1.9458255251299986e-06, "loss": 1.0592, "step": 30955 }, { "epoch": 0.58, "learning_rate": 1.94567656116385e-06, "loss": 1.1282, "step": 30956 }, { "epoch": 0.58, "learning_rate": 1.945527599267527e-06, "loss": 0.8402, "step": 30957 }, { "epoch": 0.58, "learning_rate": 1.945378639441588e-06, "loss": 0.9742, "step": 30958 }, { "epoch": 0.58, "learning_rate": 1.9452296816865884e-06, "loss": 0.9165, "step": 30959 }, { "epoch": 0.58, "learning_rate": 1.9450807260030828e-06, "loss": 0.947, "step": 30960 }, { "epoch": 0.58, "learning_rate": 1.9449317723916298e-06, "loss": 1.0284, "step": 30961 }, { "epoch": 0.58, "learning_rate": 1.9447828208527847e-06, "loss": 1.0768, "step": 30962 }, { "epoch": 0.58, "learning_rate": 1.9446338713871022e-06, "loss": 0.9796, "step": 30963 }, { "epoch": 0.58, "learning_rate": 1.944484923995141e-06, "loss": 1.0264, "step": 30964 }, { "epoch": 0.58, "learning_rate": 1.9443359786774566e-06, "loss": 0.7057, "step": 30965 }, { "epoch": 0.58, "learning_rate": 1.9441870354346033e-06, "loss": 0.9114, "step": 30966 }, { "epoch": 0.58, "learning_rate": 1.9440380942671392e-06, "loss": 0.8584, "step": 30967 }, { "epoch": 0.58, "learning_rate": 1.94388915517562e-06, "loss": 0.9984, "step": 30968 }, { "epoch": 0.58, "learning_rate": 1.9437402181606005e-06, "loss": 1.0676, "step": 30969 }, { "epoch": 0.58, "learning_rate": 1.9435912832226394e-06, "loss": 0.9715, "step": 30970 }, { "epoch": 0.58, "learning_rate": 1.943442350362291e-06, "loss": 0.8989, "step": 30971 }, { "epoch": 0.58, "learning_rate": 1.943293419580111e-06, "loss": 0.8524, "step": 30972 }, { "epoch": 0.58, "learning_rate": 1.9431444908766574e-06, "loss": 0.9041, "step": 30973 }, { "epoch": 0.58, "learning_rate": 1.9429955642524843e-06, "loss": 0.9759, "step": 30974 }, { "epoch": 0.58, "learning_rate": 1.942846639708149e-06, "loss": 1.0103, "step": 30975 }, { "epoch": 0.58, "learning_rate": 1.9426977172442074e-06, "loss": 1.0903, "step": 30976 }, { "epoch": 0.58, "learning_rate": 1.9425487968612157e-06, "loss": 0.9438, "step": 30977 }, { "epoch": 0.58, "learning_rate": 1.9423998785597287e-06, "loss": 1.0177, "step": 30978 }, { "epoch": 0.58, "learning_rate": 1.9422509623403046e-06, "loss": 0.9216, "step": 30979 }, { "epoch": 0.58, "learning_rate": 1.942102048203498e-06, "loss": 1.0266, "step": 30980 }, { "epoch": 0.58, "learning_rate": 1.9419531361498647e-06, "loss": 1.0512, "step": 30981 }, { "epoch": 0.58, "learning_rate": 1.9418042261799615e-06, "loss": 0.9968, "step": 30982 }, { "epoch": 0.58, "learning_rate": 1.9416553182943447e-06, "loss": 0.9027, "step": 30983 }, { "epoch": 0.58, "learning_rate": 1.941506412493569e-06, "loss": 0.7347, "step": 30984 }, { "epoch": 0.58, "learning_rate": 1.9413575087781922e-06, "loss": 0.9724, "step": 30985 }, { "epoch": 0.58, "learning_rate": 1.941208607148769e-06, "loss": 1.1581, "step": 30986 }, { "epoch": 0.58, "learning_rate": 1.941059707605855e-06, "loss": 0.9309, "step": 30987 }, { "epoch": 0.58, "learning_rate": 1.9409108101500082e-06, "loss": 1.0302, "step": 30988 }, { "epoch": 0.58, "learning_rate": 1.9407619147817824e-06, "loss": 0.7883, "step": 30989 }, { "epoch": 0.58, "learning_rate": 1.9406130215017343e-06, "loss": 0.7721, "step": 30990 }, { "epoch": 0.58, "learning_rate": 1.9404641303104206e-06, "loss": 0.8372, "step": 30991 }, { "epoch": 0.58, "learning_rate": 1.9403152412083968e-06, "loss": 0.9055, "step": 30992 }, { "epoch": 0.58, "learning_rate": 1.940166354196218e-06, "loss": 0.9983, "step": 30993 }, { "epoch": 0.58, "learning_rate": 1.940017469274442e-06, "loss": 1.1206, "step": 30994 }, { "epoch": 0.58, "learning_rate": 1.939868586443622e-06, "loss": 0.8636, "step": 30995 }, { "epoch": 0.58, "learning_rate": 1.9397197057043164e-06, "loss": 0.9417, "step": 30996 }, { "epoch": 0.58, "learning_rate": 1.93957082705708e-06, "loss": 0.8712, "step": 30997 }, { "epoch": 0.58, "learning_rate": 1.93942195050247e-06, "loss": 0.7208, "step": 30998 }, { "epoch": 0.58, "learning_rate": 1.9392730760410396e-06, "loss": 0.7877, "step": 30999 }, { "epoch": 0.58, "learning_rate": 1.9391242036733476e-06, "loss": 1.1412, "step": 31000 }, { "epoch": 0.58, "learning_rate": 1.938975333399949e-06, "loss": 0.857, "step": 31001 }, { "epoch": 0.58, "learning_rate": 1.9388264652213976e-06, "loss": 0.9969, "step": 31002 }, { "epoch": 0.58, "learning_rate": 1.9386775991382518e-06, "loss": 0.7425, "step": 31003 }, { "epoch": 0.58, "learning_rate": 1.938528735151067e-06, "loss": 0.8106, "step": 31004 }, { "epoch": 0.58, "learning_rate": 1.938379873260398e-06, "loss": 0.8708, "step": 31005 }, { "epoch": 0.58, "learning_rate": 1.938231013466802e-06, "loss": 1.1136, "step": 31006 }, { "epoch": 0.59, "learning_rate": 1.938082155770834e-06, "loss": 0.8927, "step": 31007 }, { "epoch": 0.59, "learning_rate": 1.9379333001730495e-06, "loss": 0.8612, "step": 31008 }, { "epoch": 0.59, "learning_rate": 1.9377844466740057e-06, "loss": 0.7857, "step": 31009 }, { "epoch": 0.59, "learning_rate": 1.937635595274257e-06, "loss": 0.6833, "step": 31010 }, { "epoch": 0.59, "learning_rate": 1.937486745974359e-06, "loss": 0.8743, "step": 31011 }, { "epoch": 0.59, "learning_rate": 1.9373378987748697e-06, "loss": 1.3407, "step": 31012 }, { "epoch": 0.59, "learning_rate": 1.9371890536763434e-06, "loss": 1.0361, "step": 31013 }, { "epoch": 0.59, "learning_rate": 1.937040210679334e-06, "loss": 1.0992, "step": 31014 }, { "epoch": 0.59, "learning_rate": 1.936891369784401e-06, "loss": 1.1188, "step": 31015 }, { "epoch": 0.59, "learning_rate": 1.936742530992098e-06, "loss": 1.0536, "step": 31016 }, { "epoch": 0.59, "learning_rate": 1.9365936943029807e-06, "loss": 0.903, "step": 31017 }, { "epoch": 0.59, "learning_rate": 1.9364448597176055e-06, "loss": 1.0624, "step": 31018 }, { "epoch": 0.59, "learning_rate": 1.9362960272365285e-06, "loss": 1.1332, "step": 31019 }, { "epoch": 0.59, "learning_rate": 1.936147196860304e-06, "loss": 1.1124, "step": 31020 }, { "epoch": 0.59, "learning_rate": 1.935998368589489e-06, "loss": 0.8606, "step": 31021 }, { "epoch": 0.59, "learning_rate": 1.9358495424246393e-06, "loss": 1.0273, "step": 31022 }, { "epoch": 0.59, "learning_rate": 1.935700718366309e-06, "loss": 0.728, "step": 31023 }, { "epoch": 0.59, "learning_rate": 1.9355518964150548e-06, "loss": 1.1789, "step": 31024 }, { "epoch": 0.59, "learning_rate": 1.9354030765714337e-06, "loss": 1.1765, "step": 31025 }, { "epoch": 0.59, "learning_rate": 1.935254258835999e-06, "loss": 0.8095, "step": 31026 }, { "epoch": 0.59, "learning_rate": 1.9351054432093085e-06, "loss": 0.8437, "step": 31027 }, { "epoch": 0.59, "learning_rate": 1.9349566296919173e-06, "loss": 0.7157, "step": 31028 }, { "epoch": 0.59, "learning_rate": 1.9348078182843793e-06, "loss": 0.7389, "step": 31029 }, { "epoch": 0.59, "learning_rate": 1.934659008987253e-06, "loss": 0.764, "step": 31030 }, { "epoch": 0.59, "learning_rate": 1.934510201801092e-06, "loss": 1.2213, "step": 31031 }, { "epoch": 0.59, "learning_rate": 1.9343613967264517e-06, "loss": 1.084, "step": 31032 }, { "epoch": 0.59, "learning_rate": 1.93421259376389e-06, "loss": 0.7534, "step": 31033 }, { "epoch": 0.59, "learning_rate": 1.934063792913961e-06, "loss": 1.0159, "step": 31034 }, { "epoch": 0.59, "learning_rate": 1.9339149941772194e-06, "loss": 0.8102, "step": 31035 }, { "epoch": 0.59, "learning_rate": 1.9337661975542227e-06, "loss": 0.8466, "step": 31036 }, { "epoch": 0.59, "learning_rate": 1.9336174030455256e-06, "loss": 0.9304, "step": 31037 }, { "epoch": 0.59, "learning_rate": 1.9334686106516835e-06, "loss": 0.7755, "step": 31038 }, { "epoch": 0.59, "learning_rate": 1.933319820373252e-06, "loss": 0.8331, "step": 31039 }, { "epoch": 0.59, "learning_rate": 1.933171032210788e-06, "loss": 0.7962, "step": 31040 }, { "epoch": 0.59, "learning_rate": 1.9330222461648444e-06, "loss": 1.0425, "step": 31041 }, { "epoch": 0.59, "learning_rate": 1.93287346223598e-06, "loss": 0.7915, "step": 31042 }, { "epoch": 0.59, "learning_rate": 1.932724680424748e-06, "loss": 1.1801, "step": 31043 }, { "epoch": 0.59, "learning_rate": 1.9325759007317037e-06, "loss": 1.0043, "step": 31044 }, { "epoch": 0.59, "learning_rate": 1.9324271231574043e-06, "loss": 0.9866, "step": 31045 }, { "epoch": 0.59, "learning_rate": 1.9322783477024055e-06, "loss": 0.6494, "step": 31046 }, { "epoch": 0.59, "learning_rate": 1.9321295743672604e-06, "loss": 0.8948, "step": 31047 }, { "epoch": 0.59, "learning_rate": 1.931980803152527e-06, "loss": 0.8658, "step": 31048 }, { "epoch": 0.59, "learning_rate": 1.9318320340587606e-06, "loss": 0.9115, "step": 31049 }, { "epoch": 0.59, "learning_rate": 1.9316832670865143e-06, "loss": 1.0723, "step": 31050 }, { "epoch": 0.59, "learning_rate": 1.9315345022363464e-06, "loss": 0.9751, "step": 31051 }, { "epoch": 0.59, "learning_rate": 1.9313857395088105e-06, "loss": 0.7214, "step": 31052 }, { "epoch": 0.59, "learning_rate": 1.9312369789044625e-06, "loss": 1.0247, "step": 31053 }, { "epoch": 0.59, "learning_rate": 1.9310882204238596e-06, "loss": 0.6958, "step": 31054 }, { "epoch": 0.59, "learning_rate": 1.9309394640675556e-06, "loss": 0.8977, "step": 31055 }, { "epoch": 0.59, "learning_rate": 1.9307907098361052e-06, "loss": 1.1275, "step": 31056 }, { "epoch": 0.59, "learning_rate": 1.9306419577300656e-06, "loss": 0.9984, "step": 31057 }, { "epoch": 0.59, "learning_rate": 1.930493207749991e-06, "loss": 0.8213, "step": 31058 }, { "epoch": 0.59, "learning_rate": 1.9303444598964374e-06, "loss": 0.8261, "step": 31059 }, { "epoch": 0.59, "learning_rate": 1.93019571416996e-06, "loss": 0.809, "step": 31060 }, { "epoch": 0.59, "learning_rate": 1.930046970571115e-06, "loss": 0.7604, "step": 31061 }, { "epoch": 0.59, "learning_rate": 1.929898229100456e-06, "loss": 0.9901, "step": 31062 }, { "epoch": 0.59, "learning_rate": 1.929749489758541e-06, "loss": 1.0762, "step": 31063 }, { "epoch": 0.59, "learning_rate": 1.9296007525459236e-06, "loss": 0.9895, "step": 31064 }, { "epoch": 0.59, "learning_rate": 1.9294520174631583e-06, "loss": 0.8158, "step": 31065 }, { "epoch": 0.59, "learning_rate": 1.9293032845108023e-06, "loss": 0.8279, "step": 31066 }, { "epoch": 0.59, "learning_rate": 1.929154553689411e-06, "loss": 0.9698, "step": 31067 }, { "epoch": 0.59, "learning_rate": 1.929005824999538e-06, "loss": 1.0008, "step": 31068 }, { "epoch": 0.59, "learning_rate": 1.9288570984417407e-06, "loss": 1.0443, "step": 31069 }, { "epoch": 0.59, "learning_rate": 1.9287083740165734e-06, "loss": 0.9767, "step": 31070 }, { "epoch": 0.59, "learning_rate": 1.9285596517245904e-06, "loss": 1.016, "step": 31071 }, { "epoch": 0.59, "learning_rate": 1.9284109315663495e-06, "loss": 0.9566, "step": 31072 }, { "epoch": 0.59, "learning_rate": 1.9282622135424038e-06, "loss": 0.9843, "step": 31073 }, { "epoch": 0.59, "learning_rate": 1.9281134976533093e-06, "loss": 1.0412, "step": 31074 }, { "epoch": 0.59, "learning_rate": 1.9279647838996225e-06, "loss": 1.1462, "step": 31075 }, { "epoch": 0.59, "learning_rate": 1.9278160722818975e-06, "loss": 0.8102, "step": 31076 }, { "epoch": 0.59, "learning_rate": 1.9276673628006886e-06, "loss": 0.728, "step": 31077 }, { "epoch": 0.59, "learning_rate": 1.9275186554565535e-06, "loss": 0.7446, "step": 31078 }, { "epoch": 0.59, "learning_rate": 1.9273699502500454e-06, "loss": 0.8106, "step": 31079 }, { "epoch": 0.59, "learning_rate": 1.927221247181721e-06, "loss": 1.0088, "step": 31080 }, { "epoch": 0.59, "learning_rate": 1.927072546252134e-06, "loss": 1.1268, "step": 31081 }, { "epoch": 0.59, "learning_rate": 1.9269238474618413e-06, "loss": 0.7367, "step": 31082 }, { "epoch": 0.59, "learning_rate": 1.9267751508113968e-06, "loss": 1.0552, "step": 31083 }, { "epoch": 0.59, "learning_rate": 1.9266264563013567e-06, "loss": 0.9115, "step": 31084 }, { "epoch": 0.59, "learning_rate": 1.9264777639322762e-06, "loss": 0.7878, "step": 31085 }, { "epoch": 0.59, "learning_rate": 1.926329073704709e-06, "loss": 0.947, "step": 31086 }, { "epoch": 0.59, "learning_rate": 1.926180385619212e-06, "loss": 1.1711, "step": 31087 }, { "epoch": 0.59, "learning_rate": 1.9260316996763407e-06, "loss": 1.0751, "step": 31088 }, { "epoch": 0.59, "learning_rate": 1.925883015876648e-06, "loss": 0.9518, "step": 31089 }, { "epoch": 0.59, "learning_rate": 1.9257343342206918e-06, "loss": 0.6175, "step": 31090 }, { "epoch": 0.59, "learning_rate": 1.9255856547090255e-06, "loss": 0.8121, "step": 31091 }, { "epoch": 0.59, "learning_rate": 1.9254369773422043e-06, "loss": 0.7844, "step": 31092 }, { "epoch": 0.59, "learning_rate": 1.9252883021207845e-06, "loss": 0.9827, "step": 31093 }, { "epoch": 0.59, "learning_rate": 1.92513962904532e-06, "loss": 0.8949, "step": 31094 }, { "epoch": 0.59, "learning_rate": 1.9249909581163665e-06, "loss": 1.0422, "step": 31095 }, { "epoch": 0.59, "learning_rate": 1.92484228933448e-06, "loss": 0.9878, "step": 31096 }, { "epoch": 0.59, "learning_rate": 1.9246936227002145e-06, "loss": 0.8121, "step": 31097 }, { "epoch": 0.59, "learning_rate": 1.924544958214124e-06, "loss": 0.9494, "step": 31098 }, { "epoch": 0.59, "learning_rate": 1.9243962958767667e-06, "loss": 0.8351, "step": 31099 }, { "epoch": 0.59, "learning_rate": 1.924247635688695e-06, "loss": 1.0236, "step": 31100 }, { "epoch": 0.59, "learning_rate": 1.9240989776504653e-06, "loss": 0.8068, "step": 31101 }, { "epoch": 0.59, "learning_rate": 1.9239503217626323e-06, "loss": 0.8012, "step": 31102 }, { "epoch": 0.59, "learning_rate": 1.9238016680257517e-06, "loss": 0.8519, "step": 31103 }, { "epoch": 0.59, "learning_rate": 1.923653016440377e-06, "loss": 0.8372, "step": 31104 }, { "epoch": 0.59, "learning_rate": 1.923504367007065e-06, "loss": 0.9116, "step": 31105 }, { "epoch": 0.59, "learning_rate": 1.9233557197263702e-06, "loss": 0.9459, "step": 31106 }, { "epoch": 0.59, "learning_rate": 1.923207074598846e-06, "loss": 0.9791, "step": 31107 }, { "epoch": 0.59, "learning_rate": 1.92305843162505e-06, "loss": 1.0297, "step": 31108 }, { "epoch": 0.59, "learning_rate": 1.9229097908055368e-06, "loss": 0.902, "step": 31109 }, { "epoch": 0.59, "learning_rate": 1.922761152140859e-06, "loss": 0.8442, "step": 31110 }, { "epoch": 0.59, "learning_rate": 1.922612515631575e-06, "loss": 0.9897, "step": 31111 }, { "epoch": 0.59, "learning_rate": 1.922463881278238e-06, "loss": 0.9551, "step": 31112 }, { "epoch": 0.59, "learning_rate": 1.922315249081402e-06, "loss": 0.936, "step": 31113 }, { "epoch": 0.59, "learning_rate": 1.922166619041624e-06, "loss": 0.9169, "step": 31114 }, { "epoch": 0.59, "learning_rate": 1.922017991159458e-06, "loss": 0.9298, "step": 31115 }, { "epoch": 0.59, "learning_rate": 1.9218693654354583e-06, "loss": 0.895, "step": 31116 }, { "epoch": 0.59, "learning_rate": 1.921720741870182e-06, "loss": 0.8432, "step": 31117 }, { "epoch": 0.59, "learning_rate": 1.9215721204641826e-06, "loss": 0.9271, "step": 31118 }, { "epoch": 0.59, "learning_rate": 1.921423501218014e-06, "loss": 1.0682, "step": 31119 }, { "epoch": 0.59, "learning_rate": 1.9212748841322334e-06, "loss": 1.0969, "step": 31120 }, { "epoch": 0.59, "learning_rate": 1.921126269207394e-06, "loss": 0.9843, "step": 31121 }, { "epoch": 0.59, "learning_rate": 1.9209776564440517e-06, "loss": 0.7895, "step": 31122 }, { "epoch": 0.59, "learning_rate": 1.920829045842761e-06, "loss": 0.9819, "step": 31123 }, { "epoch": 0.59, "learning_rate": 1.9206804374040772e-06, "loss": 0.843, "step": 31124 }, { "epoch": 0.59, "learning_rate": 1.920531831128554e-06, "loss": 0.9243, "step": 31125 }, { "epoch": 0.59, "learning_rate": 1.9203832270167476e-06, "loss": 0.8488, "step": 31126 }, { "epoch": 0.59, "learning_rate": 1.920234625069213e-06, "loss": 1.0999, "step": 31127 }, { "epoch": 0.59, "learning_rate": 1.920086025286504e-06, "loss": 0.907, "step": 31128 }, { "epoch": 0.59, "learning_rate": 1.919937427669176e-06, "loss": 0.9256, "step": 31129 }, { "epoch": 0.59, "learning_rate": 1.9197888322177844e-06, "loss": 0.9306, "step": 31130 }, { "epoch": 0.59, "learning_rate": 1.919640238932882e-06, "loss": 1.1346, "step": 31131 }, { "epoch": 0.59, "learning_rate": 1.919491647815027e-06, "loss": 0.8823, "step": 31132 }, { "epoch": 0.59, "learning_rate": 1.919343058864772e-06, "loss": 0.8562, "step": 31133 }, { "epoch": 0.59, "learning_rate": 1.919194472082671e-06, "loss": 0.9346, "step": 31134 }, { "epoch": 0.59, "learning_rate": 1.9190458874692815e-06, "loss": 0.7711, "step": 31135 }, { "epoch": 0.59, "learning_rate": 1.9188973050251563e-06, "loss": 0.8415, "step": 31136 }, { "epoch": 0.59, "learning_rate": 1.91874872475085e-06, "loss": 1.0174, "step": 31137 }, { "epoch": 0.59, "learning_rate": 1.918600146646919e-06, "loss": 1.0815, "step": 31138 }, { "epoch": 0.59, "learning_rate": 1.9184515707139177e-06, "loss": 0.8555, "step": 31139 }, { "epoch": 0.59, "learning_rate": 1.918302996952399e-06, "loss": 0.9645, "step": 31140 }, { "epoch": 0.59, "learning_rate": 1.9181544253629204e-06, "loss": 0.7775, "step": 31141 }, { "epoch": 0.59, "learning_rate": 1.9180058559460344e-06, "loss": 0.8252, "step": 31142 }, { "epoch": 0.59, "learning_rate": 1.917857288702297e-06, "loss": 0.9927, "step": 31143 }, { "epoch": 0.59, "learning_rate": 1.9177087236322625e-06, "loss": 1.0184, "step": 31144 }, { "epoch": 0.59, "learning_rate": 1.9175601607364862e-06, "loss": 0.9467, "step": 31145 }, { "epoch": 0.59, "learning_rate": 1.9174116000155217e-06, "loss": 0.9419, "step": 31146 }, { "epoch": 0.59, "learning_rate": 1.9172630414699253e-06, "loss": 1.0594, "step": 31147 }, { "epoch": 0.59, "learning_rate": 1.917114485100251e-06, "loss": 0.7379, "step": 31148 }, { "epoch": 0.59, "learning_rate": 1.916965930907052e-06, "loss": 0.7809, "step": 31149 }, { "epoch": 0.59, "learning_rate": 1.916817378890885e-06, "loss": 1.1064, "step": 31150 }, { "epoch": 0.59, "learning_rate": 1.9166688290523044e-06, "loss": 0.8619, "step": 31151 }, { "epoch": 0.59, "learning_rate": 1.9165202813918637e-06, "loss": 0.9542, "step": 31152 }, { "epoch": 0.59, "learning_rate": 1.916371735910119e-06, "loss": 0.9689, "step": 31153 }, { "epoch": 0.59, "learning_rate": 1.916223192607625e-06, "loss": 0.8727, "step": 31154 }, { "epoch": 0.59, "learning_rate": 1.916074651484935e-06, "loss": 1.0258, "step": 31155 }, { "epoch": 0.59, "learning_rate": 1.9159261125426042e-06, "loss": 1.2692, "step": 31156 }, { "epoch": 0.59, "learning_rate": 1.915777575781187e-06, "loss": 1.145, "step": 31157 }, { "epoch": 0.59, "learning_rate": 1.9156290412012395e-06, "loss": 0.8867, "step": 31158 }, { "epoch": 0.59, "learning_rate": 1.915480508803314e-06, "loss": 0.8943, "step": 31159 }, { "epoch": 0.59, "learning_rate": 1.9153319785879678e-06, "loss": 0.8116, "step": 31160 }, { "epoch": 0.59, "learning_rate": 1.9151834505557533e-06, "loss": 0.792, "step": 31161 }, { "epoch": 0.59, "learning_rate": 1.9150349247072254e-06, "loss": 0.8237, "step": 31162 }, { "epoch": 0.59, "learning_rate": 1.9148864010429393e-06, "loss": 1.0706, "step": 31163 }, { "epoch": 0.59, "learning_rate": 1.91473787956345e-06, "loss": 0.9087, "step": 31164 }, { "epoch": 0.59, "learning_rate": 1.914589360269311e-06, "loss": 0.9647, "step": 31165 }, { "epoch": 0.59, "learning_rate": 1.914440843161078e-06, "loss": 0.9478, "step": 31166 }, { "epoch": 0.59, "learning_rate": 1.9142923282393048e-06, "loss": 0.9847, "step": 31167 }, { "epoch": 0.59, "learning_rate": 1.914143815504545e-06, "loss": 0.9318, "step": 31168 }, { "epoch": 0.59, "learning_rate": 1.9139953049573557e-06, "loss": 0.9733, "step": 31169 }, { "epoch": 0.59, "learning_rate": 1.913846796598289e-06, "loss": 1.0058, "step": 31170 }, { "epoch": 0.59, "learning_rate": 1.9136982904279002e-06, "loss": 0.9899, "step": 31171 }, { "epoch": 0.59, "learning_rate": 1.913549786446745e-06, "loss": 0.9041, "step": 31172 }, { "epoch": 0.59, "learning_rate": 1.913401284655377e-06, "loss": 0.7097, "step": 31173 }, { "epoch": 0.59, "learning_rate": 1.9132527850543496e-06, "loss": 0.8827, "step": 31174 }, { "epoch": 0.59, "learning_rate": 1.913104287644219e-06, "loss": 0.9271, "step": 31175 }, { "epoch": 0.59, "learning_rate": 1.9129557924255386e-06, "loss": 1.0483, "step": 31176 }, { "epoch": 0.59, "learning_rate": 1.912807299398863e-06, "loss": 0.7219, "step": 31177 }, { "epoch": 0.59, "learning_rate": 1.9126588085647478e-06, "loss": 0.7584, "step": 31178 }, { "epoch": 0.59, "learning_rate": 1.9125103199237468e-06, "loss": 0.7953, "step": 31179 }, { "epoch": 0.59, "learning_rate": 1.912361833476413e-06, "loss": 0.7903, "step": 31180 }, { "epoch": 0.59, "learning_rate": 1.912213349223303e-06, "loss": 1.0857, "step": 31181 }, { "epoch": 0.59, "learning_rate": 1.9120648671649707e-06, "loss": 1.0197, "step": 31182 }, { "epoch": 0.59, "learning_rate": 1.9119163873019686e-06, "loss": 0.8617, "step": 31183 }, { "epoch": 0.59, "learning_rate": 1.9117679096348533e-06, "loss": 0.8822, "step": 31184 }, { "epoch": 0.59, "learning_rate": 1.9116194341641796e-06, "loss": 0.9317, "step": 31185 }, { "epoch": 0.59, "learning_rate": 1.9114709608904992e-06, "loss": 0.8527, "step": 31186 }, { "epoch": 0.59, "learning_rate": 1.9113224898143696e-06, "loss": 0.8464, "step": 31187 }, { "epoch": 0.59, "learning_rate": 1.911174020936344e-06, "loss": 0.9564, "step": 31188 }, { "epoch": 0.59, "learning_rate": 1.911025554256975e-06, "loss": 0.8669, "step": 31189 }, { "epoch": 0.59, "learning_rate": 1.9108770897768203e-06, "loss": 1.0359, "step": 31190 }, { "epoch": 0.59, "learning_rate": 1.9107286274964316e-06, "loss": 0.9276, "step": 31191 }, { "epoch": 0.59, "learning_rate": 1.9105801674163634e-06, "loss": 0.8535, "step": 31192 }, { "epoch": 0.59, "learning_rate": 1.910431709537172e-06, "loss": 0.9739, "step": 31193 }, { "epoch": 0.59, "learning_rate": 1.91028325385941e-06, "loss": 1.0278, "step": 31194 }, { "epoch": 0.59, "learning_rate": 1.910134800383632e-06, "loss": 0.919, "step": 31195 }, { "epoch": 0.59, "learning_rate": 1.9099863491103932e-06, "loss": 0.9374, "step": 31196 }, { "epoch": 0.59, "learning_rate": 1.9098379000402465e-06, "loss": 0.8511, "step": 31197 }, { "epoch": 0.59, "learning_rate": 1.9096894531737475e-06, "loss": 0.8363, "step": 31198 }, { "epoch": 0.59, "learning_rate": 1.90954100851145e-06, "loss": 0.8736, "step": 31199 }, { "epoch": 0.59, "learning_rate": 1.909392566053909e-06, "loss": 1.2335, "step": 31200 }, { "epoch": 0.59, "learning_rate": 1.9092441258016766e-06, "loss": 0.9317, "step": 31201 }, { "epoch": 0.59, "learning_rate": 1.9090956877553092e-06, "loss": 0.8003, "step": 31202 }, { "epoch": 0.59, "learning_rate": 1.9089472519153606e-06, "loss": 1.0597, "step": 31203 }, { "epoch": 0.59, "learning_rate": 1.9087988182823843e-06, "loss": 0.7078, "step": 31204 }, { "epoch": 0.59, "learning_rate": 1.908650386856935e-06, "loss": 1.1867, "step": 31205 }, { "epoch": 0.59, "learning_rate": 1.908501957639568e-06, "loss": 1.0121, "step": 31206 }, { "epoch": 0.59, "learning_rate": 1.9083535306308354e-06, "loss": 0.8794, "step": 31207 }, { "epoch": 0.59, "learning_rate": 1.9082051058312934e-06, "loss": 0.9522, "step": 31208 }, { "epoch": 0.59, "learning_rate": 1.9080566832414955e-06, "loss": 0.8147, "step": 31209 }, { "epoch": 0.59, "learning_rate": 1.907908262861995e-06, "loss": 0.9408, "step": 31210 }, { "epoch": 0.59, "learning_rate": 1.9077598446933475e-06, "loss": 0.9611, "step": 31211 }, { "epoch": 0.59, "learning_rate": 1.9076114287361065e-06, "loss": 0.8836, "step": 31212 }, { "epoch": 0.59, "learning_rate": 1.907463014990825e-06, "loss": 1.115, "step": 31213 }, { "epoch": 0.59, "learning_rate": 1.9073146034580602e-06, "loss": 1.027, "step": 31214 }, { "epoch": 0.59, "learning_rate": 1.9071661941383646e-06, "loss": 0.9816, "step": 31215 }, { "epoch": 0.59, "learning_rate": 1.907017787032291e-06, "loss": 1.0335, "step": 31216 }, { "epoch": 0.59, "learning_rate": 1.9068693821403955e-06, "loss": 0.8777, "step": 31217 }, { "epoch": 0.59, "learning_rate": 1.9067209794632314e-06, "loss": 0.8881, "step": 31218 }, { "epoch": 0.59, "learning_rate": 1.9065725790013528e-06, "loss": 0.879, "step": 31219 }, { "epoch": 0.59, "learning_rate": 1.906424180755314e-06, "loss": 0.89, "step": 31220 }, { "epoch": 0.59, "learning_rate": 1.9062757847256697e-06, "loss": 0.9148, "step": 31221 }, { "epoch": 0.59, "learning_rate": 1.9061273909129724e-06, "loss": 1.0469, "step": 31222 }, { "epoch": 0.59, "learning_rate": 1.905978999317778e-06, "loss": 1.036, "step": 31223 }, { "epoch": 0.59, "learning_rate": 1.90583060994064e-06, "loss": 1.0892, "step": 31224 }, { "epoch": 0.59, "learning_rate": 1.9056822227821114e-06, "loss": 0.9528, "step": 31225 }, { "epoch": 0.59, "learning_rate": 1.9055338378427474e-06, "loss": 0.9475, "step": 31226 }, { "epoch": 0.59, "learning_rate": 1.9053854551231028e-06, "loss": 0.8837, "step": 31227 }, { "epoch": 0.59, "learning_rate": 1.9052370746237292e-06, "loss": 0.8146, "step": 31228 }, { "epoch": 0.59, "learning_rate": 1.9050886963451831e-06, "loss": 0.8652, "step": 31229 }, { "epoch": 0.59, "learning_rate": 1.904940320288018e-06, "loss": 1.3075, "step": 31230 }, { "epoch": 0.59, "learning_rate": 1.9047919464527859e-06, "loss": 0.9622, "step": 31231 }, { "epoch": 0.59, "learning_rate": 1.904643574840044e-06, "loss": 0.8675, "step": 31232 }, { "epoch": 0.59, "learning_rate": 1.9044952054503437e-06, "loss": 1.0755, "step": 31233 }, { "epoch": 0.59, "learning_rate": 1.9043468382842401e-06, "loss": 0.7274, "step": 31234 }, { "epoch": 0.59, "learning_rate": 1.9041984733422877e-06, "loss": 0.7645, "step": 31235 }, { "epoch": 0.59, "learning_rate": 1.9040501106250402e-06, "loss": 0.8275, "step": 31236 }, { "epoch": 0.59, "learning_rate": 1.9039017501330501e-06, "loss": 0.9856, "step": 31237 }, { "epoch": 0.59, "learning_rate": 1.9037533918668737e-06, "loss": 1.283, "step": 31238 }, { "epoch": 0.59, "learning_rate": 1.9036050358270635e-06, "loss": 0.8858, "step": 31239 }, { "epoch": 0.59, "learning_rate": 1.9034566820141737e-06, "loss": 1.0318, "step": 31240 }, { "epoch": 0.59, "learning_rate": 1.9033083304287581e-06, "loss": 0.8477, "step": 31241 }, { "epoch": 0.59, "learning_rate": 1.9031599810713719e-06, "loss": 0.8406, "step": 31242 }, { "epoch": 0.59, "learning_rate": 1.9030116339425666e-06, "loss": 0.6743, "step": 31243 }, { "epoch": 0.59, "learning_rate": 1.9028632890428988e-06, "loss": 1.1673, "step": 31244 }, { "epoch": 0.59, "learning_rate": 1.902714946372921e-06, "loss": 0.9756, "step": 31245 }, { "epoch": 0.59, "learning_rate": 1.9025666059331865e-06, "loss": 0.8923, "step": 31246 }, { "epoch": 0.59, "learning_rate": 1.9024182677242503e-06, "loss": 0.801, "step": 31247 }, { "epoch": 0.59, "learning_rate": 1.9022699317466664e-06, "loss": 0.8252, "step": 31248 }, { "epoch": 0.59, "learning_rate": 1.9021215980009874e-06, "loss": 1.0336, "step": 31249 }, { "epoch": 0.59, "learning_rate": 1.9019732664877692e-06, "loss": 1.0767, "step": 31250 }, { "epoch": 0.59, "learning_rate": 1.9018249372075642e-06, "loss": 0.826, "step": 31251 }, { "epoch": 0.59, "learning_rate": 1.9016766101609255e-06, "loss": 1.1105, "step": 31252 }, { "epoch": 0.59, "learning_rate": 1.9015282853484091e-06, "loss": 0.9056, "step": 31253 }, { "epoch": 0.59, "learning_rate": 1.9013799627705673e-06, "loss": 0.8459, "step": 31254 }, { "epoch": 0.59, "learning_rate": 1.9012316424279536e-06, "loss": 0.9203, "step": 31255 }, { "epoch": 0.59, "learning_rate": 1.9010833243211237e-06, "loss": 1.017, "step": 31256 }, { "epoch": 0.59, "learning_rate": 1.9009350084506307e-06, "loss": 1.1823, "step": 31257 }, { "epoch": 0.59, "learning_rate": 1.9007866948170267e-06, "loss": 0.878, "step": 31258 }, { "epoch": 0.59, "learning_rate": 1.9006383834208677e-06, "loss": 0.8474, "step": 31259 }, { "epoch": 0.59, "learning_rate": 1.9004900742627065e-06, "loss": 0.822, "step": 31260 }, { "epoch": 0.59, "learning_rate": 1.9003417673430962e-06, "loss": 1.0844, "step": 31261 }, { "epoch": 0.59, "learning_rate": 1.900193462662592e-06, "loss": 1.0522, "step": 31262 }, { "epoch": 0.59, "learning_rate": 1.9000451602217474e-06, "loss": 1.1161, "step": 31263 }, { "epoch": 0.59, "learning_rate": 1.899896860021115e-06, "loss": 0.628, "step": 31264 }, { "epoch": 0.59, "learning_rate": 1.89974856206125e-06, "loss": 0.8289, "step": 31265 }, { "epoch": 0.59, "learning_rate": 1.8996002663427054e-06, "loss": 0.7972, "step": 31266 }, { "epoch": 0.59, "learning_rate": 1.899451972866034e-06, "loss": 0.9646, "step": 31267 }, { "epoch": 0.59, "learning_rate": 1.8993036816317912e-06, "loss": 1.0668, "step": 31268 }, { "epoch": 0.59, "learning_rate": 1.8991553926405305e-06, "loss": 1.1381, "step": 31269 }, { "epoch": 0.59, "learning_rate": 1.8990071058928043e-06, "loss": 0.8478, "step": 31270 }, { "epoch": 0.59, "learning_rate": 1.898858821389168e-06, "loss": 0.9637, "step": 31271 }, { "epoch": 0.59, "learning_rate": 1.898710539130174e-06, "loss": 0.9003, "step": 31272 }, { "epoch": 0.59, "learning_rate": 1.898562259116376e-06, "loss": 0.8613, "step": 31273 }, { "epoch": 0.59, "learning_rate": 1.8984139813483289e-06, "loss": 1.1495, "step": 31274 }, { "epoch": 0.59, "learning_rate": 1.8982657058265853e-06, "loss": 1.2085, "step": 31275 }, { "epoch": 0.59, "learning_rate": 1.8981174325516982e-06, "loss": 0.7885, "step": 31276 }, { "epoch": 0.59, "learning_rate": 1.8979691615242233e-06, "loss": 0.735, "step": 31277 }, { "epoch": 0.59, "learning_rate": 1.897820892744713e-06, "loss": 0.9664, "step": 31278 }, { "epoch": 0.59, "learning_rate": 1.8976726262137203e-06, "loss": 0.6808, "step": 31279 }, { "epoch": 0.59, "learning_rate": 1.8975243619318002e-06, "loss": 1.1727, "step": 31280 }, { "epoch": 0.59, "learning_rate": 1.8973760998995052e-06, "loss": 1.0499, "step": 31281 }, { "epoch": 0.59, "learning_rate": 1.897227840117389e-06, "loss": 0.9671, "step": 31282 }, { "epoch": 0.59, "learning_rate": 1.8970795825860067e-06, "loss": 1.1472, "step": 31283 }, { "epoch": 0.59, "learning_rate": 1.8969313273059106e-06, "loss": 0.9194, "step": 31284 }, { "epoch": 0.59, "learning_rate": 1.8967830742776534e-06, "loss": 0.8204, "step": 31285 }, { "epoch": 0.59, "learning_rate": 1.8966348235017906e-06, "loss": 0.9753, "step": 31286 }, { "epoch": 0.59, "learning_rate": 1.8964865749788747e-06, "loss": 0.9465, "step": 31287 }, { "epoch": 0.59, "learning_rate": 1.8963383287094592e-06, "loss": 1.0607, "step": 31288 }, { "epoch": 0.59, "learning_rate": 1.8961900846940977e-06, "loss": 0.8143, "step": 31289 }, { "epoch": 0.59, "learning_rate": 1.8960418429333449e-06, "loss": 0.9049, "step": 31290 }, { "epoch": 0.59, "learning_rate": 1.895893603427752e-06, "loss": 0.926, "step": 31291 }, { "epoch": 0.59, "learning_rate": 1.895745366177875e-06, "loss": 0.812, "step": 31292 }, { "epoch": 0.59, "learning_rate": 1.895597131184266e-06, "loss": 0.8994, "step": 31293 }, { "epoch": 0.59, "learning_rate": 1.895448898447478e-06, "loss": 1.2085, "step": 31294 }, { "epoch": 0.59, "learning_rate": 1.8953006679680658e-06, "loss": 0.9781, "step": 31295 }, { "epoch": 0.59, "learning_rate": 1.895152439746583e-06, "loss": 0.9078, "step": 31296 }, { "epoch": 0.59, "learning_rate": 1.895004213783581e-06, "loss": 0.9853, "step": 31297 }, { "epoch": 0.59, "learning_rate": 1.8948559900796159e-06, "loss": 0.8276, "step": 31298 }, { "epoch": 0.59, "learning_rate": 1.8947077686352403e-06, "loss": 1.1254, "step": 31299 }, { "epoch": 0.59, "learning_rate": 1.894559549451006e-06, "loss": 1.1182, "step": 31300 }, { "epoch": 0.59, "learning_rate": 1.8944113325274689e-06, "loss": 0.8343, "step": 31301 }, { "epoch": 0.59, "learning_rate": 1.8942631178651808e-06, "loss": 0.9362, "step": 31302 }, { "epoch": 0.59, "learning_rate": 1.8941149054646952e-06, "loss": 0.9263, "step": 31303 }, { "epoch": 0.59, "learning_rate": 1.8939666953265668e-06, "loss": 0.8518, "step": 31304 }, { "epoch": 0.59, "learning_rate": 1.8938184874513483e-06, "loss": 0.6902, "step": 31305 }, { "epoch": 0.59, "learning_rate": 1.8936702818395918e-06, "loss": 1.2502, "step": 31306 }, { "epoch": 0.59, "learning_rate": 1.8935220784918532e-06, "loss": 0.8144, "step": 31307 }, { "epoch": 0.59, "learning_rate": 1.8933738774086838e-06, "loss": 0.8557, "step": 31308 }, { "epoch": 0.59, "learning_rate": 1.8932256785906377e-06, "loss": 0.8098, "step": 31309 }, { "epoch": 0.59, "learning_rate": 1.8930774820382685e-06, "loss": 0.641, "step": 31310 }, { "epoch": 0.59, "learning_rate": 1.8929292877521298e-06, "loss": 1.0492, "step": 31311 }, { "epoch": 0.59, "learning_rate": 1.8927810957327735e-06, "loss": 0.9241, "step": 31312 }, { "epoch": 0.59, "learning_rate": 1.8926329059807552e-06, "loss": 1.1118, "step": 31313 }, { "epoch": 0.59, "learning_rate": 1.892484718496627e-06, "loss": 1.0192, "step": 31314 }, { "epoch": 0.59, "learning_rate": 1.892336533280941e-06, "loss": 0.793, "step": 31315 }, { "epoch": 0.59, "learning_rate": 1.8921883503342523e-06, "loss": 0.7647, "step": 31316 }, { "epoch": 0.59, "learning_rate": 1.8920401696571142e-06, "loss": 0.9421, "step": 31317 }, { "epoch": 0.59, "learning_rate": 1.8918919912500783e-06, "loss": 1.0377, "step": 31318 }, { "epoch": 0.59, "learning_rate": 1.8917438151137002e-06, "loss": 1.0248, "step": 31319 }, { "epoch": 0.59, "learning_rate": 1.8915956412485324e-06, "loss": 1.1605, "step": 31320 }, { "epoch": 0.59, "learning_rate": 1.8914474696551263e-06, "loss": 0.789, "step": 31321 }, { "epoch": 0.59, "learning_rate": 1.891299300334038e-06, "loss": 0.8797, "step": 31322 }, { "epoch": 0.59, "learning_rate": 1.8911511332858186e-06, "loss": 0.8995, "step": 31323 }, { "epoch": 0.59, "learning_rate": 1.8910029685110221e-06, "loss": 1.0292, "step": 31324 }, { "epoch": 0.59, "learning_rate": 1.8908548060102024e-06, "loss": 1.0215, "step": 31325 }, { "epoch": 0.59, "learning_rate": 1.8907066457839127e-06, "loss": 0.9203, "step": 31326 }, { "epoch": 0.59, "learning_rate": 1.8905584878327044e-06, "loss": 0.8124, "step": 31327 }, { "epoch": 0.59, "learning_rate": 1.890410332157133e-06, "loss": 1.0092, "step": 31328 }, { "epoch": 0.59, "learning_rate": 1.8902621787577501e-06, "loss": 0.8871, "step": 31329 }, { "epoch": 0.59, "learning_rate": 1.8901140276351098e-06, "loss": 0.8434, "step": 31330 }, { "epoch": 0.59, "learning_rate": 1.889965878789765e-06, "loss": 0.9283, "step": 31331 }, { "epoch": 0.59, "learning_rate": 1.8898177322222693e-06, "loss": 0.9873, "step": 31332 }, { "epoch": 0.59, "learning_rate": 1.8896695879331745e-06, "loss": 1.0437, "step": 31333 }, { "epoch": 0.59, "learning_rate": 1.889521445923036e-06, "loss": 0.8736, "step": 31334 }, { "epoch": 0.59, "learning_rate": 1.8893733061924052e-06, "loss": 0.7097, "step": 31335 }, { "epoch": 0.59, "learning_rate": 1.8892251687418351e-06, "loss": 0.8098, "step": 31336 }, { "epoch": 0.59, "learning_rate": 1.88907703357188e-06, "loss": 0.9493, "step": 31337 }, { "epoch": 0.59, "learning_rate": 1.888928900683093e-06, "loss": 1.1191, "step": 31338 }, { "epoch": 0.59, "learning_rate": 1.8887807700760256e-06, "loss": 0.8819, "step": 31339 }, { "epoch": 0.59, "learning_rate": 1.8886326417512332e-06, "loss": 0.9034, "step": 31340 }, { "epoch": 0.59, "learning_rate": 1.8884845157092678e-06, "loss": 0.8372, "step": 31341 }, { "epoch": 0.59, "learning_rate": 1.8883363919506814e-06, "loss": 0.7859, "step": 31342 }, { "epoch": 0.59, "learning_rate": 1.8881882704760291e-06, "loss": 1.0842, "step": 31343 }, { "epoch": 0.59, "learning_rate": 1.8880401512858626e-06, "loss": 0.8816, "step": 31344 }, { "epoch": 0.59, "learning_rate": 1.887892034380735e-06, "loss": 0.8097, "step": 31345 }, { "epoch": 0.59, "learning_rate": 1.8877439197612005e-06, "loss": 0.9325, "step": 31346 }, { "epoch": 0.59, "learning_rate": 1.8875958074278116e-06, "loss": 0.8199, "step": 31347 }, { "epoch": 0.59, "learning_rate": 1.8874476973811202e-06, "loss": 0.8153, "step": 31348 }, { "epoch": 0.59, "learning_rate": 1.8872995896216813e-06, "loss": 1.0601, "step": 31349 }, { "epoch": 0.59, "learning_rate": 1.8871514841500465e-06, "loss": 1.1611, "step": 31350 }, { "epoch": 0.59, "learning_rate": 1.8870033809667692e-06, "loss": 0.9096, "step": 31351 }, { "epoch": 0.59, "learning_rate": 1.8868552800724028e-06, "loss": 0.8029, "step": 31352 }, { "epoch": 0.59, "learning_rate": 1.8867071814675001e-06, "loss": 0.9697, "step": 31353 }, { "epoch": 0.59, "learning_rate": 1.8865590851526127e-06, "loss": 0.8918, "step": 31354 }, { "epoch": 0.59, "learning_rate": 1.8864109911282965e-06, "loss": 0.7775, "step": 31355 }, { "epoch": 0.59, "learning_rate": 1.8862628993951026e-06, "loss": 1.0686, "step": 31356 }, { "epoch": 0.59, "learning_rate": 1.886114809953583e-06, "loss": 0.7925, "step": 31357 }, { "epoch": 0.59, "learning_rate": 1.8859667228042927e-06, "loss": 0.9461, "step": 31358 }, { "epoch": 0.59, "learning_rate": 1.8858186379477845e-06, "loss": 0.9111, "step": 31359 }, { "epoch": 0.59, "learning_rate": 1.885670555384609e-06, "loss": 0.9515, "step": 31360 }, { "epoch": 0.59, "learning_rate": 1.8855224751153224e-06, "loss": 0.8799, "step": 31361 }, { "epoch": 0.59, "learning_rate": 1.885374397140476e-06, "loss": 1.205, "step": 31362 }, { "epoch": 0.59, "learning_rate": 1.8852263214606214e-06, "loss": 0.866, "step": 31363 }, { "epoch": 0.59, "learning_rate": 1.8850782480763141e-06, "loss": 0.7185, "step": 31364 }, { "epoch": 0.59, "learning_rate": 1.8849301769881052e-06, "loss": 0.8834, "step": 31365 }, { "epoch": 0.59, "learning_rate": 1.8847821081965475e-06, "loss": 0.713, "step": 31366 }, { "epoch": 0.59, "learning_rate": 1.8846340417021959e-06, "loss": 0.7775, "step": 31367 }, { "epoch": 0.59, "learning_rate": 1.8844859775056018e-06, "loss": 1.1305, "step": 31368 }, { "epoch": 0.59, "learning_rate": 1.8843379156073172e-06, "loss": 1.0125, "step": 31369 }, { "epoch": 0.59, "learning_rate": 1.8841898560078966e-06, "loss": 0.8863, "step": 31370 }, { "epoch": 0.59, "learning_rate": 1.8840417987078922e-06, "loss": 0.8805, "step": 31371 }, { "epoch": 0.59, "learning_rate": 1.8838937437078565e-06, "loss": 1.0792, "step": 31372 }, { "epoch": 0.59, "learning_rate": 1.883745691008343e-06, "loss": 0.6734, "step": 31373 }, { "epoch": 0.59, "learning_rate": 1.8835976406099043e-06, "loss": 0.8196, "step": 31374 }, { "epoch": 0.59, "learning_rate": 1.8834495925130923e-06, "loss": 1.1784, "step": 31375 }, { "epoch": 0.59, "learning_rate": 1.8833015467184615e-06, "loss": 1.0275, "step": 31376 }, { "epoch": 0.59, "learning_rate": 1.8831535032265642e-06, "loss": 0.8805, "step": 31377 }, { "epoch": 0.59, "learning_rate": 1.8830054620379512e-06, "loss": 0.8331, "step": 31378 }, { "epoch": 0.59, "learning_rate": 1.8828574231531777e-06, "loss": 0.9219, "step": 31379 }, { "epoch": 0.59, "learning_rate": 1.8827093865727962e-06, "loss": 1.1304, "step": 31380 }, { "epoch": 0.59, "learning_rate": 1.8825613522973579e-06, "loss": 1.0356, "step": 31381 }, { "epoch": 0.59, "learning_rate": 1.8824133203274178e-06, "loss": 0.9239, "step": 31382 }, { "epoch": 0.59, "learning_rate": 1.8822652906635271e-06, "loss": 1.0444, "step": 31383 }, { "epoch": 0.59, "learning_rate": 1.882117263306238e-06, "loss": 0.9133, "step": 31384 }, { "epoch": 0.59, "learning_rate": 1.881969238256105e-06, "loss": 0.8678, "step": 31385 }, { "epoch": 0.59, "learning_rate": 1.8818212155136794e-06, "loss": 1.0281, "step": 31386 }, { "epoch": 0.59, "learning_rate": 1.8816731950795152e-06, "loss": 1.2145, "step": 31387 }, { "epoch": 0.59, "learning_rate": 1.881525176954163e-06, "loss": 1.2496, "step": 31388 }, { "epoch": 0.59, "learning_rate": 1.8813771611381781e-06, "loss": 0.8323, "step": 31389 }, { "epoch": 0.59, "learning_rate": 1.8812291476321117e-06, "loss": 0.8141, "step": 31390 }, { "epoch": 0.59, "learning_rate": 1.881081136436516e-06, "loss": 0.7372, "step": 31391 }, { "epoch": 0.59, "learning_rate": 1.8809331275519443e-06, "loss": 0.9305, "step": 31392 }, { "epoch": 0.59, "learning_rate": 1.8807851209789504e-06, "loss": 1.0583, "step": 31393 }, { "epoch": 0.59, "learning_rate": 1.8806371167180845e-06, "loss": 1.0892, "step": 31394 }, { "epoch": 0.59, "learning_rate": 1.8804891147699016e-06, "loss": 0.8703, "step": 31395 }, { "epoch": 0.59, "learning_rate": 1.8803411151349537e-06, "loss": 0.9714, "step": 31396 }, { "epoch": 0.59, "learning_rate": 1.880193117813792e-06, "loss": 0.8044, "step": 31397 }, { "epoch": 0.59, "learning_rate": 1.880045122806971e-06, "loss": 0.9664, "step": 31398 }, { "epoch": 0.59, "learning_rate": 1.879897130115042e-06, "loss": 0.9772, "step": 31399 }, { "epoch": 0.59, "learning_rate": 1.8797491397385575e-06, "loss": 1.1025, "step": 31400 }, { "epoch": 0.59, "learning_rate": 1.8796011516780721e-06, "loss": 0.8489, "step": 31401 }, { "epoch": 0.59, "learning_rate": 1.8794531659341367e-06, "loss": 0.8111, "step": 31402 }, { "epoch": 0.59, "learning_rate": 1.8793051825073034e-06, "loss": 0.9575, "step": 31403 }, { "epoch": 0.59, "learning_rate": 1.879157201398126e-06, "loss": 0.8008, "step": 31404 }, { "epoch": 0.59, "learning_rate": 1.8790092226071565e-06, "loss": 0.9346, "step": 31405 }, { "epoch": 0.59, "learning_rate": 1.8788612461349473e-06, "loss": 1.1262, "step": 31406 }, { "epoch": 0.59, "learning_rate": 1.8787132719820513e-06, "loss": 1.0402, "step": 31407 }, { "epoch": 0.59, "learning_rate": 1.8785653001490215e-06, "loss": 0.8344, "step": 31408 }, { "epoch": 0.59, "learning_rate": 1.8784173306364087e-06, "loss": 1.0065, "step": 31409 }, { "epoch": 0.59, "learning_rate": 1.8782693634447675e-06, "loss": 0.8727, "step": 31410 }, { "epoch": 0.59, "learning_rate": 1.8781213985746494e-06, "loss": 0.8896, "step": 31411 }, { "epoch": 0.59, "learning_rate": 1.877973436026606e-06, "loss": 1.1042, "step": 31412 }, { "epoch": 0.59, "learning_rate": 1.877825475801191e-06, "loss": 0.9521, "step": 31413 }, { "epoch": 0.59, "learning_rate": 1.8776775178989577e-06, "loss": 0.9183, "step": 31414 }, { "epoch": 0.59, "learning_rate": 1.877529562320456e-06, "loss": 0.7751, "step": 31415 }, { "epoch": 0.59, "learning_rate": 1.8773816090662406e-06, "loss": 0.7345, "step": 31416 }, { "epoch": 0.59, "learning_rate": 1.8772336581368635e-06, "loss": 0.8466, "step": 31417 }, { "epoch": 0.59, "learning_rate": 1.877085709532876e-06, "loss": 1.0802, "step": 31418 }, { "epoch": 0.59, "learning_rate": 1.8769377632548318e-06, "loss": 0.7023, "step": 31419 }, { "epoch": 0.59, "learning_rate": 1.8767898193032829e-06, "loss": 0.9734, "step": 31420 }, { "epoch": 0.59, "learning_rate": 1.876641877678781e-06, "loss": 0.9764, "step": 31421 }, { "epoch": 0.59, "learning_rate": 1.8764939383818803e-06, "loss": 0.9461, "step": 31422 }, { "epoch": 0.59, "learning_rate": 1.876346001413132e-06, "loss": 0.8566, "step": 31423 }, { "epoch": 0.59, "learning_rate": 1.8761980667730877e-06, "loss": 0.853, "step": 31424 }, { "epoch": 0.59, "learning_rate": 1.876050134462302e-06, "loss": 1.0125, "step": 31425 }, { "epoch": 0.59, "learning_rate": 1.8759022044813248e-06, "loss": 0.8828, "step": 31426 }, { "epoch": 0.59, "learning_rate": 1.8757542768307102e-06, "loss": 0.884, "step": 31427 }, { "epoch": 0.59, "learning_rate": 1.8756063515110098e-06, "loss": 0.8906, "step": 31428 }, { "epoch": 0.59, "learning_rate": 1.8754584285227767e-06, "loss": 0.6806, "step": 31429 }, { "epoch": 0.59, "learning_rate": 1.8753105078665615e-06, "loss": 1.0637, "step": 31430 }, { "epoch": 0.59, "learning_rate": 1.8751625895429187e-06, "loss": 1.2253, "step": 31431 }, { "epoch": 0.59, "learning_rate": 1.8750146735524e-06, "loss": 0.7495, "step": 31432 }, { "epoch": 0.59, "learning_rate": 1.874866759895556e-06, "loss": 0.8871, "step": 31433 }, { "epoch": 0.59, "learning_rate": 1.8747188485729407e-06, "loss": 0.9312, "step": 31434 }, { "epoch": 0.59, "learning_rate": 1.874570939585107e-06, "loss": 0.9691, "step": 31435 }, { "epoch": 0.59, "learning_rate": 1.874423032932605e-06, "loss": 0.9158, "step": 31436 }, { "epoch": 0.59, "learning_rate": 1.8742751286159894e-06, "loss": 0.8359, "step": 31437 }, { "epoch": 0.59, "learning_rate": 1.874127226635811e-06, "loss": 0.8957, "step": 31438 }, { "epoch": 0.59, "learning_rate": 1.8739793269926215e-06, "loss": 1.0804, "step": 31439 }, { "epoch": 0.59, "learning_rate": 1.8738314296869748e-06, "loss": 0.8049, "step": 31440 }, { "epoch": 0.59, "learning_rate": 1.873683534719422e-06, "loss": 0.7978, "step": 31441 }, { "epoch": 0.59, "learning_rate": 1.873535642090515e-06, "loss": 0.7561, "step": 31442 }, { "epoch": 0.59, "learning_rate": 1.873387751800808e-06, "loss": 0.9864, "step": 31443 }, { "epoch": 0.59, "learning_rate": 1.873239863850852e-06, "loss": 0.8671, "step": 31444 }, { "epoch": 0.59, "learning_rate": 1.8730919782411977e-06, "loss": 0.8805, "step": 31445 }, { "epoch": 0.59, "learning_rate": 1.8729440949724001e-06, "loss": 0.9261, "step": 31446 }, { "epoch": 0.59, "learning_rate": 1.8727962140450095e-06, "loss": 0.8254, "step": 31447 }, { "epoch": 0.59, "learning_rate": 1.8726483354595785e-06, "loss": 0.8422, "step": 31448 }, { "epoch": 0.59, "learning_rate": 1.8725004592166593e-06, "loss": 1.0623, "step": 31449 }, { "epoch": 0.59, "learning_rate": 1.8723525853168048e-06, "loss": 1.0112, "step": 31450 }, { "epoch": 0.59, "learning_rate": 1.8722047137605654e-06, "loss": 0.9976, "step": 31451 }, { "epoch": 0.59, "learning_rate": 1.8720568445484955e-06, "loss": 0.8738, "step": 31452 }, { "epoch": 0.59, "learning_rate": 1.8719089776811459e-06, "loss": 0.8897, "step": 31453 }, { "epoch": 0.59, "learning_rate": 1.871761113159068e-06, "loss": 0.7856, "step": 31454 }, { "epoch": 0.59, "learning_rate": 1.8716132509828153e-06, "loss": 0.8914, "step": 31455 }, { "epoch": 0.59, "learning_rate": 1.8714653911529402e-06, "loss": 1.1391, "step": 31456 }, { "epoch": 0.59, "learning_rate": 1.8713175336699926e-06, "loss": 0.7825, "step": 31457 }, { "epoch": 0.59, "learning_rate": 1.8711696785345274e-06, "loss": 0.9215, "step": 31458 }, { "epoch": 0.59, "learning_rate": 1.8710218257470952e-06, "loss": 0.7644, "step": 31459 }, { "epoch": 0.59, "learning_rate": 1.8708739753082472e-06, "loss": 0.6949, "step": 31460 }, { "epoch": 0.59, "learning_rate": 1.8707261272185376e-06, "loss": 0.848, "step": 31461 }, { "epoch": 0.59, "learning_rate": 1.8705782814785167e-06, "loss": 1.1218, "step": 31462 }, { "epoch": 0.59, "learning_rate": 1.8704304380887367e-06, "loss": 0.9839, "step": 31463 }, { "epoch": 0.59, "learning_rate": 1.8702825970497513e-06, "loss": 0.7857, "step": 31464 }, { "epoch": 0.59, "learning_rate": 1.8701347583621116e-06, "loss": 0.7132, "step": 31465 }, { "epoch": 0.59, "learning_rate": 1.8699869220263678e-06, "loss": 0.6655, "step": 31466 }, { "epoch": 0.59, "learning_rate": 1.869839088043075e-06, "loss": 1.0546, "step": 31467 }, { "epoch": 0.59, "learning_rate": 1.8696912564127828e-06, "loss": 1.0917, "step": 31468 }, { "epoch": 0.59, "learning_rate": 1.8695434271360446e-06, "loss": 1.052, "step": 31469 }, { "epoch": 0.59, "learning_rate": 1.8693956002134116e-06, "loss": 0.8461, "step": 31470 }, { "epoch": 0.59, "learning_rate": 1.8692477756454366e-06, "loss": 0.8638, "step": 31471 }, { "epoch": 0.59, "learning_rate": 1.8690999534326703e-06, "loss": 0.8984, "step": 31472 }, { "epoch": 0.59, "learning_rate": 1.8689521335756662e-06, "loss": 0.7935, "step": 31473 }, { "epoch": 0.59, "learning_rate": 1.8688043160749755e-06, "loss": 0.797, "step": 31474 }, { "epoch": 0.59, "learning_rate": 1.8686565009311492e-06, "loss": 0.859, "step": 31475 }, { "epoch": 0.59, "learning_rate": 1.8685086881447407e-06, "loss": 0.8835, "step": 31476 }, { "epoch": 0.59, "learning_rate": 1.8683608777163021e-06, "loss": 0.7413, "step": 31477 }, { "epoch": 0.59, "learning_rate": 1.868213069646383e-06, "loss": 0.851, "step": 31478 }, { "epoch": 0.59, "learning_rate": 1.8680652639355384e-06, "loss": 0.7983, "step": 31479 }, { "epoch": 0.59, "learning_rate": 1.8679174605843186e-06, "loss": 0.8442, "step": 31480 }, { "epoch": 0.59, "learning_rate": 1.8677696595932749e-06, "loss": 1.181, "step": 31481 }, { "epoch": 0.59, "learning_rate": 1.8676218609629604e-06, "loss": 0.861, "step": 31482 }, { "epoch": 0.59, "learning_rate": 1.8674740646939263e-06, "loss": 0.6958, "step": 31483 }, { "epoch": 0.59, "learning_rate": 1.867326270786724e-06, "loss": 0.9428, "step": 31484 }, { "epoch": 0.59, "learning_rate": 1.8671784792419074e-06, "loss": 0.8799, "step": 31485 }, { "epoch": 0.59, "learning_rate": 1.8670306900600265e-06, "loss": 0.707, "step": 31486 }, { "epoch": 0.59, "learning_rate": 1.8668829032416324e-06, "loss": 0.9065, "step": 31487 }, { "epoch": 0.59, "learning_rate": 1.8667351187872798e-06, "loss": 0.9839, "step": 31488 }, { "epoch": 0.59, "learning_rate": 1.866587336697518e-06, "loss": 0.8296, "step": 31489 }, { "epoch": 0.59, "learning_rate": 1.8664395569728997e-06, "loss": 0.8723, "step": 31490 }, { "epoch": 0.59, "learning_rate": 1.8662917796139769e-06, "loss": 0.925, "step": 31491 }, { "epoch": 0.59, "learning_rate": 1.8661440046213012e-06, "loss": 0.8619, "step": 31492 }, { "epoch": 0.59, "learning_rate": 1.8659962319954234e-06, "loss": 1.0516, "step": 31493 }, { "epoch": 0.59, "learning_rate": 1.8658484617368974e-06, "loss": 1.2198, "step": 31494 }, { "epoch": 0.59, "learning_rate": 1.865700693846274e-06, "loss": 0.9944, "step": 31495 }, { "epoch": 0.59, "learning_rate": 1.8655529283241037e-06, "loss": 0.8558, "step": 31496 }, { "epoch": 0.59, "learning_rate": 1.8654051651709393e-06, "loss": 0.8937, "step": 31497 }, { "epoch": 0.59, "learning_rate": 1.8652574043873334e-06, "loss": 0.7534, "step": 31498 }, { "epoch": 0.59, "learning_rate": 1.865109645973836e-06, "loss": 1.0917, "step": 31499 }, { "epoch": 0.59, "learning_rate": 1.8649618899310007e-06, "loss": 1.132, "step": 31500 }, { "epoch": 0.59, "learning_rate": 1.864814136259378e-06, "loss": 0.95, "step": 31501 }, { "epoch": 0.59, "learning_rate": 1.8646663849595193e-06, "loss": 0.8728, "step": 31502 }, { "epoch": 0.59, "learning_rate": 1.8645186360319776e-06, "loss": 0.8279, "step": 31503 }, { "epoch": 0.59, "learning_rate": 1.8643708894773033e-06, "loss": 0.8661, "step": 31504 }, { "epoch": 0.59, "learning_rate": 1.864223145296048e-06, "loss": 1.1335, "step": 31505 }, { "epoch": 0.59, "learning_rate": 1.8640754034887648e-06, "loss": 1.0729, "step": 31506 }, { "epoch": 0.59, "learning_rate": 1.863927664056005e-06, "loss": 0.9003, "step": 31507 }, { "epoch": 0.59, "learning_rate": 1.8637799269983186e-06, "loss": 0.7758, "step": 31508 }, { "epoch": 0.59, "learning_rate": 1.8636321923162596e-06, "loss": 0.9313, "step": 31509 }, { "epoch": 0.59, "learning_rate": 1.8634844600103776e-06, "loss": 0.9617, "step": 31510 }, { "epoch": 0.59, "learning_rate": 1.8633367300812254e-06, "loss": 0.9778, "step": 31511 }, { "epoch": 0.59, "learning_rate": 1.8631890025293542e-06, "loss": 0.9261, "step": 31512 }, { "epoch": 0.59, "learning_rate": 1.8630412773553165e-06, "loss": 0.8491, "step": 31513 }, { "epoch": 0.59, "learning_rate": 1.862893554559662e-06, "loss": 0.9363, "step": 31514 }, { "epoch": 0.59, "learning_rate": 1.8627458341429444e-06, "loss": 0.7847, "step": 31515 }, { "epoch": 0.59, "learning_rate": 1.8625981161057145e-06, "loss": 0.789, "step": 31516 }, { "epoch": 0.59, "learning_rate": 1.8624504004485222e-06, "loss": 0.7037, "step": 31517 }, { "epoch": 0.59, "learning_rate": 1.8623026871719213e-06, "loss": 0.8961, "step": 31518 }, { "epoch": 0.59, "learning_rate": 1.8621549762764634e-06, "loss": 0.9853, "step": 31519 }, { "epoch": 0.59, "learning_rate": 1.862007267762698e-06, "loss": 1.0198, "step": 31520 }, { "epoch": 0.59, "learning_rate": 1.8618595616311792e-06, "loss": 0.7483, "step": 31521 }, { "epoch": 0.59, "learning_rate": 1.8617118578824567e-06, "loss": 0.6413, "step": 31522 }, { "epoch": 0.59, "learning_rate": 1.8615641565170817e-06, "loss": 0.7697, "step": 31523 }, { "epoch": 0.59, "learning_rate": 1.8614164575356077e-06, "loss": 0.818, "step": 31524 }, { "epoch": 0.59, "learning_rate": 1.8612687609385845e-06, "loss": 1.019, "step": 31525 }, { "epoch": 0.59, "learning_rate": 1.861121066726564e-06, "loss": 0.9339, "step": 31526 }, { "epoch": 0.59, "learning_rate": 1.8609733749000985e-06, "loss": 0.8415, "step": 31527 }, { "epoch": 0.59, "learning_rate": 1.860825685459739e-06, "loss": 0.8587, "step": 31528 }, { "epoch": 0.59, "learning_rate": 1.8606779984060355e-06, "loss": 0.8565, "step": 31529 }, { "epoch": 0.59, "learning_rate": 1.8605303137395419e-06, "loss": 0.8996, "step": 31530 }, { "epoch": 0.59, "learning_rate": 1.8603826314608082e-06, "loss": 0.9908, "step": 31531 }, { "epoch": 0.59, "learning_rate": 1.860234951570386e-06, "loss": 0.925, "step": 31532 }, { "epoch": 0.59, "learning_rate": 1.8600872740688267e-06, "loss": 0.7546, "step": 31533 }, { "epoch": 0.59, "learning_rate": 1.8599395989566827e-06, "loss": 0.8385, "step": 31534 }, { "epoch": 0.59, "learning_rate": 1.8597919262345033e-06, "loss": 0.7642, "step": 31535 }, { "epoch": 0.59, "learning_rate": 1.8596442559028423e-06, "loss": 0.9659, "step": 31536 }, { "epoch": 0.6, "learning_rate": 1.8594965879622501e-06, "loss": 1.071, "step": 31537 }, { "epoch": 0.6, "learning_rate": 1.859348922413277e-06, "loss": 0.819, "step": 31538 }, { "epoch": 0.6, "learning_rate": 1.859201259256476e-06, "loss": 0.9876, "step": 31539 }, { "epoch": 0.6, "learning_rate": 1.8590535984923982e-06, "loss": 0.9278, "step": 31540 }, { "epoch": 0.6, "learning_rate": 1.8589059401215935e-06, "loss": 0.8564, "step": 31541 }, { "epoch": 0.6, "learning_rate": 1.8587582841446156e-06, "loss": 0.8314, "step": 31542 }, { "epoch": 0.6, "learning_rate": 1.8586106305620147e-06, "loss": 0.9266, "step": 31543 }, { "epoch": 0.6, "learning_rate": 1.8584629793743409e-06, "loss": 1.0022, "step": 31544 }, { "epoch": 0.6, "learning_rate": 1.8583153305821475e-06, "loss": 0.7876, "step": 31545 }, { "epoch": 0.6, "learning_rate": 1.8581676841859847e-06, "loss": 0.9869, "step": 31546 }, { "epoch": 0.6, "learning_rate": 1.8580200401864035e-06, "loss": 0.9438, "step": 31547 }, { "epoch": 0.6, "learning_rate": 1.8578723985839567e-06, "loss": 0.9894, "step": 31548 }, { "epoch": 0.6, "learning_rate": 1.8577247593791948e-06, "loss": 0.9202, "step": 31549 }, { "epoch": 0.6, "learning_rate": 1.857577122572668e-06, "loss": 1.0403, "step": 31550 }, { "epoch": 0.6, "learning_rate": 1.857429488164929e-06, "loss": 0.938, "step": 31551 }, { "epoch": 0.6, "learning_rate": 1.8572818561565288e-06, "loss": 0.8354, "step": 31552 }, { "epoch": 0.6, "learning_rate": 1.857134226548018e-06, "loss": 0.87, "step": 31553 }, { "epoch": 0.6, "learning_rate": 1.8569865993399486e-06, "loss": 0.7533, "step": 31554 }, { "epoch": 0.6, "learning_rate": 1.856838974532872e-06, "loss": 0.9623, "step": 31555 }, { "epoch": 0.6, "learning_rate": 1.8566913521273378e-06, "loss": 0.9746, "step": 31556 }, { "epoch": 0.6, "learning_rate": 1.8565437321238993e-06, "loss": 0.9989, "step": 31557 }, { "epoch": 0.6, "learning_rate": 1.8563961145231068e-06, "loss": 0.9271, "step": 31558 }, { "epoch": 0.6, "learning_rate": 1.8562484993255105e-06, "loss": 0.815, "step": 31559 }, { "epoch": 0.6, "learning_rate": 1.8561008865316632e-06, "loss": 1.0564, "step": 31560 }, { "epoch": 0.6, "learning_rate": 1.8559532761421158e-06, "loss": 0.9036, "step": 31561 }, { "epoch": 0.6, "learning_rate": 1.8558056681574182e-06, "loss": 0.9426, "step": 31562 }, { "epoch": 0.6, "learning_rate": 1.8556580625781235e-06, "loss": 0.9549, "step": 31563 }, { "epoch": 0.6, "learning_rate": 1.8555104594047818e-06, "loss": 0.9443, "step": 31564 }, { "epoch": 0.6, "learning_rate": 1.8553628586379433e-06, "loss": 0.8111, "step": 31565 }, { "epoch": 0.6, "learning_rate": 1.855215260278161e-06, "loss": 0.767, "step": 31566 }, { "epoch": 0.6, "learning_rate": 1.855067664325985e-06, "loss": 0.8386, "step": 31567 }, { "epoch": 0.6, "learning_rate": 1.8549200707819655e-06, "loss": 0.9321, "step": 31568 }, { "epoch": 0.6, "learning_rate": 1.8547724796466563e-06, "loss": 1.2655, "step": 31569 }, { "epoch": 0.6, "learning_rate": 1.8546248909206065e-06, "loss": 0.9677, "step": 31570 }, { "epoch": 0.6, "learning_rate": 1.8544773046043665e-06, "loss": 0.8039, "step": 31571 }, { "epoch": 0.6, "learning_rate": 1.8543297206984898e-06, "loss": 1.135, "step": 31572 }, { "epoch": 0.6, "learning_rate": 1.8541821392035254e-06, "loss": 0.9813, "step": 31573 }, { "epoch": 0.6, "learning_rate": 1.854034560120025e-06, "loss": 0.977, "step": 31574 }, { "epoch": 0.6, "learning_rate": 1.8538869834485398e-06, "loss": 0.9257, "step": 31575 }, { "epoch": 0.6, "learning_rate": 1.8537394091896215e-06, "loss": 0.9647, "step": 31576 }, { "epoch": 0.6, "learning_rate": 1.8535918373438194e-06, "loss": 1.0135, "step": 31577 }, { "epoch": 0.6, "learning_rate": 1.8534442679116862e-06, "loss": 1.1284, "step": 31578 }, { "epoch": 0.6, "learning_rate": 1.8532967008937724e-06, "loss": 0.7731, "step": 31579 }, { "epoch": 0.6, "learning_rate": 1.8531491362906285e-06, "loss": 0.9, "step": 31580 }, { "epoch": 0.6, "learning_rate": 1.8530015741028057e-06, "loss": 1.0822, "step": 31581 }, { "epoch": 0.6, "learning_rate": 1.852854014330856e-06, "loss": 0.94, "step": 31582 }, { "epoch": 0.6, "learning_rate": 1.8527064569753283e-06, "loss": 0.7296, "step": 31583 }, { "epoch": 0.6, "learning_rate": 1.852558902036776e-06, "loss": 0.884, "step": 31584 }, { "epoch": 0.6, "learning_rate": 1.8524113495157489e-06, "loss": 0.9126, "step": 31585 }, { "epoch": 0.6, "learning_rate": 1.852263799412797e-06, "loss": 0.9211, "step": 31586 }, { "epoch": 0.6, "learning_rate": 1.8521162517284733e-06, "loss": 1.204, "step": 31587 }, { "epoch": 0.6, "learning_rate": 1.8519687064633268e-06, "loss": 1.1225, "step": 31588 }, { "epoch": 0.6, "learning_rate": 1.851821163617909e-06, "loss": 0.8994, "step": 31589 }, { "epoch": 0.6, "learning_rate": 1.8516736231927723e-06, "loss": 0.8525, "step": 31590 }, { "epoch": 0.6, "learning_rate": 1.8515260851884664e-06, "loss": 0.9544, "step": 31591 }, { "epoch": 0.6, "learning_rate": 1.8513785496055409e-06, "loss": 0.9041, "step": 31592 }, { "epoch": 0.6, "learning_rate": 1.851231016444549e-06, "loss": 1.1153, "step": 31593 }, { "epoch": 0.6, "learning_rate": 1.8510834857060406e-06, "loss": 0.9538, "step": 31594 }, { "epoch": 0.6, "learning_rate": 1.850935957390566e-06, "loss": 0.61, "step": 31595 }, { "epoch": 0.6, "learning_rate": 1.8507884314986769e-06, "loss": 0.9126, "step": 31596 }, { "epoch": 0.6, "learning_rate": 1.8506409080309246e-06, "loss": 0.8497, "step": 31597 }, { "epoch": 0.6, "learning_rate": 1.8504933869878577e-06, "loss": 0.8685, "step": 31598 }, { "epoch": 0.6, "learning_rate": 1.8503458683700298e-06, "loss": 0.9563, "step": 31599 }, { "epoch": 0.6, "learning_rate": 1.8501983521779907e-06, "loss": 1.0691, "step": 31600 }, { "epoch": 0.6, "learning_rate": 1.85005083841229e-06, "loss": 0.8782, "step": 31601 }, { "epoch": 0.6, "learning_rate": 1.8499033270734799e-06, "loss": 0.9451, "step": 31602 }, { "epoch": 0.6, "learning_rate": 1.8497558181621112e-06, "loss": 0.8661, "step": 31603 }, { "epoch": 0.6, "learning_rate": 1.8496083116787337e-06, "loss": 0.731, "step": 31604 }, { "epoch": 0.6, "learning_rate": 1.8494608076238995e-06, "loss": 1.0043, "step": 31605 }, { "epoch": 0.6, "learning_rate": 1.8493133059981588e-06, "loss": 0.905, "step": 31606 }, { "epoch": 0.6, "learning_rate": 1.8491658068020615e-06, "loss": 1.0411, "step": 31607 }, { "epoch": 0.6, "learning_rate": 1.84901831003616e-06, "loss": 0.9684, "step": 31608 }, { "epoch": 0.6, "learning_rate": 1.8488708157010035e-06, "loss": 0.7395, "step": 31609 }, { "epoch": 0.6, "learning_rate": 1.8487233237971431e-06, "loss": 0.9155, "step": 31610 }, { "epoch": 0.6, "learning_rate": 1.8485758343251308e-06, "loss": 0.9308, "step": 31611 }, { "epoch": 0.6, "learning_rate": 1.8484283472855164e-06, "loss": 1.0785, "step": 31612 }, { "epoch": 0.6, "learning_rate": 1.8482808626788492e-06, "loss": 0.9204, "step": 31613 }, { "epoch": 0.6, "learning_rate": 1.8481333805056828e-06, "loss": 0.738, "step": 31614 }, { "epoch": 0.6, "learning_rate": 1.8479859007665657e-06, "loss": 0.7714, "step": 31615 }, { "epoch": 0.6, "learning_rate": 1.847838423462049e-06, "loss": 0.7578, "step": 31616 }, { "epoch": 0.6, "learning_rate": 1.8476909485926839e-06, "loss": 0.8737, "step": 31617 }, { "epoch": 0.6, "learning_rate": 1.8475434761590212e-06, "loss": 1.1382, "step": 31618 }, { "epoch": 0.6, "learning_rate": 1.8473960061616103e-06, "loss": 1.1651, "step": 31619 }, { "epoch": 0.6, "learning_rate": 1.8472485386010035e-06, "loss": 0.9953, "step": 31620 }, { "epoch": 0.6, "learning_rate": 1.8471010734777506e-06, "loss": 0.6283, "step": 31621 }, { "epoch": 0.6, "learning_rate": 1.8469536107924018e-06, "loss": 0.7824, "step": 31622 }, { "epoch": 0.6, "learning_rate": 1.8468061505455082e-06, "loss": 0.8984, "step": 31623 }, { "epoch": 0.6, "learning_rate": 1.8466586927376208e-06, "loss": 1.0196, "step": 31624 }, { "epoch": 0.6, "learning_rate": 1.84651123736929e-06, "loss": 0.991, "step": 31625 }, { "epoch": 0.6, "learning_rate": 1.8463637844410654e-06, "loss": 0.9554, "step": 31626 }, { "epoch": 0.6, "learning_rate": 1.8462163339534991e-06, "loss": 0.9065, "step": 31627 }, { "epoch": 0.6, "learning_rate": 1.8460688859071408e-06, "loss": 0.8124, "step": 31628 }, { "epoch": 0.6, "learning_rate": 1.8459214403025407e-06, "loss": 0.7924, "step": 31629 }, { "epoch": 0.6, "learning_rate": 1.8457739971402502e-06, "loss": 0.8235, "step": 31630 }, { "epoch": 0.6, "learning_rate": 1.84562655642082e-06, "loss": 1.0237, "step": 31631 }, { "epoch": 0.6, "learning_rate": 1.8454791181447992e-06, "loss": 0.8865, "step": 31632 }, { "epoch": 0.6, "learning_rate": 1.8453316823127403e-06, "loss": 0.9819, "step": 31633 }, { "epoch": 0.6, "learning_rate": 1.845184248925193e-06, "loss": 0.8207, "step": 31634 }, { "epoch": 0.6, "learning_rate": 1.8450368179827064e-06, "loss": 0.8029, "step": 31635 }, { "epoch": 0.6, "learning_rate": 1.8448893894858327e-06, "loss": 1.0024, "step": 31636 }, { "epoch": 0.6, "learning_rate": 1.8447419634351227e-06, "loss": 1.0574, "step": 31637 }, { "epoch": 0.6, "learning_rate": 1.844594539831125e-06, "loss": 0.9093, "step": 31638 }, { "epoch": 0.6, "learning_rate": 1.844447118674392e-06, "loss": 0.9503, "step": 31639 }, { "epoch": 0.6, "learning_rate": 1.8442996999654733e-06, "loss": 0.7258, "step": 31640 }, { "epoch": 0.6, "learning_rate": 1.8441522837049187e-06, "loss": 0.8876, "step": 31641 }, { "epoch": 0.6, "learning_rate": 1.8440048698932806e-06, "loss": 0.9503, "step": 31642 }, { "epoch": 0.6, "learning_rate": 1.843857458531107e-06, "loss": 1.0669, "step": 31643 }, { "epoch": 0.6, "learning_rate": 1.8437100496189498e-06, "loss": 1.0177, "step": 31644 }, { "epoch": 0.6, "learning_rate": 1.8435626431573594e-06, "loss": 1.0556, "step": 31645 }, { "epoch": 0.6, "learning_rate": 1.8434152391468864e-06, "loss": 0.6804, "step": 31646 }, { "epoch": 0.6, "learning_rate": 1.8432678375880796e-06, "loss": 0.8924, "step": 31647 }, { "epoch": 0.6, "learning_rate": 1.8431204384814919e-06, "loss": 0.6956, "step": 31648 }, { "epoch": 0.6, "learning_rate": 1.8429730418276714e-06, "loss": 0.9878, "step": 31649 }, { "epoch": 0.6, "learning_rate": 1.84282564762717e-06, "loss": 1.2665, "step": 31650 }, { "epoch": 0.6, "learning_rate": 1.8426782558805367e-06, "loss": 0.9132, "step": 31651 }, { "epoch": 0.6, "learning_rate": 1.8425308665883238e-06, "loss": 1.1076, "step": 31652 }, { "epoch": 0.6, "learning_rate": 1.8423834797510792e-06, "loss": 1.0004, "step": 31653 }, { "epoch": 0.6, "learning_rate": 1.8422360953693556e-06, "loss": 0.9171, "step": 31654 }, { "epoch": 0.6, "learning_rate": 1.842088713443702e-06, "loss": 0.8849, "step": 31655 }, { "epoch": 0.6, "learning_rate": 1.8419413339746683e-06, "loss": 0.8796, "step": 31656 }, { "epoch": 0.6, "learning_rate": 1.8417939569628058e-06, "loss": 0.8501, "step": 31657 }, { "epoch": 0.6, "learning_rate": 1.841646582408665e-06, "loss": 0.9353, "step": 31658 }, { "epoch": 0.6, "learning_rate": 1.8414992103127948e-06, "loss": 0.804, "step": 31659 }, { "epoch": 0.6, "learning_rate": 1.8413518406757475e-06, "loss": 0.9584, "step": 31660 }, { "epoch": 0.6, "learning_rate": 1.841204473498072e-06, "loss": 0.998, "step": 31661 }, { "epoch": 0.6, "learning_rate": 1.8410571087803175e-06, "loss": 1.0485, "step": 31662 }, { "epoch": 0.6, "learning_rate": 1.840909746523037e-06, "loss": 0.978, "step": 31663 }, { "epoch": 0.6, "learning_rate": 1.8407623867267788e-06, "loss": 0.7978, "step": 31664 }, { "epoch": 0.6, "learning_rate": 1.8406150293920926e-06, "loss": 0.8083, "step": 31665 }, { "epoch": 0.6, "learning_rate": 1.8404676745195313e-06, "loss": 0.9334, "step": 31666 }, { "epoch": 0.6, "learning_rate": 1.8403203221096433e-06, "loss": 1.0359, "step": 31667 }, { "epoch": 0.6, "learning_rate": 1.840172972162978e-06, "loss": 1.0742, "step": 31668 }, { "epoch": 0.6, "learning_rate": 1.8400256246800874e-06, "loss": 0.9626, "step": 31669 }, { "epoch": 0.6, "learning_rate": 1.8398782796615205e-06, "loss": 0.8451, "step": 31670 }, { "epoch": 0.6, "learning_rate": 1.8397309371078278e-06, "loss": 0.9225, "step": 31671 }, { "epoch": 0.6, "learning_rate": 1.8395835970195597e-06, "loss": 0.8106, "step": 31672 }, { "epoch": 0.6, "learning_rate": 1.8394362593972665e-06, "loss": 0.7883, "step": 31673 }, { "epoch": 0.6, "learning_rate": 1.839288924241497e-06, "loss": 0.9635, "step": 31674 }, { "epoch": 0.6, "learning_rate": 1.8391415915528039e-06, "loss": 1.1573, "step": 31675 }, { "epoch": 0.6, "learning_rate": 1.8389942613317353e-06, "loss": 0.8445, "step": 31676 }, { "epoch": 0.6, "learning_rate": 1.8388469335788411e-06, "loss": 0.8832, "step": 31677 }, { "epoch": 0.6, "learning_rate": 1.8386996082946725e-06, "loss": 0.8944, "step": 31678 }, { "epoch": 0.6, "learning_rate": 1.8385522854797799e-06, "loss": 0.927, "step": 31679 }, { "epoch": 0.6, "learning_rate": 1.8384049651347119e-06, "loss": 1.1484, "step": 31680 }, { "epoch": 0.6, "learning_rate": 1.8382576472600205e-06, "loss": 1.037, "step": 31681 }, { "epoch": 0.6, "learning_rate": 1.8381103318562545e-06, "loss": 0.9946, "step": 31682 }, { "epoch": 0.6, "learning_rate": 1.8379630189239634e-06, "loss": 1.0113, "step": 31683 }, { "epoch": 0.6, "learning_rate": 1.837815708463699e-06, "loss": 0.8984, "step": 31684 }, { "epoch": 0.6, "learning_rate": 1.83766840047601e-06, "loss": 0.873, "step": 31685 }, { "epoch": 0.6, "learning_rate": 1.8375210949614464e-06, "loss": 0.8671, "step": 31686 }, { "epoch": 0.6, "learning_rate": 1.8373737919205597e-06, "loss": 1.0875, "step": 31687 }, { "epoch": 0.6, "learning_rate": 1.837226491353899e-06, "loss": 0.9003, "step": 31688 }, { "epoch": 0.6, "learning_rate": 1.837079193262013e-06, "loss": 1.001, "step": 31689 }, { "epoch": 0.6, "learning_rate": 1.8369318976454543e-06, "loss": 0.9209, "step": 31690 }, { "epoch": 0.6, "learning_rate": 1.836784604504771e-06, "loss": 0.9106, "step": 31691 }, { "epoch": 0.6, "learning_rate": 1.8366373138405136e-06, "loss": 0.6192, "step": 31692 }, { "epoch": 0.6, "learning_rate": 1.836490025653232e-06, "loss": 1.028, "step": 31693 }, { "epoch": 0.6, "learning_rate": 1.836342739943477e-06, "loss": 1.0875, "step": 31694 }, { "epoch": 0.6, "learning_rate": 1.8361954567117969e-06, "loss": 0.9923, "step": 31695 }, { "epoch": 0.6, "learning_rate": 1.8360481759587435e-06, "loss": 0.8706, "step": 31696 }, { "epoch": 0.6, "learning_rate": 1.8359008976848658e-06, "loss": 0.8362, "step": 31697 }, { "epoch": 0.6, "learning_rate": 1.8357536218907126e-06, "loss": 0.8342, "step": 31698 }, { "epoch": 0.6, "learning_rate": 1.8356063485768358e-06, "loss": 0.8022, "step": 31699 }, { "epoch": 0.6, "learning_rate": 1.835459077743785e-06, "loss": 1.1812, "step": 31700 }, { "epoch": 0.6, "learning_rate": 1.8353118093921085e-06, "loss": 0.9411, "step": 31701 }, { "epoch": 0.6, "learning_rate": 1.8351645435223587e-06, "loss": 0.7885, "step": 31702 }, { "epoch": 0.6, "learning_rate": 1.8350172801350836e-06, "loss": 0.9232, "step": 31703 }, { "epoch": 0.6, "learning_rate": 1.8348700192308328e-06, "loss": 0.9189, "step": 31704 }, { "epoch": 0.6, "learning_rate": 1.8347227608101582e-06, "loss": 0.7997, "step": 31705 }, { "epoch": 0.6, "learning_rate": 1.8345755048736074e-06, "loss": 1.1956, "step": 31706 }, { "epoch": 0.6, "learning_rate": 1.834428251421731e-06, "loss": 0.8035, "step": 31707 }, { "epoch": 0.6, "learning_rate": 1.8342810004550804e-06, "loss": 0.8332, "step": 31708 }, { "epoch": 0.6, "learning_rate": 1.8341337519742036e-06, "loss": 0.9559, "step": 31709 }, { "epoch": 0.6, "learning_rate": 1.8339865059796501e-06, "loss": 0.636, "step": 31710 }, { "epoch": 0.6, "learning_rate": 1.8338392624719719e-06, "loss": 1.0736, "step": 31711 }, { "epoch": 0.6, "learning_rate": 1.8336920214517168e-06, "loss": 0.9653, "step": 31712 }, { "epoch": 0.6, "learning_rate": 1.8335447829194353e-06, "loss": 0.9219, "step": 31713 }, { "epoch": 0.6, "learning_rate": 1.8333975468756772e-06, "loss": 0.7778, "step": 31714 }, { "epoch": 0.6, "learning_rate": 1.8332503133209922e-06, "loss": 0.9252, "step": 31715 }, { "epoch": 0.6, "learning_rate": 1.8331030822559298e-06, "loss": 0.8583, "step": 31716 }, { "epoch": 0.6, "learning_rate": 1.8329558536810404e-06, "loss": 0.8355, "step": 31717 }, { "epoch": 0.6, "learning_rate": 1.832808627596874e-06, "loss": 1.1697, "step": 31718 }, { "epoch": 0.6, "learning_rate": 1.8326614040039783e-06, "loss": 1.1556, "step": 31719 }, { "epoch": 0.6, "learning_rate": 1.8325141829029054e-06, "loss": 0.7745, "step": 31720 }, { "epoch": 0.6, "learning_rate": 1.832366964294204e-06, "loss": 0.7212, "step": 31721 }, { "epoch": 0.6, "learning_rate": 1.8322197481784231e-06, "loss": 0.9438, "step": 31722 }, { "epoch": 0.6, "learning_rate": 1.8320725345561143e-06, "loss": 0.8816, "step": 31723 }, { "epoch": 0.6, "learning_rate": 1.8319253234278262e-06, "loss": 0.938, "step": 31724 }, { "epoch": 0.6, "learning_rate": 1.8317781147941071e-06, "loss": 0.9081, "step": 31725 }, { "epoch": 0.6, "learning_rate": 1.8316309086555095e-06, "loss": 0.8983, "step": 31726 }, { "epoch": 0.6, "learning_rate": 1.831483705012581e-06, "loss": 0.9784, "step": 31727 }, { "epoch": 0.6, "learning_rate": 1.8313365038658713e-06, "loss": 1.0424, "step": 31728 }, { "epoch": 0.6, "learning_rate": 1.8311893052159314e-06, "loss": 0.8256, "step": 31729 }, { "epoch": 0.6, "learning_rate": 1.8310421090633105e-06, "loss": 0.8902, "step": 31730 }, { "epoch": 0.6, "learning_rate": 1.8308949154085564e-06, "loss": 1.0555, "step": 31731 }, { "epoch": 0.6, "learning_rate": 1.8307477242522214e-06, "loss": 0.9054, "step": 31732 }, { "epoch": 0.6, "learning_rate": 1.8306005355948537e-06, "loss": 0.9388, "step": 31733 }, { "epoch": 0.6, "learning_rate": 1.8304533494370025e-06, "loss": 0.871, "step": 31734 }, { "epoch": 0.6, "learning_rate": 1.8303061657792181e-06, "loss": 0.803, "step": 31735 }, { "epoch": 0.6, "learning_rate": 1.8301589846220508e-06, "loss": 0.904, "step": 31736 }, { "epoch": 0.6, "learning_rate": 1.8300118059660478e-06, "loss": 1.3177, "step": 31737 }, { "epoch": 0.6, "learning_rate": 1.8298646298117618e-06, "loss": 1.0816, "step": 31738 }, { "epoch": 0.6, "learning_rate": 1.8297174561597403e-06, "loss": 0.9405, "step": 31739 }, { "epoch": 0.6, "learning_rate": 1.8295702850105323e-06, "loss": 1.1056, "step": 31740 }, { "epoch": 0.6, "learning_rate": 1.829423116364689e-06, "loss": 0.7894, "step": 31741 }, { "epoch": 0.6, "learning_rate": 1.8292759502227595e-06, "loss": 0.889, "step": 31742 }, { "epoch": 0.6, "learning_rate": 1.829128786585292e-06, "loss": 1.2236, "step": 31743 }, { "epoch": 0.6, "learning_rate": 1.8289816254528381e-06, "loss": 0.8944, "step": 31744 }, { "epoch": 0.6, "learning_rate": 1.8288344668259463e-06, "loss": 0.9516, "step": 31745 }, { "epoch": 0.6, "learning_rate": 1.828687310705165e-06, "loss": 0.8535, "step": 31746 }, { "epoch": 0.6, "learning_rate": 1.8285401570910457e-06, "loss": 0.8363, "step": 31747 }, { "epoch": 0.6, "learning_rate": 1.8283930059841365e-06, "loss": 0.8944, "step": 31748 }, { "epoch": 0.6, "learning_rate": 1.8282458573849866e-06, "loss": 1.0255, "step": 31749 }, { "epoch": 0.6, "learning_rate": 1.828098711294147e-06, "loss": 0.9742, "step": 31750 }, { "epoch": 0.6, "learning_rate": 1.8279515677121661e-06, "loss": 0.7123, "step": 31751 }, { "epoch": 0.6, "learning_rate": 1.8278044266395927e-06, "loss": 1.0607, "step": 31752 }, { "epoch": 0.6, "learning_rate": 1.827657288076978e-06, "loss": 0.9103, "step": 31753 }, { "epoch": 0.6, "learning_rate": 1.8275101520248698e-06, "loss": 0.7437, "step": 31754 }, { "epoch": 0.6, "learning_rate": 1.8273630184838182e-06, "loss": 1.1768, "step": 31755 }, { "epoch": 0.6, "learning_rate": 1.8272158874543722e-06, "loss": 1.1278, "step": 31756 }, { "epoch": 0.6, "learning_rate": 1.8270687589370817e-06, "loss": 0.9436, "step": 31757 }, { "epoch": 0.6, "learning_rate": 1.8269216329324951e-06, "loss": 0.8247, "step": 31758 }, { "epoch": 0.6, "learning_rate": 1.8267745094411638e-06, "loss": 1.0349, "step": 31759 }, { "epoch": 0.6, "learning_rate": 1.8266273884636354e-06, "loss": 0.8776, "step": 31760 }, { "epoch": 0.6, "learning_rate": 1.826480270000459e-06, "loss": 0.8832, "step": 31761 }, { "epoch": 0.6, "learning_rate": 1.826333154052185e-06, "loss": 1.0825, "step": 31762 }, { "epoch": 0.6, "learning_rate": 1.826186040619363e-06, "loss": 1.0915, "step": 31763 }, { "epoch": 0.6, "learning_rate": 1.8260389297025404e-06, "loss": 1.0567, "step": 31764 }, { "epoch": 0.6, "learning_rate": 1.8258918213022688e-06, "loss": 1.1636, "step": 31765 }, { "epoch": 0.6, "learning_rate": 1.8257447154190965e-06, "loss": 0.8812, "step": 31766 }, { "epoch": 0.6, "learning_rate": 1.8255976120535718e-06, "loss": 0.883, "step": 31767 }, { "epoch": 0.6, "learning_rate": 1.825450511206246e-06, "loss": 0.9086, "step": 31768 }, { "epoch": 0.6, "learning_rate": 1.825303412877667e-06, "loss": 1.0361, "step": 31769 }, { "epoch": 0.6, "learning_rate": 1.8251563170683835e-06, "loss": 0.9308, "step": 31770 }, { "epoch": 0.6, "learning_rate": 1.825009223778947e-06, "loss": 0.9654, "step": 31771 }, { "epoch": 0.6, "learning_rate": 1.8248621330099048e-06, "loss": 1.0384, "step": 31772 }, { "epoch": 0.6, "learning_rate": 1.8247150447618062e-06, "loss": 0.7844, "step": 31773 }, { "epoch": 0.6, "learning_rate": 1.8245679590352016e-06, "loss": 0.9348, "step": 31774 }, { "epoch": 0.6, "learning_rate": 1.8244208758306391e-06, "loss": 1.2098, "step": 31775 }, { "epoch": 0.6, "learning_rate": 1.8242737951486682e-06, "loss": 0.8961, "step": 31776 }, { "epoch": 0.6, "learning_rate": 1.8241267169898386e-06, "loss": 0.9967, "step": 31777 }, { "epoch": 0.6, "learning_rate": 1.8239796413546995e-06, "loss": 0.8823, "step": 31778 }, { "epoch": 0.6, "learning_rate": 1.8238325682437985e-06, "loss": 0.803, "step": 31779 }, { "epoch": 0.6, "learning_rate": 1.8236854976576872e-06, "loss": 0.889, "step": 31780 }, { "epoch": 0.6, "learning_rate": 1.8235384295969134e-06, "loss": 1.1481, "step": 31781 }, { "epoch": 0.6, "learning_rate": 1.8233913640620255e-06, "loss": 1.1265, "step": 31782 }, { "epoch": 0.6, "learning_rate": 1.8232443010535738e-06, "loss": 0.8189, "step": 31783 }, { "epoch": 0.6, "learning_rate": 1.8230972405721076e-06, "loss": 0.7032, "step": 31784 }, { "epoch": 0.6, "learning_rate": 1.8229501826181745e-06, "loss": 0.9166, "step": 31785 }, { "epoch": 0.6, "learning_rate": 1.8228031271923258e-06, "loss": 1.0272, "step": 31786 }, { "epoch": 0.6, "learning_rate": 1.8226560742951097e-06, "loss": 1.0205, "step": 31787 }, { "epoch": 0.6, "learning_rate": 1.8225090239270737e-06, "loss": 1.0622, "step": 31788 }, { "epoch": 0.6, "learning_rate": 1.8223619760887695e-06, "loss": 0.7587, "step": 31789 }, { "epoch": 0.6, "learning_rate": 1.822214930780744e-06, "loss": 0.9116, "step": 31790 }, { "epoch": 0.6, "learning_rate": 1.822067888003547e-06, "loss": 1.0712, "step": 31791 }, { "epoch": 0.6, "learning_rate": 1.8219208477577288e-06, "loss": 0.8055, "step": 31792 }, { "epoch": 0.6, "learning_rate": 1.821773810043837e-06, "loss": 1.0898, "step": 31793 }, { "epoch": 0.6, "learning_rate": 1.8216267748624203e-06, "loss": 1.1389, "step": 31794 }, { "epoch": 0.6, "learning_rate": 1.8214797422140294e-06, "loss": 1.0396, "step": 31795 }, { "epoch": 0.6, "learning_rate": 1.8213327120992116e-06, "loss": 0.9666, "step": 31796 }, { "epoch": 0.6, "learning_rate": 1.821185684518517e-06, "loss": 0.736, "step": 31797 }, { "epoch": 0.6, "learning_rate": 1.8210386594724938e-06, "loss": 0.6098, "step": 31798 }, { "epoch": 0.6, "learning_rate": 1.8208916369616926e-06, "loss": 1.0187, "step": 31799 }, { "epoch": 0.6, "learning_rate": 1.8207446169866594e-06, "loss": 1.0826, "step": 31800 }, { "epoch": 0.6, "learning_rate": 1.8205975995479463e-06, "loss": 0.9161, "step": 31801 }, { "epoch": 0.6, "learning_rate": 1.8204505846461014e-06, "loss": 0.8826, "step": 31802 }, { "epoch": 0.6, "learning_rate": 1.8203035722816715e-06, "loss": 0.9914, "step": 31803 }, { "epoch": 0.6, "learning_rate": 1.8201565624552081e-06, "loss": 0.93, "step": 31804 }, { "epoch": 0.6, "learning_rate": 1.8200095551672598e-06, "loss": 1.0525, "step": 31805 }, { "epoch": 0.6, "learning_rate": 1.8198625504183737e-06, "loss": 1.1606, "step": 31806 }, { "epoch": 0.6, "learning_rate": 1.819715548209101e-06, "loss": 0.7904, "step": 31807 }, { "epoch": 0.6, "learning_rate": 1.8195685485399898e-06, "loss": 0.9086, "step": 31808 }, { "epoch": 0.6, "learning_rate": 1.8194215514115875e-06, "loss": 1.0397, "step": 31809 }, { "epoch": 0.6, "learning_rate": 1.8192745568244455e-06, "loss": 0.7484, "step": 31810 }, { "epoch": 0.6, "learning_rate": 1.8191275647791108e-06, "loss": 0.7566, "step": 31811 }, { "epoch": 0.6, "learning_rate": 1.8189805752761326e-06, "loss": 1.1739, "step": 31812 }, { "epoch": 0.6, "learning_rate": 1.8188335883160607e-06, "loss": 0.8736, "step": 31813 }, { "epoch": 0.6, "learning_rate": 1.8186866038994436e-06, "loss": 0.8349, "step": 31814 }, { "epoch": 0.6, "learning_rate": 1.8185396220268287e-06, "loss": 0.7776, "step": 31815 }, { "epoch": 0.6, "learning_rate": 1.8183926426987668e-06, "loss": 1.0414, "step": 31816 }, { "epoch": 0.6, "learning_rate": 1.8182456659158056e-06, "loss": 0.8992, "step": 31817 }, { "epoch": 0.6, "learning_rate": 1.8180986916784944e-06, "loss": 0.9587, "step": 31818 }, { "epoch": 0.6, "learning_rate": 1.8179517199873813e-06, "loss": 0.9326, "step": 31819 }, { "epoch": 0.6, "learning_rate": 1.8178047508430164e-06, "loss": 0.9648, "step": 31820 }, { "epoch": 0.6, "learning_rate": 1.8176577842459463e-06, "loss": 0.7843, "step": 31821 }, { "epoch": 0.6, "learning_rate": 1.8175108201967226e-06, "loss": 0.9391, "step": 31822 }, { "epoch": 0.6, "learning_rate": 1.8173638586958926e-06, "loss": 0.8009, "step": 31823 }, { "epoch": 0.6, "learning_rate": 1.8172168997440034e-06, "loss": 0.8708, "step": 31824 }, { "epoch": 0.6, "learning_rate": 1.8170699433416061e-06, "loss": 0.9371, "step": 31825 }, { "epoch": 0.6, "learning_rate": 1.8169229894892492e-06, "loss": 0.7822, "step": 31826 }, { "epoch": 0.6, "learning_rate": 1.8167760381874802e-06, "loss": 0.8822, "step": 31827 }, { "epoch": 0.6, "learning_rate": 1.8166290894368493e-06, "loss": 0.9561, "step": 31828 }, { "epoch": 0.6, "learning_rate": 1.8164821432379045e-06, "loss": 0.9263, "step": 31829 }, { "epoch": 0.6, "learning_rate": 1.8163351995911932e-06, "loss": 0.8935, "step": 31830 }, { "epoch": 0.6, "learning_rate": 1.8161882584972668e-06, "loss": 0.933, "step": 31831 }, { "epoch": 0.6, "learning_rate": 1.8160413199566715e-06, "loss": 0.8596, "step": 31832 }, { "epoch": 0.6, "learning_rate": 1.8158943839699566e-06, "loss": 0.7886, "step": 31833 }, { "epoch": 0.6, "learning_rate": 1.8157474505376722e-06, "loss": 0.9669, "step": 31834 }, { "epoch": 0.6, "learning_rate": 1.8156005196603656e-06, "loss": 0.9522, "step": 31835 }, { "epoch": 0.6, "learning_rate": 1.8154535913385848e-06, "loss": 0.8619, "step": 31836 }, { "epoch": 0.6, "learning_rate": 1.81530666557288e-06, "loss": 1.0828, "step": 31837 }, { "epoch": 0.6, "learning_rate": 1.8151597423637992e-06, "loss": 0.9026, "step": 31838 }, { "epoch": 0.6, "learning_rate": 1.8150128217118905e-06, "loss": 1.0219, "step": 31839 }, { "epoch": 0.6, "learning_rate": 1.8148659036177033e-06, "loss": 1.2108, "step": 31840 }, { "epoch": 0.6, "learning_rate": 1.8147189880817861e-06, "loss": 0.78, "step": 31841 }, { "epoch": 0.6, "learning_rate": 1.814572075104686e-06, "loss": 0.9459, "step": 31842 }, { "epoch": 0.6, "learning_rate": 1.8144251646869543e-06, "loss": 1.0832, "step": 31843 }, { "epoch": 0.6, "learning_rate": 1.8142782568291373e-06, "loss": 1.0365, "step": 31844 }, { "epoch": 0.6, "learning_rate": 1.8141313515317838e-06, "loss": 0.9918, "step": 31845 }, { "epoch": 0.6, "learning_rate": 1.813984448795443e-06, "loss": 0.7412, "step": 31846 }, { "epoch": 0.6, "learning_rate": 1.8138375486206638e-06, "loss": 0.9067, "step": 31847 }, { "epoch": 0.6, "learning_rate": 1.8136906510079932e-06, "loss": 0.6798, "step": 31848 }, { "epoch": 0.6, "learning_rate": 1.8135437559579817e-06, "loss": 0.8613, "step": 31849 }, { "epoch": 0.6, "learning_rate": 1.813396863471177e-06, "loss": 0.9432, "step": 31850 }, { "epoch": 0.6, "learning_rate": 1.8132499735481258e-06, "loss": 0.9513, "step": 31851 }, { "epoch": 0.6, "learning_rate": 1.8131030861893794e-06, "loss": 0.9472, "step": 31852 }, { "epoch": 0.6, "learning_rate": 1.8129562013954846e-06, "loss": 0.9154, "step": 31853 }, { "epoch": 0.6, "learning_rate": 1.812809319166991e-06, "loss": 0.8299, "step": 31854 }, { "epoch": 0.6, "learning_rate": 1.8126624395044448e-06, "loss": 1.0886, "step": 31855 }, { "epoch": 0.6, "learning_rate": 1.8125155624083973e-06, "loss": 1.0201, "step": 31856 }, { "epoch": 0.6, "learning_rate": 1.8123686878793956e-06, "loss": 0.8477, "step": 31857 }, { "epoch": 0.6, "learning_rate": 1.8122218159179872e-06, "loss": 1.0699, "step": 31858 }, { "epoch": 0.6, "learning_rate": 1.8120749465247218e-06, "loss": 0.9779, "step": 31859 }, { "epoch": 0.6, "learning_rate": 1.811928079700148e-06, "loss": 0.7822, "step": 31860 }, { "epoch": 0.6, "learning_rate": 1.8117812154448125e-06, "loss": 0.8552, "step": 31861 }, { "epoch": 0.6, "learning_rate": 1.8116343537592659e-06, "loss": 0.9214, "step": 31862 }, { "epoch": 0.6, "learning_rate": 1.8114874946440558e-06, "loss": 0.9572, "step": 31863 }, { "epoch": 0.6, "learning_rate": 1.811340638099729e-06, "loss": 1.0568, "step": 31864 }, { "epoch": 0.6, "learning_rate": 1.8111937841268362e-06, "loss": 0.7516, "step": 31865 }, { "epoch": 0.6, "learning_rate": 1.8110469327259245e-06, "loss": 0.9364, "step": 31866 }, { "epoch": 0.6, "learning_rate": 1.8109000838975416e-06, "loss": 0.7681, "step": 31867 }, { "epoch": 0.6, "learning_rate": 1.8107532376422377e-06, "loss": 1.175, "step": 31868 }, { "epoch": 0.6, "learning_rate": 1.81060639396056e-06, "loss": 1.0984, "step": 31869 }, { "epoch": 0.6, "learning_rate": 1.810459552853056e-06, "loss": 0.8206, "step": 31870 }, { "epoch": 0.6, "learning_rate": 1.8103127143202759e-06, "loss": 0.7346, "step": 31871 }, { "epoch": 0.6, "learning_rate": 1.8101658783627662e-06, "loss": 0.7091, "step": 31872 }, { "epoch": 0.6, "learning_rate": 1.8100190449810762e-06, "loss": 0.9894, "step": 31873 }, { "epoch": 0.6, "learning_rate": 1.809872214175754e-06, "loss": 1.0537, "step": 31874 }, { "epoch": 0.6, "learning_rate": 1.8097253859473484e-06, "loss": 0.8878, "step": 31875 }, { "epoch": 0.6, "learning_rate": 1.8095785602964056e-06, "loss": 0.8409, "step": 31876 }, { "epoch": 0.6, "learning_rate": 1.8094317372234765e-06, "loss": 0.7582, "step": 31877 }, { "epoch": 0.6, "learning_rate": 1.8092849167291083e-06, "loss": 0.8525, "step": 31878 }, { "epoch": 0.6, "learning_rate": 1.809138098813848e-06, "loss": 0.9186, "step": 31879 }, { "epoch": 0.6, "learning_rate": 1.8089912834782452e-06, "loss": 0.9766, "step": 31880 }, { "epoch": 0.6, "learning_rate": 1.8088444707228487e-06, "loss": 1.1495, "step": 31881 }, { "epoch": 0.6, "learning_rate": 1.8086976605482043e-06, "loss": 0.7468, "step": 31882 }, { "epoch": 0.6, "learning_rate": 1.8085508529548625e-06, "loss": 0.8011, "step": 31883 }, { "epoch": 0.6, "learning_rate": 1.808404047943371e-06, "loss": 0.9005, "step": 31884 }, { "epoch": 0.6, "learning_rate": 1.8082572455142764e-06, "loss": 0.6594, "step": 31885 }, { "epoch": 0.6, "learning_rate": 1.8081104456681292e-06, "loss": 0.7651, "step": 31886 }, { "epoch": 0.6, "learning_rate": 1.8079636484054755e-06, "loss": 0.9164, "step": 31887 }, { "epoch": 0.6, "learning_rate": 1.8078168537268643e-06, "loss": 0.941, "step": 31888 }, { "epoch": 0.6, "learning_rate": 1.8076700616328444e-06, "loss": 0.8265, "step": 31889 }, { "epoch": 0.6, "learning_rate": 1.8075232721239633e-06, "loss": 0.9196, "step": 31890 }, { "epoch": 0.6, "learning_rate": 1.807376485200768e-06, "loss": 0.9485, "step": 31891 }, { "epoch": 0.6, "learning_rate": 1.807229700863809e-06, "loss": 0.7845, "step": 31892 }, { "epoch": 0.6, "learning_rate": 1.8070829191136324e-06, "loss": 1.0318, "step": 31893 }, { "epoch": 0.6, "learning_rate": 1.8069361399507861e-06, "loss": 1.0018, "step": 31894 }, { "epoch": 0.6, "learning_rate": 1.8067893633758205e-06, "loss": 0.8121, "step": 31895 }, { "epoch": 0.6, "learning_rate": 1.806642589389282e-06, "loss": 0.8256, "step": 31896 }, { "epoch": 0.6, "learning_rate": 1.8064958179917178e-06, "loss": 0.9005, "step": 31897 }, { "epoch": 0.6, "learning_rate": 1.806349049183678e-06, "loss": 0.7984, "step": 31898 }, { "epoch": 0.6, "learning_rate": 1.8062022829657088e-06, "loss": 0.9908, "step": 31899 }, { "epoch": 0.6, "learning_rate": 1.8060555193383594e-06, "loss": 0.9778, "step": 31900 }, { "epoch": 0.6, "learning_rate": 1.8059087583021773e-06, "loss": 0.9597, "step": 31901 }, { "epoch": 0.6, "learning_rate": 1.805761999857711e-06, "loss": 0.9589, "step": 31902 }, { "epoch": 0.6, "learning_rate": 1.805615244005507e-06, "loss": 0.8065, "step": 31903 }, { "epoch": 0.6, "learning_rate": 1.8054684907461157e-06, "loss": 0.7487, "step": 31904 }, { "epoch": 0.6, "learning_rate": 1.8053217400800838e-06, "loss": 0.7893, "step": 31905 }, { "epoch": 0.6, "learning_rate": 1.8051749920079579e-06, "loss": 0.8592, "step": 31906 }, { "epoch": 0.6, "learning_rate": 1.8050282465302876e-06, "loss": 0.8007, "step": 31907 }, { "epoch": 0.6, "learning_rate": 1.8048815036476215e-06, "loss": 0.7777, "step": 31908 }, { "epoch": 0.6, "learning_rate": 1.8047347633605053e-06, "loss": 0.8223, "step": 31909 }, { "epoch": 0.6, "learning_rate": 1.8045880256694893e-06, "loss": 0.7298, "step": 31910 }, { "epoch": 0.6, "learning_rate": 1.8044412905751202e-06, "loss": 0.7715, "step": 31911 }, { "epoch": 0.6, "learning_rate": 1.8042945580779452e-06, "loss": 1.1955, "step": 31912 }, { "epoch": 0.6, "learning_rate": 1.8041478281785138e-06, "loss": 0.8452, "step": 31913 }, { "epoch": 0.6, "learning_rate": 1.8040011008773726e-06, "loss": 0.818, "step": 31914 }, { "epoch": 0.6, "learning_rate": 1.8038543761750693e-06, "loss": 0.9795, "step": 31915 }, { "epoch": 0.6, "learning_rate": 1.8037076540721537e-06, "loss": 0.9101, "step": 31916 }, { "epoch": 0.6, "learning_rate": 1.8035609345691724e-06, "loss": 0.6277, "step": 31917 }, { "epoch": 0.6, "learning_rate": 1.8034142176666719e-06, "loss": 0.8973, "step": 31918 }, { "epoch": 0.6, "learning_rate": 1.8032675033652024e-06, "loss": 0.9651, "step": 31919 }, { "epoch": 0.6, "learning_rate": 1.8031207916653104e-06, "loss": 0.8315, "step": 31920 }, { "epoch": 0.6, "learning_rate": 1.8029740825675438e-06, "loss": 0.8743, "step": 31921 }, { "epoch": 0.6, "learning_rate": 1.8028273760724507e-06, "loss": 0.8555, "step": 31922 }, { "epoch": 0.6, "learning_rate": 1.8026806721805795e-06, "loss": 0.8334, "step": 31923 }, { "epoch": 0.6, "learning_rate": 1.8025339708924761e-06, "loss": 0.83, "step": 31924 }, { "epoch": 0.6, "learning_rate": 1.8023872722086902e-06, "loss": 1.0613, "step": 31925 }, { "epoch": 0.6, "learning_rate": 1.802240576129769e-06, "loss": 0.935, "step": 31926 }, { "epoch": 0.6, "learning_rate": 1.8020938826562592e-06, "loss": 0.6994, "step": 31927 }, { "epoch": 0.6, "learning_rate": 1.80194719178871e-06, "loss": 0.9247, "step": 31928 }, { "epoch": 0.6, "learning_rate": 1.8018005035276692e-06, "loss": 0.9474, "step": 31929 }, { "epoch": 0.6, "learning_rate": 1.8016538178736826e-06, "loss": 0.8316, "step": 31930 }, { "epoch": 0.6, "learning_rate": 1.8015071348273003e-06, "loss": 1.1354, "step": 31931 }, { "epoch": 0.6, "learning_rate": 1.8013604543890688e-06, "loss": 1.0785, "step": 31932 }, { "epoch": 0.6, "learning_rate": 1.8012137765595354e-06, "loss": 1.063, "step": 31933 }, { "epoch": 0.6, "learning_rate": 1.801067101339249e-06, "loss": 0.8842, "step": 31934 }, { "epoch": 0.6, "learning_rate": 1.8009204287287562e-06, "loss": 0.821, "step": 31935 }, { "epoch": 0.6, "learning_rate": 1.8007737587286045e-06, "loss": 1.0326, "step": 31936 }, { "epoch": 0.6, "learning_rate": 1.800627091339343e-06, "loss": 1.1022, "step": 31937 }, { "epoch": 0.6, "learning_rate": 1.800480426561519e-06, "loss": 1.2166, "step": 31938 }, { "epoch": 0.6, "learning_rate": 1.8003337643956783e-06, "loss": 0.9607, "step": 31939 }, { "epoch": 0.6, "learning_rate": 1.8001871048423708e-06, "loss": 0.9151, "step": 31940 }, { "epoch": 0.6, "learning_rate": 1.800040447902143e-06, "loss": 0.723, "step": 31941 }, { "epoch": 0.6, "learning_rate": 1.7998937935755423e-06, "loss": 0.8084, "step": 31942 }, { "epoch": 0.6, "learning_rate": 1.7997471418631172e-06, "loss": 1.0469, "step": 31943 }, { "epoch": 0.6, "learning_rate": 1.7996004927654147e-06, "loss": 1.1446, "step": 31944 }, { "epoch": 0.6, "learning_rate": 1.799453846282982e-06, "loss": 0.8779, "step": 31945 }, { "epoch": 0.6, "learning_rate": 1.7993072024163683e-06, "loss": 0.9229, "step": 31946 }, { "epoch": 0.6, "learning_rate": 1.7991605611661195e-06, "loss": 0.755, "step": 31947 }, { "epoch": 0.6, "learning_rate": 1.799013922532783e-06, "loss": 0.8632, "step": 31948 }, { "epoch": 0.6, "learning_rate": 1.7988672865169071e-06, "loss": 0.8004, "step": 31949 }, { "epoch": 0.6, "learning_rate": 1.7987206531190402e-06, "loss": 1.0045, "step": 31950 }, { "epoch": 0.6, "learning_rate": 1.7985740223397278e-06, "loss": 0.8874, "step": 31951 }, { "epoch": 0.6, "learning_rate": 1.7984273941795194e-06, "loss": 1.0541, "step": 31952 }, { "epoch": 0.6, "learning_rate": 1.7982807686389613e-06, "loss": 0.853, "step": 31953 }, { "epoch": 0.6, "learning_rate": 1.7981341457186008e-06, "loss": 0.8345, "step": 31954 }, { "epoch": 0.6, "learning_rate": 1.797987525418987e-06, "loss": 0.6924, "step": 31955 }, { "epoch": 0.6, "learning_rate": 1.7978409077406653e-06, "loss": 1.2199, "step": 31956 }, { "epoch": 0.6, "learning_rate": 1.7976942926841837e-06, "loss": 0.9323, "step": 31957 }, { "epoch": 0.6, "learning_rate": 1.7975476802500912e-06, "loss": 0.8448, "step": 31958 }, { "epoch": 0.6, "learning_rate": 1.7974010704389342e-06, "loss": 0.7877, "step": 31959 }, { "epoch": 0.6, "learning_rate": 1.797254463251259e-06, "loss": 0.748, "step": 31960 }, { "epoch": 0.6, "learning_rate": 1.7971078586876148e-06, "loss": 0.6857, "step": 31961 }, { "epoch": 0.6, "learning_rate": 1.7969612567485482e-06, "loss": 1.1245, "step": 31962 }, { "epoch": 0.6, "learning_rate": 1.7968146574346063e-06, "loss": 0.9275, "step": 31963 }, { "epoch": 0.6, "learning_rate": 1.796668060746337e-06, "loss": 0.7925, "step": 31964 }, { "epoch": 0.6, "learning_rate": 1.7965214666842883e-06, "loss": 0.9865, "step": 31965 }, { "epoch": 0.6, "learning_rate": 1.7963748752490062e-06, "loss": 0.7859, "step": 31966 }, { "epoch": 0.6, "learning_rate": 1.796228286441039e-06, "loss": 0.98, "step": 31967 }, { "epoch": 0.6, "learning_rate": 1.7960817002609344e-06, "loss": 1.0227, "step": 31968 }, { "epoch": 0.6, "learning_rate": 1.7959351167092378e-06, "loss": 0.7979, "step": 31969 }, { "epoch": 0.6, "learning_rate": 1.7957885357864985e-06, "loss": 1.0188, "step": 31970 }, { "epoch": 0.6, "learning_rate": 1.7956419574932638e-06, "loss": 0.9604, "step": 31971 }, { "epoch": 0.6, "learning_rate": 1.7954953818300795e-06, "loss": 0.8203, "step": 31972 }, { "epoch": 0.6, "learning_rate": 1.7953488087974947e-06, "loss": 0.7896, "step": 31973 }, { "epoch": 0.6, "learning_rate": 1.7952022383960557e-06, "loss": 1.0981, "step": 31974 }, { "epoch": 0.6, "learning_rate": 1.795055670626309e-06, "loss": 1.0491, "step": 31975 }, { "epoch": 0.6, "learning_rate": 1.7949091054888041e-06, "loss": 1.1013, "step": 31976 }, { "epoch": 0.6, "learning_rate": 1.7947625429840863e-06, "loss": 0.7257, "step": 31977 }, { "epoch": 0.6, "learning_rate": 1.794615983112703e-06, "loss": 0.8448, "step": 31978 }, { "epoch": 0.6, "learning_rate": 1.7944694258752026e-06, "loss": 0.9016, "step": 31979 }, { "epoch": 0.6, "learning_rate": 1.7943228712721322e-06, "loss": 1.0446, "step": 31980 }, { "epoch": 0.6, "learning_rate": 1.7941763193040377e-06, "loss": 1.0262, "step": 31981 }, { "epoch": 0.6, "learning_rate": 1.7940297699714682e-06, "loss": 0.9168, "step": 31982 }, { "epoch": 0.6, "learning_rate": 1.793883223274969e-06, "loss": 0.9734, "step": 31983 }, { "epoch": 0.6, "learning_rate": 1.7937366792150884e-06, "loss": 0.9875, "step": 31984 }, { "epoch": 0.6, "learning_rate": 1.793590137792373e-06, "loss": 1.0011, "step": 31985 }, { "epoch": 0.6, "learning_rate": 1.7934435990073714e-06, "loss": 1.0332, "step": 31986 }, { "epoch": 0.6, "learning_rate": 1.7932970628606287e-06, "loss": 1.0388, "step": 31987 }, { "epoch": 0.6, "learning_rate": 1.7931505293526938e-06, "loss": 1.0045, "step": 31988 }, { "epoch": 0.6, "learning_rate": 1.7930039984841136e-06, "loss": 0.8947, "step": 31989 }, { "epoch": 0.6, "learning_rate": 1.7928574702554333e-06, "loss": 0.711, "step": 31990 }, { "epoch": 0.6, "learning_rate": 1.792710944667202e-06, "loss": 0.9645, "step": 31991 }, { "epoch": 0.6, "learning_rate": 1.7925644217199672e-06, "loss": 0.7901, "step": 31992 }, { "epoch": 0.6, "learning_rate": 1.7924179014142739e-06, "loss": 0.9496, "step": 31993 }, { "epoch": 0.6, "learning_rate": 1.7922713837506718e-06, "loss": 1.2044, "step": 31994 }, { "epoch": 0.6, "learning_rate": 1.7921248687297066e-06, "loss": 0.8798, "step": 31995 }, { "epoch": 0.6, "learning_rate": 1.7919783563519238e-06, "loss": 0.9419, "step": 31996 }, { "epoch": 0.6, "learning_rate": 1.791831846617874e-06, "loss": 0.9153, "step": 31997 }, { "epoch": 0.6, "learning_rate": 1.7916853395281013e-06, "loss": 0.8783, "step": 31998 }, { "epoch": 0.6, "learning_rate": 1.7915388350831537e-06, "loss": 0.9929, "step": 31999 }, { "epoch": 0.6, "learning_rate": 1.791392333283579e-06, "loss": 1.1193, "step": 32000 }, { "epoch": 0.6, "learning_rate": 1.7912458341299238e-06, "loss": 0.9612, "step": 32001 }, { "epoch": 0.6, "learning_rate": 1.7910993376227337e-06, "loss": 0.9671, "step": 32002 }, { "epoch": 0.6, "learning_rate": 1.7909528437625584e-06, "loss": 0.9479, "step": 32003 }, { "epoch": 0.6, "learning_rate": 1.7908063525499425e-06, "loss": 0.828, "step": 32004 }, { "epoch": 0.6, "learning_rate": 1.790659863985434e-06, "loss": 0.8324, "step": 32005 }, { "epoch": 0.6, "learning_rate": 1.7905133780695798e-06, "loss": 1.231, "step": 32006 }, { "epoch": 0.6, "learning_rate": 1.7903668948029275e-06, "loss": 1.0546, "step": 32007 }, { "epoch": 0.6, "learning_rate": 1.7902204141860224e-06, "loss": 0.6471, "step": 32008 }, { "epoch": 0.6, "learning_rate": 1.7900739362194136e-06, "loss": 0.9801, "step": 32009 }, { "epoch": 0.6, "learning_rate": 1.789927460903647e-06, "loss": 0.8034, "step": 32010 }, { "epoch": 0.6, "learning_rate": 1.7897809882392687e-06, "loss": 1.1167, "step": 32011 }, { "epoch": 0.6, "learning_rate": 1.7896345182268266e-06, "loss": 1.147, "step": 32012 }, { "epoch": 0.6, "learning_rate": 1.7894880508668677e-06, "loss": 1.0143, "step": 32013 }, { "epoch": 0.6, "learning_rate": 1.7893415861599379e-06, "loss": 0.7735, "step": 32014 }, { "epoch": 0.6, "learning_rate": 1.7891951241065858e-06, "loss": 0.9574, "step": 32015 }, { "epoch": 0.6, "learning_rate": 1.7890486647073573e-06, "loss": 0.7867, "step": 32016 }, { "epoch": 0.6, "learning_rate": 1.7889022079627984e-06, "loss": 0.7957, "step": 32017 }, { "epoch": 0.6, "learning_rate": 1.7887557538734579e-06, "loss": 0.8865, "step": 32018 }, { "epoch": 0.6, "learning_rate": 1.788609302439881e-06, "loss": 1.0163, "step": 32019 }, { "epoch": 0.6, "learning_rate": 1.7884628536626148e-06, "loss": 0.8312, "step": 32020 }, { "epoch": 0.6, "learning_rate": 1.7883164075422072e-06, "loss": 1.0149, "step": 32021 }, { "epoch": 0.6, "learning_rate": 1.7881699640792043e-06, "loss": 0.9826, "step": 32022 }, { "epoch": 0.6, "learning_rate": 1.7880235232741521e-06, "loss": 0.8343, "step": 32023 }, { "epoch": 0.6, "learning_rate": 1.7878770851275992e-06, "loss": 1.011, "step": 32024 }, { "epoch": 0.6, "learning_rate": 1.7877306496400909e-06, "loss": 1.1293, "step": 32025 }, { "epoch": 0.6, "learning_rate": 1.7875842168121745e-06, "loss": 0.7924, "step": 32026 }, { "epoch": 0.6, "learning_rate": 1.7874377866443971e-06, "loss": 0.8739, "step": 32027 }, { "epoch": 0.6, "learning_rate": 1.7872913591373054e-06, "loss": 1.0107, "step": 32028 }, { "epoch": 0.6, "learning_rate": 1.787144934291445e-06, "loss": 0.9485, "step": 32029 }, { "epoch": 0.6, "learning_rate": 1.786998512107364e-06, "loss": 1.0286, "step": 32030 }, { "epoch": 0.6, "learning_rate": 1.7868520925856092e-06, "loss": 1.0949, "step": 32031 }, { "epoch": 0.6, "learning_rate": 1.786705675726726e-06, "loss": 0.8139, "step": 32032 }, { "epoch": 0.6, "learning_rate": 1.7865592615312621e-06, "loss": 0.763, "step": 32033 }, { "epoch": 0.6, "learning_rate": 1.7864128499997645e-06, "loss": 1.0729, "step": 32034 }, { "epoch": 0.6, "learning_rate": 1.7862664411327788e-06, "loss": 0.8529, "step": 32035 }, { "epoch": 0.6, "learning_rate": 1.7861200349308532e-06, "loss": 0.7734, "step": 32036 }, { "epoch": 0.6, "learning_rate": 1.7859736313945334e-06, "loss": 1.0294, "step": 32037 }, { "epoch": 0.6, "learning_rate": 1.785827230524365e-06, "loss": 0.9315, "step": 32038 }, { "epoch": 0.6, "learning_rate": 1.7856808323208972e-06, "loss": 0.9935, "step": 32039 }, { "epoch": 0.6, "learning_rate": 1.7855344367846745e-06, "loss": 0.9628, "step": 32040 }, { "epoch": 0.6, "learning_rate": 1.785388043916244e-06, "loss": 0.8045, "step": 32041 }, { "epoch": 0.6, "learning_rate": 1.7852416537161535e-06, "loss": 0.7972, "step": 32042 }, { "epoch": 0.6, "learning_rate": 1.7850952661849488e-06, "loss": 1.1352, "step": 32043 }, { "epoch": 0.6, "learning_rate": 1.7849488813231753e-06, "loss": 1.0863, "step": 32044 }, { "epoch": 0.6, "learning_rate": 1.784802499131382e-06, "loss": 0.9299, "step": 32045 }, { "epoch": 0.6, "learning_rate": 1.7846561196101136e-06, "loss": 0.9592, "step": 32046 }, { "epoch": 0.6, "learning_rate": 1.7845097427599173e-06, "loss": 0.9476, "step": 32047 }, { "epoch": 0.6, "learning_rate": 1.78436336858134e-06, "loss": 0.6652, "step": 32048 }, { "epoch": 0.6, "learning_rate": 1.7842169970749278e-06, "loss": 0.8759, "step": 32049 }, { "epoch": 0.6, "learning_rate": 1.7840706282412267e-06, "loss": 1.2018, "step": 32050 }, { "epoch": 0.6, "learning_rate": 1.783924262080785e-06, "loss": 0.9008, "step": 32051 }, { "epoch": 0.6, "learning_rate": 1.7837778985941483e-06, "loss": 0.966, "step": 32052 }, { "epoch": 0.6, "learning_rate": 1.783631537781862e-06, "loss": 0.7654, "step": 32053 }, { "epoch": 0.6, "learning_rate": 1.7834851796444736e-06, "loss": 0.7928, "step": 32054 }, { "epoch": 0.6, "learning_rate": 1.7833388241825305e-06, "loss": 0.7799, "step": 32055 }, { "epoch": 0.6, "learning_rate": 1.783192471396577e-06, "loss": 1.0691, "step": 32056 }, { "epoch": 0.6, "learning_rate": 1.783046121287162e-06, "loss": 0.9957, "step": 32057 }, { "epoch": 0.6, "learning_rate": 1.7828997738548306e-06, "loss": 0.8845, "step": 32058 }, { "epoch": 0.6, "learning_rate": 1.7827534291001287e-06, "loss": 0.9212, "step": 32059 }, { "epoch": 0.6, "learning_rate": 1.7826070870236046e-06, "loss": 0.8959, "step": 32060 }, { "epoch": 0.6, "learning_rate": 1.7824607476258027e-06, "loss": 0.9174, "step": 32061 }, { "epoch": 0.6, "learning_rate": 1.78231441090727e-06, "loss": 0.8147, "step": 32062 }, { "epoch": 0.6, "learning_rate": 1.7821680768685545e-06, "loss": 0.847, "step": 32063 }, { "epoch": 0.6, "learning_rate": 1.7820217455102012e-06, "loss": 1.0262, "step": 32064 }, { "epoch": 0.6, "learning_rate": 1.7818754168327556e-06, "loss": 0.9209, "step": 32065 }, { "epoch": 0.6, "learning_rate": 1.7817290908367666e-06, "loss": 1.0205, "step": 32066 }, { "epoch": 0.61, "learning_rate": 1.7815827675227784e-06, "loss": 0.9642, "step": 32067 }, { "epoch": 0.61, "learning_rate": 1.7814364468913381e-06, "loss": 1.08, "step": 32068 }, { "epoch": 0.61, "learning_rate": 1.781290128942992e-06, "loss": 1.0027, "step": 32069 }, { "epoch": 0.61, "learning_rate": 1.7811438136782872e-06, "loss": 0.8597, "step": 32070 }, { "epoch": 0.61, "learning_rate": 1.780997501097768e-06, "loss": 0.958, "step": 32071 }, { "epoch": 0.61, "learning_rate": 1.7808511912019837e-06, "loss": 1.0224, "step": 32072 }, { "epoch": 0.61, "learning_rate": 1.7807048839914787e-06, "loss": 0.9417, "step": 32073 }, { "epoch": 0.61, "learning_rate": 1.7805585794667985e-06, "loss": 1.1426, "step": 32074 }, { "epoch": 0.61, "learning_rate": 1.780412277628491e-06, "loss": 0.968, "step": 32075 }, { "epoch": 0.61, "learning_rate": 1.7802659784771025e-06, "loss": 0.734, "step": 32076 }, { "epoch": 0.61, "learning_rate": 1.7801196820131777e-06, "loss": 0.813, "step": 32077 }, { "epoch": 0.61, "learning_rate": 1.7799733882372653e-06, "loss": 0.7957, "step": 32078 }, { "epoch": 0.61, "learning_rate": 1.7798270971499098e-06, "loss": 0.9089, "step": 32079 }, { "epoch": 0.61, "learning_rate": 1.779680808751657e-06, "loss": 0.9371, "step": 32080 }, { "epoch": 0.61, "learning_rate": 1.779534523043055e-06, "loss": 0.9677, "step": 32081 }, { "epoch": 0.61, "learning_rate": 1.7793882400246486e-06, "loss": 1.1414, "step": 32082 }, { "epoch": 0.61, "learning_rate": 1.7792419596969837e-06, "loss": 0.8533, "step": 32083 }, { "epoch": 0.61, "learning_rate": 1.7790956820606084e-06, "loss": 0.8075, "step": 32084 }, { "epoch": 0.61, "learning_rate": 1.7789494071160677e-06, "loss": 0.8129, "step": 32085 }, { "epoch": 0.61, "learning_rate": 1.7788031348639069e-06, "loss": 0.9335, "step": 32086 }, { "epoch": 0.61, "learning_rate": 1.7786568653046737e-06, "loss": 0.9508, "step": 32087 }, { "epoch": 0.61, "learning_rate": 1.7785105984389133e-06, "loss": 1.1509, "step": 32088 }, { "epoch": 0.61, "learning_rate": 1.778364334267173e-06, "loss": 0.8338, "step": 32089 }, { "epoch": 0.61, "learning_rate": 1.7782180727899966e-06, "loss": 0.8685, "step": 32090 }, { "epoch": 0.61, "learning_rate": 1.7780718140079333e-06, "loss": 0.8612, "step": 32091 }, { "epoch": 0.61, "learning_rate": 1.7779255579215276e-06, "loss": 0.8562, "step": 32092 }, { "epoch": 0.61, "learning_rate": 1.7777793045313245e-06, "loss": 1.1049, "step": 32093 }, { "epoch": 0.61, "learning_rate": 1.7776330538378728e-06, "loss": 1.1967, "step": 32094 }, { "epoch": 0.61, "learning_rate": 1.7774868058417161e-06, "loss": 0.9095, "step": 32095 }, { "epoch": 0.61, "learning_rate": 1.7773405605434014e-06, "loss": 0.8239, "step": 32096 }, { "epoch": 0.61, "learning_rate": 1.7771943179434756e-06, "loss": 1.1237, "step": 32097 }, { "epoch": 0.61, "learning_rate": 1.7770480780424842e-06, "loss": 0.9612, "step": 32098 }, { "epoch": 0.61, "learning_rate": 1.7769018408409722e-06, "loss": 0.9092, "step": 32099 }, { "epoch": 0.61, "learning_rate": 1.7767556063394872e-06, "loss": 1.2179, "step": 32100 }, { "epoch": 0.61, "learning_rate": 1.7766093745385742e-06, "loss": 0.8948, "step": 32101 }, { "epoch": 0.61, "learning_rate": 1.7764631454387799e-06, "loss": 0.7908, "step": 32102 }, { "epoch": 0.61, "learning_rate": 1.7763169190406499e-06, "loss": 1.0253, "step": 32103 }, { "epoch": 0.61, "learning_rate": 1.776170695344731e-06, "loss": 0.7902, "step": 32104 }, { "epoch": 0.61, "learning_rate": 1.776024474351567e-06, "loss": 1.1154, "step": 32105 }, { "epoch": 0.61, "learning_rate": 1.775878256061707e-06, "loss": 1.0751, "step": 32106 }, { "epoch": 0.61, "learning_rate": 1.775732040475695e-06, "loss": 1.0842, "step": 32107 }, { "epoch": 0.61, "learning_rate": 1.7755858275940767e-06, "loss": 0.6859, "step": 32108 }, { "epoch": 0.61, "learning_rate": 1.7754396174173988e-06, "loss": 0.8762, "step": 32109 }, { "epoch": 0.61, "learning_rate": 1.775293409946208e-06, "loss": 0.6693, "step": 32110 }, { "epoch": 0.61, "learning_rate": 1.7751472051810482e-06, "loss": 0.8377, "step": 32111 }, { "epoch": 0.61, "learning_rate": 1.7750010031224673e-06, "loss": 1.1124, "step": 32112 }, { "epoch": 0.61, "learning_rate": 1.774854803771011e-06, "loss": 1.0005, "step": 32113 }, { "epoch": 0.61, "learning_rate": 1.7747086071272232e-06, "loss": 0.9249, "step": 32114 }, { "epoch": 0.61, "learning_rate": 1.7745624131916523e-06, "loss": 0.8288, "step": 32115 }, { "epoch": 0.61, "learning_rate": 1.7744162219648427e-06, "loss": 0.9099, "step": 32116 }, { "epoch": 0.61, "learning_rate": 1.77427003344734e-06, "loss": 0.9147, "step": 32117 }, { "epoch": 0.61, "learning_rate": 1.774123847639692e-06, "loss": 1.1036, "step": 32118 }, { "epoch": 0.61, "learning_rate": 1.7739776645424435e-06, "loss": 1.0341, "step": 32119 }, { "epoch": 0.61, "learning_rate": 1.7738314841561386e-06, "loss": 0.8641, "step": 32120 }, { "epoch": 0.61, "learning_rate": 1.773685306481326e-06, "loss": 0.9149, "step": 32121 }, { "epoch": 0.61, "learning_rate": 1.7735391315185493e-06, "loss": 0.8366, "step": 32122 }, { "epoch": 0.61, "learning_rate": 1.7733929592683557e-06, "loss": 0.8244, "step": 32123 }, { "epoch": 0.61, "learning_rate": 1.7732467897312902e-06, "loss": 0.833, "step": 32124 }, { "epoch": 0.61, "learning_rate": 1.7731006229078996e-06, "loss": 1.2547, "step": 32125 }, { "epoch": 0.61, "learning_rate": 1.772954458798728e-06, "loss": 0.9514, "step": 32126 }, { "epoch": 0.61, "learning_rate": 1.7728082974043228e-06, "loss": 0.9219, "step": 32127 }, { "epoch": 0.61, "learning_rate": 1.7726621387252297e-06, "loss": 0.8998, "step": 32128 }, { "epoch": 0.61, "learning_rate": 1.7725159827619922e-06, "loss": 0.8299, "step": 32129 }, { "epoch": 0.61, "learning_rate": 1.7723698295151588e-06, "loss": 0.9756, "step": 32130 }, { "epoch": 0.61, "learning_rate": 1.7722236789852743e-06, "loss": 0.9498, "step": 32131 }, { "epoch": 0.61, "learning_rate": 1.7720775311728833e-06, "loss": 0.9636, "step": 32132 }, { "epoch": 0.61, "learning_rate": 1.7719313860785336e-06, "loss": 1.0184, "step": 32133 }, { "epoch": 0.61, "learning_rate": 1.7717852437027698e-06, "loss": 0.831, "step": 32134 }, { "epoch": 0.61, "learning_rate": 1.7716391040461365e-06, "loss": 1.1204, "step": 32135 }, { "epoch": 0.61, "learning_rate": 1.7714929671091814e-06, "loss": 0.8493, "step": 32136 }, { "epoch": 0.61, "learning_rate": 1.7713468328924489e-06, "loss": 0.9906, "step": 32137 }, { "epoch": 0.61, "learning_rate": 1.7712007013964845e-06, "loss": 1.0175, "step": 32138 }, { "epoch": 0.61, "learning_rate": 1.7710545726218349e-06, "loss": 0.8374, "step": 32139 }, { "epoch": 0.61, "learning_rate": 1.7709084465690456e-06, "loss": 0.7693, "step": 32140 }, { "epoch": 0.61, "learning_rate": 1.7707623232386605e-06, "loss": 0.8652, "step": 32141 }, { "epoch": 0.61, "learning_rate": 1.770616202631228e-06, "loss": 0.9919, "step": 32142 }, { "epoch": 0.61, "learning_rate": 1.7704700847472911e-06, "loss": 1.1683, "step": 32143 }, { "epoch": 0.61, "learning_rate": 1.7703239695873968e-06, "loss": 1.1306, "step": 32144 }, { "epoch": 0.61, "learning_rate": 1.7701778571520905e-06, "loss": 1.0889, "step": 32145 }, { "epoch": 0.61, "learning_rate": 1.7700317474419185e-06, "loss": 1.1165, "step": 32146 }, { "epoch": 0.61, "learning_rate": 1.7698856404574245e-06, "loss": 0.7321, "step": 32147 }, { "epoch": 0.61, "learning_rate": 1.7697395361991557e-06, "loss": 0.7641, "step": 32148 }, { "epoch": 0.61, "learning_rate": 1.7695934346676575e-06, "loss": 0.8807, "step": 32149 }, { "epoch": 0.61, "learning_rate": 1.7694473358634737e-06, "loss": 1.0272, "step": 32150 }, { "epoch": 0.61, "learning_rate": 1.7693012397871518e-06, "loss": 1.0136, "step": 32151 }, { "epoch": 0.61, "learning_rate": 1.769155146439237e-06, "loss": 0.8517, "step": 32152 }, { "epoch": 0.61, "learning_rate": 1.7690090558202737e-06, "loss": 0.8433, "step": 32153 }, { "epoch": 0.61, "learning_rate": 1.7688629679308089e-06, "loss": 0.891, "step": 32154 }, { "epoch": 0.61, "learning_rate": 1.7687168827713878e-06, "loss": 0.8917, "step": 32155 }, { "epoch": 0.61, "learning_rate": 1.768570800342554e-06, "loss": 0.9308, "step": 32156 }, { "epoch": 0.61, "learning_rate": 1.7684247206448557e-06, "loss": 0.7828, "step": 32157 }, { "epoch": 0.61, "learning_rate": 1.7682786436788363e-06, "loss": 0.9784, "step": 32158 }, { "epoch": 0.61, "learning_rate": 1.7681325694450419e-06, "loss": 0.8219, "step": 32159 }, { "epoch": 0.61, "learning_rate": 1.7679864979440187e-06, "loss": 0.899, "step": 32160 }, { "epoch": 0.61, "learning_rate": 1.7678404291763114e-06, "loss": 0.7859, "step": 32161 }, { "epoch": 0.61, "learning_rate": 1.7676943631424648e-06, "loss": 1.0011, "step": 32162 }, { "epoch": 0.61, "learning_rate": 1.767548299843026e-06, "loss": 0.921, "step": 32163 }, { "epoch": 0.61, "learning_rate": 1.7674022392785387e-06, "loss": 0.7075, "step": 32164 }, { "epoch": 0.61, "learning_rate": 1.767256181449549e-06, "loss": 0.8662, "step": 32165 }, { "epoch": 0.61, "learning_rate": 1.7671101263566024e-06, "loss": 0.9413, "step": 32166 }, { "epoch": 0.61, "learning_rate": 1.7669640740002445e-06, "loss": 0.9268, "step": 32167 }, { "epoch": 0.61, "learning_rate": 1.766818024381019e-06, "loss": 0.9612, "step": 32168 }, { "epoch": 0.61, "learning_rate": 1.766671977499474e-06, "loss": 0.9051, "step": 32169 }, { "epoch": 0.61, "learning_rate": 1.7665259333561529e-06, "loss": 0.9678, "step": 32170 }, { "epoch": 0.61, "learning_rate": 1.766379891951601e-06, "loss": 0.9973, "step": 32171 }, { "epoch": 0.61, "learning_rate": 1.7662338532863643e-06, "loss": 0.9532, "step": 32172 }, { "epoch": 0.61, "learning_rate": 1.7660878173609886e-06, "loss": 0.7488, "step": 32173 }, { "epoch": 0.61, "learning_rate": 1.7659417841760171e-06, "loss": 1.0814, "step": 32174 }, { "epoch": 0.61, "learning_rate": 1.7657957537319975e-06, "loss": 0.964, "step": 32175 }, { "epoch": 0.61, "learning_rate": 1.7656497260294743e-06, "loss": 0.8043, "step": 32176 }, { "epoch": 0.61, "learning_rate": 1.7655037010689913e-06, "loss": 0.718, "step": 32177 }, { "epoch": 0.61, "learning_rate": 1.7653576788510962e-06, "loss": 0.8179, "step": 32178 }, { "epoch": 0.61, "learning_rate": 1.7652116593763324e-06, "loss": 0.7858, "step": 32179 }, { "epoch": 0.61, "learning_rate": 1.765065642645245e-06, "loss": 1.0349, "step": 32180 }, { "epoch": 0.61, "learning_rate": 1.7649196286583814e-06, "loss": 1.0136, "step": 32181 }, { "epoch": 0.61, "learning_rate": 1.7647736174162849e-06, "loss": 0.8165, "step": 32182 }, { "epoch": 0.61, "learning_rate": 1.7646276089195008e-06, "loss": 0.952, "step": 32183 }, { "epoch": 0.61, "learning_rate": 1.764481603168575e-06, "loss": 0.9068, "step": 32184 }, { "epoch": 0.61, "learning_rate": 1.7643356001640522e-06, "loss": 0.8473, "step": 32185 }, { "epoch": 0.61, "learning_rate": 1.7641895999064776e-06, "loss": 0.9404, "step": 32186 }, { "epoch": 0.61, "learning_rate": 1.7640436023963963e-06, "loss": 1.05, "step": 32187 }, { "epoch": 0.61, "learning_rate": 1.7638976076343545e-06, "loss": 0.8334, "step": 32188 }, { "epoch": 0.61, "learning_rate": 1.7637516156208954e-06, "loss": 0.9183, "step": 32189 }, { "epoch": 0.61, "learning_rate": 1.763605626356566e-06, "loss": 0.8327, "step": 32190 }, { "epoch": 0.61, "learning_rate": 1.7634596398419107e-06, "loss": 0.8361, "step": 32191 }, { "epoch": 0.61, "learning_rate": 1.7633136560774736e-06, "loss": 0.7519, "step": 32192 }, { "epoch": 0.61, "learning_rate": 1.7631676750638011e-06, "loss": 1.09, "step": 32193 }, { "epoch": 0.61, "learning_rate": 1.7630216968014385e-06, "loss": 1.0554, "step": 32194 }, { "epoch": 0.61, "learning_rate": 1.7628757212909291e-06, "loss": 1.0634, "step": 32195 }, { "epoch": 0.61, "learning_rate": 1.7627297485328204e-06, "loss": 0.779, "step": 32196 }, { "epoch": 0.61, "learning_rate": 1.762583778527656e-06, "loss": 0.7748, "step": 32197 }, { "epoch": 0.61, "learning_rate": 1.7624378112759804e-06, "loss": 0.8183, "step": 32198 }, { "epoch": 0.61, "learning_rate": 1.7622918467783402e-06, "loss": 1.1063, "step": 32199 }, { "epoch": 0.61, "learning_rate": 1.762145885035279e-06, "loss": 1.0772, "step": 32200 }, { "epoch": 0.61, "learning_rate": 1.7619999260473421e-06, "loss": 0.8789, "step": 32201 }, { "epoch": 0.61, "learning_rate": 1.761853969815076e-06, "loss": 0.9102, "step": 32202 }, { "epoch": 0.61, "learning_rate": 1.7617080163390244e-06, "loss": 0.8196, "step": 32203 }, { "epoch": 0.61, "learning_rate": 1.7615620656197316e-06, "loss": 0.7948, "step": 32204 }, { "epoch": 0.61, "learning_rate": 1.7614161176577443e-06, "loss": 1.0796, "step": 32205 }, { "epoch": 0.61, "learning_rate": 1.7612701724536058e-06, "loss": 1.1033, "step": 32206 }, { "epoch": 0.61, "learning_rate": 1.7611242300078623e-06, "loss": 1.045, "step": 32207 }, { "epoch": 0.61, "learning_rate": 1.7609782903210579e-06, "loss": 0.7396, "step": 32208 }, { "epoch": 0.61, "learning_rate": 1.7608323533937385e-06, "loss": 1.1113, "step": 32209 }, { "epoch": 0.61, "learning_rate": 1.7606864192264476e-06, "loss": 0.7987, "step": 32210 }, { "epoch": 0.61, "learning_rate": 1.760540487819732e-06, "loss": 0.9052, "step": 32211 }, { "epoch": 0.61, "learning_rate": 1.7603945591741351e-06, "loss": 1.0026, "step": 32212 }, { "epoch": 0.61, "learning_rate": 1.7602486332902013e-06, "loss": 1.0216, "step": 32213 }, { "epoch": 0.61, "learning_rate": 1.7601027101684774e-06, "loss": 0.8946, "step": 32214 }, { "epoch": 0.61, "learning_rate": 1.7599567898095074e-06, "loss": 0.8972, "step": 32215 }, { "epoch": 0.61, "learning_rate": 1.759810872213835e-06, "loss": 0.8105, "step": 32216 }, { "epoch": 0.61, "learning_rate": 1.7596649573820073e-06, "loss": 0.8087, "step": 32217 }, { "epoch": 0.61, "learning_rate": 1.759519045314568e-06, "loss": 1.0012, "step": 32218 }, { "epoch": 0.61, "learning_rate": 1.759373136012061e-06, "loss": 1.0639, "step": 32219 }, { "epoch": 0.61, "learning_rate": 1.7592272294750328e-06, "loss": 0.8682, "step": 32220 }, { "epoch": 0.61, "learning_rate": 1.7590813257040268e-06, "loss": 0.8902, "step": 32221 }, { "epoch": 0.61, "learning_rate": 1.758935424699588e-06, "loss": 1.0229, "step": 32222 }, { "epoch": 0.61, "learning_rate": 1.7587895264622626e-06, "loss": 0.8172, "step": 32223 }, { "epoch": 0.61, "learning_rate": 1.7586436309925944e-06, "loss": 0.8638, "step": 32224 }, { "epoch": 0.61, "learning_rate": 1.7584977382911272e-06, "loss": 0.9622, "step": 32225 }, { "epoch": 0.61, "learning_rate": 1.7583518483584078e-06, "loss": 0.9789, "step": 32226 }, { "epoch": 0.61, "learning_rate": 1.7582059611949792e-06, "loss": 0.7777, "step": 32227 }, { "epoch": 0.61, "learning_rate": 1.7580600768013867e-06, "loss": 0.817, "step": 32228 }, { "epoch": 0.61, "learning_rate": 1.7579141951781754e-06, "loss": 0.933, "step": 32229 }, { "epoch": 0.61, "learning_rate": 1.7577683163258902e-06, "loss": 0.8029, "step": 32230 }, { "epoch": 0.61, "learning_rate": 1.7576224402450742e-06, "loss": 0.9855, "step": 32231 }, { "epoch": 0.61, "learning_rate": 1.7574765669362742e-06, "loss": 1.1779, "step": 32232 }, { "epoch": 0.61, "learning_rate": 1.7573306964000342e-06, "loss": 0.6013, "step": 32233 }, { "epoch": 0.61, "learning_rate": 1.7571848286368973e-06, "loss": 1.1552, "step": 32234 }, { "epoch": 0.61, "learning_rate": 1.75703896364741e-06, "loss": 0.9034, "step": 32235 }, { "epoch": 0.61, "learning_rate": 1.7568931014321172e-06, "loss": 0.8819, "step": 32236 }, { "epoch": 0.61, "learning_rate": 1.7567472419915615e-06, "loss": 0.8834, "step": 32237 }, { "epoch": 0.61, "learning_rate": 1.7566013853262897e-06, "loss": 0.8126, "step": 32238 }, { "epoch": 0.61, "learning_rate": 1.7564555314368458e-06, "loss": 0.8238, "step": 32239 }, { "epoch": 0.61, "learning_rate": 1.7563096803237735e-06, "loss": 0.8631, "step": 32240 }, { "epoch": 0.61, "learning_rate": 1.7561638319876184e-06, "loss": 0.6955, "step": 32241 }, { "epoch": 0.61, "learning_rate": 1.7560179864289246e-06, "loss": 0.753, "step": 32242 }, { "epoch": 0.61, "learning_rate": 1.7558721436482363e-06, "loss": 1.0423, "step": 32243 }, { "epoch": 0.61, "learning_rate": 1.7557263036460996e-06, "loss": 1.1159, "step": 32244 }, { "epoch": 0.61, "learning_rate": 1.755580466423058e-06, "loss": 1.081, "step": 32245 }, { "epoch": 0.61, "learning_rate": 1.7554346319796551e-06, "loss": 0.8591, "step": 32246 }, { "epoch": 0.61, "learning_rate": 1.7552888003164373e-06, "loss": 1.0107, "step": 32247 }, { "epoch": 0.61, "learning_rate": 1.755142971433948e-06, "loss": 0.688, "step": 32248 }, { "epoch": 0.61, "learning_rate": 1.754997145332732e-06, "loss": 0.9022, "step": 32249 }, { "epoch": 0.61, "learning_rate": 1.7548513220133337e-06, "loss": 1.011, "step": 32250 }, { "epoch": 0.61, "learning_rate": 1.7547055014762981e-06, "loss": 0.9322, "step": 32251 }, { "epoch": 0.61, "learning_rate": 1.7545596837221687e-06, "loss": 0.8608, "step": 32252 }, { "epoch": 0.61, "learning_rate": 1.7544138687514914e-06, "loss": 0.7833, "step": 32253 }, { "epoch": 0.61, "learning_rate": 1.7542680565648099e-06, "loss": 0.7774, "step": 32254 }, { "epoch": 0.61, "learning_rate": 1.7541222471626674e-06, "loss": 0.7931, "step": 32255 }, { "epoch": 0.61, "learning_rate": 1.7539764405456103e-06, "loss": 1.0537, "step": 32256 }, { "epoch": 0.61, "learning_rate": 1.7538306367141828e-06, "loss": 0.88, "step": 32257 }, { "epoch": 0.61, "learning_rate": 1.7536848356689275e-06, "loss": 0.8547, "step": 32258 }, { "epoch": 0.61, "learning_rate": 1.7535390374103918e-06, "loss": 0.9881, "step": 32259 }, { "epoch": 0.61, "learning_rate": 1.7533932419391179e-06, "loss": 0.8116, "step": 32260 }, { "epoch": 0.61, "learning_rate": 1.7532474492556494e-06, "loss": 0.7706, "step": 32261 }, { "epoch": 0.61, "learning_rate": 1.7531016593605338e-06, "loss": 1.04, "step": 32262 }, { "epoch": 0.61, "learning_rate": 1.7529558722543128e-06, "loss": 0.9874, "step": 32263 }, { "epoch": 0.61, "learning_rate": 1.7528100879375315e-06, "loss": 0.9626, "step": 32264 }, { "epoch": 0.61, "learning_rate": 1.7526643064107353e-06, "loss": 0.8452, "step": 32265 }, { "epoch": 0.61, "learning_rate": 1.7525185276744673e-06, "loss": 0.7868, "step": 32266 }, { "epoch": 0.61, "learning_rate": 1.7523727517292715e-06, "loss": 1.0271, "step": 32267 }, { "epoch": 0.61, "learning_rate": 1.752226978575694e-06, "loss": 0.942, "step": 32268 }, { "epoch": 0.61, "learning_rate": 1.7520812082142775e-06, "loss": 0.9722, "step": 32269 }, { "epoch": 0.61, "learning_rate": 1.7519354406455663e-06, "loss": 0.9625, "step": 32270 }, { "epoch": 0.61, "learning_rate": 1.751789675870106e-06, "loss": 0.9946, "step": 32271 }, { "epoch": 0.61, "learning_rate": 1.75164391388844e-06, "loss": 0.7985, "step": 32272 }, { "epoch": 0.61, "learning_rate": 1.751498154701112e-06, "loss": 0.9601, "step": 32273 }, { "epoch": 0.61, "learning_rate": 1.7513523983086681e-06, "loss": 1.2977, "step": 32274 }, { "epoch": 0.61, "learning_rate": 1.751206644711651e-06, "loss": 0.9829, "step": 32275 }, { "epoch": 0.61, "learning_rate": 1.7510608939106044e-06, "loss": 0.8373, "step": 32276 }, { "epoch": 0.61, "learning_rate": 1.7509151459060741e-06, "loss": 0.8094, "step": 32277 }, { "epoch": 0.61, "learning_rate": 1.7507694006986042e-06, "loss": 0.841, "step": 32278 }, { "epoch": 0.61, "learning_rate": 1.7506236582887375e-06, "loss": 0.7189, "step": 32279 }, { "epoch": 0.61, "learning_rate": 1.7504779186770198e-06, "loss": 1.1282, "step": 32280 }, { "epoch": 0.61, "learning_rate": 1.750332181863995e-06, "loss": 1.08, "step": 32281 }, { "epoch": 0.61, "learning_rate": 1.7501864478502054e-06, "loss": 0.8309, "step": 32282 }, { "epoch": 0.61, "learning_rate": 1.7500407166361976e-06, "loss": 0.7971, "step": 32283 }, { "epoch": 0.61, "learning_rate": 1.7498949882225147e-06, "loss": 0.8585, "step": 32284 }, { "epoch": 0.61, "learning_rate": 1.7497492626097002e-06, "loss": 0.7961, "step": 32285 }, { "epoch": 0.61, "learning_rate": 1.7496035397982997e-06, "loss": 0.7964, "step": 32286 }, { "epoch": 0.61, "learning_rate": 1.7494578197888567e-06, "loss": 1.073, "step": 32287 }, { "epoch": 0.61, "learning_rate": 1.7493121025819144e-06, "loss": 0.801, "step": 32288 }, { "epoch": 0.61, "learning_rate": 1.7491663881780185e-06, "loss": 1.0198, "step": 32289 }, { "epoch": 0.61, "learning_rate": 1.7490206765777118e-06, "loss": 0.7903, "step": 32290 }, { "epoch": 0.61, "learning_rate": 1.748874967781539e-06, "loss": 1.0155, "step": 32291 }, { "epoch": 0.61, "learning_rate": 1.748729261790044e-06, "loss": 0.9038, "step": 32292 }, { "epoch": 0.61, "learning_rate": 1.7485835586037714e-06, "loss": 0.9268, "step": 32293 }, { "epoch": 0.61, "learning_rate": 1.7484378582232637e-06, "loss": 0.7949, "step": 32294 }, { "epoch": 0.61, "learning_rate": 1.748292160649067e-06, "loss": 0.8478, "step": 32295 }, { "epoch": 0.61, "learning_rate": 1.7481464658817244e-06, "loss": 0.6975, "step": 32296 }, { "epoch": 0.61, "learning_rate": 1.7480007739217785e-06, "loss": 0.9909, "step": 32297 }, { "epoch": 0.61, "learning_rate": 1.7478550847697756e-06, "loss": 0.957, "step": 32298 }, { "epoch": 0.61, "learning_rate": 1.747709398426259e-06, "loss": 1.0923, "step": 32299 }, { "epoch": 0.61, "learning_rate": 1.7475637148917714e-06, "loss": 1.1144, "step": 32300 }, { "epoch": 0.61, "learning_rate": 1.747418034166859e-06, "loss": 0.8717, "step": 32301 }, { "epoch": 0.61, "learning_rate": 1.7472723562520644e-06, "loss": 0.9495, "step": 32302 }, { "epoch": 0.61, "learning_rate": 1.747126681147931e-06, "loss": 0.9466, "step": 32303 }, { "epoch": 0.61, "learning_rate": 1.7469810088550043e-06, "loss": 0.8502, "step": 32304 }, { "epoch": 0.61, "learning_rate": 1.746835339373827e-06, "loss": 0.6773, "step": 32305 }, { "epoch": 0.61, "learning_rate": 1.746689672704943e-06, "loss": 0.9464, "step": 32306 }, { "epoch": 0.61, "learning_rate": 1.7465440088488974e-06, "loss": 1.0584, "step": 32307 }, { "epoch": 0.61, "learning_rate": 1.7463983478062334e-06, "loss": 0.7817, "step": 32308 }, { "epoch": 0.61, "learning_rate": 1.7462526895774945e-06, "loss": 0.9071, "step": 32309 }, { "epoch": 0.61, "learning_rate": 1.7461070341632252e-06, "loss": 0.7076, "step": 32310 }, { "epoch": 0.61, "learning_rate": 1.745961381563969e-06, "loss": 0.8229, "step": 32311 }, { "epoch": 0.61, "learning_rate": 1.7458157317802699e-06, "loss": 0.9213, "step": 32312 }, { "epoch": 0.61, "learning_rate": 1.7456700848126715e-06, "loss": 1.1068, "step": 32313 }, { "epoch": 0.61, "learning_rate": 1.7455244406617184e-06, "loss": 1.1699, "step": 32314 }, { "epoch": 0.61, "learning_rate": 1.745378799327953e-06, "loss": 0.7761, "step": 32315 }, { "epoch": 0.61, "learning_rate": 1.7452331608119211e-06, "loss": 0.9274, "step": 32316 }, { "epoch": 0.61, "learning_rate": 1.7450875251141652e-06, "loss": 0.7042, "step": 32317 }, { "epoch": 0.61, "learning_rate": 1.7449418922352284e-06, "loss": 0.9232, "step": 32318 }, { "epoch": 0.61, "learning_rate": 1.7447962621756562e-06, "loss": 0.8773, "step": 32319 }, { "epoch": 0.61, "learning_rate": 1.744650634935992e-06, "loss": 0.8039, "step": 32320 }, { "epoch": 0.61, "learning_rate": 1.744505010516778e-06, "loss": 0.9054, "step": 32321 }, { "epoch": 0.61, "learning_rate": 1.74435938891856e-06, "loss": 0.8221, "step": 32322 }, { "epoch": 0.61, "learning_rate": 1.7442137701418813e-06, "loss": 0.8674, "step": 32323 }, { "epoch": 0.61, "learning_rate": 1.7440681541872845e-06, "loss": 0.9524, "step": 32324 }, { "epoch": 0.61, "learning_rate": 1.743922541055314e-06, "loss": 1.2389, "step": 32325 }, { "epoch": 0.61, "learning_rate": 1.7437769307465135e-06, "loss": 0.908, "step": 32326 }, { "epoch": 0.61, "learning_rate": 1.7436313232614273e-06, "loss": 0.8305, "step": 32327 }, { "epoch": 0.61, "learning_rate": 1.7434857186005976e-06, "loss": 0.9911, "step": 32328 }, { "epoch": 0.61, "learning_rate": 1.74334011676457e-06, "loss": 0.9369, "step": 32329 }, { "epoch": 0.61, "learning_rate": 1.7431945177538873e-06, "loss": 1.1546, "step": 32330 }, { "epoch": 0.61, "learning_rate": 1.7430489215690922e-06, "loss": 1.1996, "step": 32331 }, { "epoch": 0.61, "learning_rate": 1.7429033282107294e-06, "loss": 0.8085, "step": 32332 }, { "epoch": 0.61, "learning_rate": 1.7427577376793428e-06, "loss": 0.6645, "step": 32333 }, { "epoch": 0.61, "learning_rate": 1.7426121499754747e-06, "loss": 1.0587, "step": 32334 }, { "epoch": 0.61, "learning_rate": 1.7424665650996708e-06, "loss": 0.8464, "step": 32335 }, { "epoch": 0.61, "learning_rate": 1.7423209830524735e-06, "loss": 0.8889, "step": 32336 }, { "epoch": 0.61, "learning_rate": 1.7421754038344251e-06, "loss": 0.8041, "step": 32337 }, { "epoch": 0.61, "learning_rate": 1.7420298274460718e-06, "loss": 1.0344, "step": 32338 }, { "epoch": 0.61, "learning_rate": 1.7418842538879552e-06, "loss": 0.8331, "step": 32339 }, { "epoch": 0.61, "learning_rate": 1.7417386831606189e-06, "loss": 0.9026, "step": 32340 }, { "epoch": 0.61, "learning_rate": 1.7415931152646085e-06, "loss": 0.9457, "step": 32341 }, { "epoch": 0.61, "learning_rate": 1.741447550200466e-06, "loss": 0.9036, "step": 32342 }, { "epoch": 0.61, "learning_rate": 1.741301987968734e-06, "loss": 1.0448, "step": 32343 }, { "epoch": 0.61, "learning_rate": 1.7411564285699584e-06, "loss": 0.9131, "step": 32344 }, { "epoch": 0.61, "learning_rate": 1.7410108720046807e-06, "loss": 0.9958, "step": 32345 }, { "epoch": 0.61, "learning_rate": 1.740865318273445e-06, "loss": 0.795, "step": 32346 }, { "epoch": 0.61, "learning_rate": 1.7407197673767951e-06, "loss": 1.0521, "step": 32347 }, { "epoch": 0.61, "learning_rate": 1.7405742193152746e-06, "loss": 0.8852, "step": 32348 }, { "epoch": 0.61, "learning_rate": 1.740428674089426e-06, "loss": 0.7463, "step": 32349 }, { "epoch": 0.61, "learning_rate": 1.7402831316997945e-06, "loss": 1.1585, "step": 32350 }, { "epoch": 0.61, "learning_rate": 1.7401375921469222e-06, "loss": 1.0252, "step": 32351 }, { "epoch": 0.61, "learning_rate": 1.7399920554313521e-06, "loss": 1.0168, "step": 32352 }, { "epoch": 0.61, "learning_rate": 1.7398465215536287e-06, "loss": 0.9941, "step": 32353 }, { "epoch": 0.61, "learning_rate": 1.7397009905142956e-06, "loss": 0.9688, "step": 32354 }, { "epoch": 0.61, "learning_rate": 1.7395554623138944e-06, "loss": 1.0725, "step": 32355 }, { "epoch": 0.61, "learning_rate": 1.7394099369529712e-06, "loss": 1.1587, "step": 32356 }, { "epoch": 0.61, "learning_rate": 1.739264414432068e-06, "loss": 0.8301, "step": 32357 }, { "epoch": 0.61, "learning_rate": 1.7391188947517268e-06, "loss": 0.9499, "step": 32358 }, { "epoch": 0.61, "learning_rate": 1.7389733779124934e-06, "loss": 1.0561, "step": 32359 }, { "epoch": 0.61, "learning_rate": 1.7388278639149097e-06, "loss": 0.8046, "step": 32360 }, { "epoch": 0.61, "learning_rate": 1.7386823527595193e-06, "loss": 0.89, "step": 32361 }, { "epoch": 0.61, "learning_rate": 1.738536844446866e-06, "loss": 1.1544, "step": 32362 }, { "epoch": 0.61, "learning_rate": 1.738391338977493e-06, "loss": 0.9809, "step": 32363 }, { "epoch": 0.61, "learning_rate": 1.7382458363519426e-06, "loss": 0.9355, "step": 32364 }, { "epoch": 0.61, "learning_rate": 1.7381003365707597e-06, "loss": 0.9738, "step": 32365 }, { "epoch": 0.61, "learning_rate": 1.7379548396344864e-06, "loss": 0.822, "step": 32366 }, { "epoch": 0.61, "learning_rate": 1.7378093455436662e-06, "loss": 0.9504, "step": 32367 }, { "epoch": 0.61, "learning_rate": 1.7376638542988424e-06, "loss": 0.9648, "step": 32368 }, { "epoch": 0.61, "learning_rate": 1.737518365900559e-06, "loss": 1.0682, "step": 32369 }, { "epoch": 0.61, "learning_rate": 1.7373728803493579e-06, "loss": 1.0073, "step": 32370 }, { "epoch": 0.61, "learning_rate": 1.7372273976457837e-06, "loss": 0.9615, "step": 32371 }, { "epoch": 0.61, "learning_rate": 1.7370819177903794e-06, "loss": 0.7964, "step": 32372 }, { "epoch": 0.61, "learning_rate": 1.7369364407836866e-06, "loss": 0.9278, "step": 32373 }, { "epoch": 0.61, "learning_rate": 1.7367909666262505e-06, "loss": 0.8507, "step": 32374 }, { "epoch": 0.61, "learning_rate": 1.7366454953186138e-06, "loss": 1.0735, "step": 32375 }, { "epoch": 0.61, "learning_rate": 1.7365000268613183e-06, "loss": 1.0657, "step": 32376 }, { "epoch": 0.61, "learning_rate": 1.7363545612549093e-06, "loss": 0.6404, "step": 32377 }, { "epoch": 0.61, "learning_rate": 1.7362090984999292e-06, "loss": 0.9682, "step": 32378 }, { "epoch": 0.61, "learning_rate": 1.7360636385969198e-06, "loss": 0.9348, "step": 32379 }, { "epoch": 0.61, "learning_rate": 1.7359181815464266e-06, "loss": 0.8854, "step": 32380 }, { "epoch": 0.61, "learning_rate": 1.7357727273489905e-06, "loss": 1.1436, "step": 32381 }, { "epoch": 0.61, "learning_rate": 1.735627276005155e-06, "loss": 0.9098, "step": 32382 }, { "epoch": 0.61, "learning_rate": 1.7354818275154655e-06, "loss": 0.7164, "step": 32383 }, { "epoch": 0.61, "learning_rate": 1.735336381880463e-06, "loss": 0.7214, "step": 32384 }, { "epoch": 0.61, "learning_rate": 1.73519093910069e-06, "loss": 0.9338, "step": 32385 }, { "epoch": 0.61, "learning_rate": 1.7350454991766918e-06, "loss": 1.171, "step": 32386 }, { "epoch": 0.61, "learning_rate": 1.7349000621090095e-06, "loss": 0.9152, "step": 32387 }, { "epoch": 0.61, "learning_rate": 1.734754627898187e-06, "loss": 0.9505, "step": 32388 }, { "epoch": 0.61, "learning_rate": 1.7346091965447673e-06, "loss": 0.9352, "step": 32389 }, { "epoch": 0.61, "learning_rate": 1.7344637680492937e-06, "loss": 0.8304, "step": 32390 }, { "epoch": 0.61, "learning_rate": 1.7343183424123084e-06, "loss": 0.8523, "step": 32391 }, { "epoch": 0.61, "learning_rate": 1.7341729196343554e-06, "loss": 0.8964, "step": 32392 }, { "epoch": 0.61, "learning_rate": 1.7340274997159772e-06, "loss": 0.8605, "step": 32393 }, { "epoch": 0.61, "learning_rate": 1.7338820826577163e-06, "loss": 1.0305, "step": 32394 }, { "epoch": 0.61, "learning_rate": 1.7337366684601164e-06, "loss": 0.878, "step": 32395 }, { "epoch": 0.61, "learning_rate": 1.733591257123721e-06, "loss": 0.8476, "step": 32396 }, { "epoch": 0.61, "learning_rate": 1.7334458486490713e-06, "loss": 0.8147, "step": 32397 }, { "epoch": 0.61, "learning_rate": 1.7333004430367123e-06, "loss": 0.9499, "step": 32398 }, { "epoch": 0.61, "learning_rate": 1.7331550402871854e-06, "loss": 0.9054, "step": 32399 }, { "epoch": 0.61, "learning_rate": 1.7330096404010339e-06, "loss": 0.9092, "step": 32400 }, { "epoch": 0.61, "learning_rate": 1.7328642433788011e-06, "loss": 0.9955, "step": 32401 }, { "epoch": 0.61, "learning_rate": 1.73271884922103e-06, "loss": 0.8851, "step": 32402 }, { "epoch": 0.61, "learning_rate": 1.7325734579282622e-06, "loss": 0.9471, "step": 32403 }, { "epoch": 0.61, "learning_rate": 1.7324280695010426e-06, "loss": 0.9229, "step": 32404 }, { "epoch": 0.61, "learning_rate": 1.7322826839399132e-06, "loss": 0.9612, "step": 32405 }, { "epoch": 0.61, "learning_rate": 1.7321373012454157e-06, "loss": 1.0491, "step": 32406 }, { "epoch": 0.61, "learning_rate": 1.7319919214180947e-06, "loss": 1.045, "step": 32407 }, { "epoch": 0.61, "learning_rate": 1.7318465444584923e-06, "loss": 0.9219, "step": 32408 }, { "epoch": 0.61, "learning_rate": 1.731701170367151e-06, "loss": 0.8395, "step": 32409 }, { "epoch": 0.61, "learning_rate": 1.731555799144614e-06, "loss": 0.8759, "step": 32410 }, { "epoch": 0.61, "learning_rate": 1.7314104307914248e-06, "loss": 0.9623, "step": 32411 }, { "epoch": 0.61, "learning_rate": 1.7312650653081242e-06, "loss": 1.1412, "step": 32412 }, { "epoch": 0.61, "learning_rate": 1.7311197026952575e-06, "loss": 1.1224, "step": 32413 }, { "epoch": 0.61, "learning_rate": 1.730974342953366e-06, "loss": 0.7903, "step": 32414 }, { "epoch": 0.61, "learning_rate": 1.7308289860829918e-06, "loss": 0.7011, "step": 32415 }, { "epoch": 0.61, "learning_rate": 1.7306836320846793e-06, "loss": 0.7187, "step": 32416 }, { "epoch": 0.61, "learning_rate": 1.730538280958971e-06, "loss": 0.975, "step": 32417 }, { "epoch": 0.61, "learning_rate": 1.7303929327064079e-06, "loss": 0.9134, "step": 32418 }, { "epoch": 0.61, "learning_rate": 1.7302475873275355e-06, "loss": 1.0018, "step": 32419 }, { "epoch": 0.61, "learning_rate": 1.7301022448228943e-06, "loss": 0.913, "step": 32420 }, { "epoch": 0.61, "learning_rate": 1.729956905193027e-06, "loss": 1.0308, "step": 32421 }, { "epoch": 0.61, "learning_rate": 1.7298115684384784e-06, "loss": 0.8087, "step": 32422 }, { "epoch": 0.61, "learning_rate": 1.7296662345597889e-06, "loss": 0.8601, "step": 32423 }, { "epoch": 0.61, "learning_rate": 1.7295209035575017e-06, "loss": 1.1149, "step": 32424 }, { "epoch": 0.61, "learning_rate": 1.7293755754321606e-06, "loss": 0.8201, "step": 32425 }, { "epoch": 0.61, "learning_rate": 1.7292302501843077e-06, "loss": 0.9211, "step": 32426 }, { "epoch": 0.61, "learning_rate": 1.7290849278144844e-06, "loss": 1.0297, "step": 32427 }, { "epoch": 0.61, "learning_rate": 1.7289396083232352e-06, "loss": 0.9192, "step": 32428 }, { "epoch": 0.61, "learning_rate": 1.7287942917111017e-06, "loss": 0.9788, "step": 32429 }, { "epoch": 0.61, "learning_rate": 1.7286489779786265e-06, "loss": 1.0025, "step": 32430 }, { "epoch": 0.61, "learning_rate": 1.7285036671263522e-06, "loss": 1.0121, "step": 32431 }, { "epoch": 0.61, "learning_rate": 1.728358359154822e-06, "loss": 0.9511, "step": 32432 }, { "epoch": 0.61, "learning_rate": 1.728213054064577e-06, "loss": 0.8494, "step": 32433 }, { "epoch": 0.61, "learning_rate": 1.7280677518561623e-06, "loss": 0.7914, "step": 32434 }, { "epoch": 0.61, "learning_rate": 1.7279224525301187e-06, "loss": 0.9219, "step": 32435 }, { "epoch": 0.61, "learning_rate": 1.7277771560869877e-06, "loss": 0.9612, "step": 32436 }, { "epoch": 0.61, "learning_rate": 1.7276318625273135e-06, "loss": 1.1013, "step": 32437 }, { "epoch": 0.61, "learning_rate": 1.7274865718516392e-06, "loss": 1.1571, "step": 32438 }, { "epoch": 0.61, "learning_rate": 1.7273412840605053e-06, "loss": 0.8382, "step": 32439 }, { "epoch": 0.61, "learning_rate": 1.7271959991544562e-06, "loss": 0.9123, "step": 32440 }, { "epoch": 0.61, "learning_rate": 1.7270507171340339e-06, "loss": 0.6708, "step": 32441 }, { "epoch": 0.61, "learning_rate": 1.726905437999779e-06, "loss": 0.9054, "step": 32442 }, { "epoch": 0.61, "learning_rate": 1.7267601617522368e-06, "loss": 1.2377, "step": 32443 }, { "epoch": 0.61, "learning_rate": 1.726614888391948e-06, "loss": 0.8528, "step": 32444 }, { "epoch": 0.61, "learning_rate": 1.7264696179194546e-06, "loss": 0.7027, "step": 32445 }, { "epoch": 0.61, "learning_rate": 1.7263243503353013e-06, "loss": 0.7747, "step": 32446 }, { "epoch": 0.61, "learning_rate": 1.726179085640029e-06, "loss": 1.0103, "step": 32447 }, { "epoch": 0.61, "learning_rate": 1.7260338238341795e-06, "loss": 1.0354, "step": 32448 }, { "epoch": 0.61, "learning_rate": 1.7258885649182967e-06, "loss": 0.8977, "step": 32449 }, { "epoch": 0.61, "learning_rate": 1.725743308892922e-06, "loss": 1.1585, "step": 32450 }, { "epoch": 0.61, "learning_rate": 1.7255980557585977e-06, "loss": 0.8446, "step": 32451 }, { "epoch": 0.61, "learning_rate": 1.725452805515867e-06, "loss": 0.8502, "step": 32452 }, { "epoch": 0.61, "learning_rate": 1.7253075581652717e-06, "loss": 0.888, "step": 32453 }, { "epoch": 0.61, "learning_rate": 1.7251623137073536e-06, "loss": 0.7274, "step": 32454 }, { "epoch": 0.61, "learning_rate": 1.7250170721426568e-06, "loss": 0.6928, "step": 32455 }, { "epoch": 0.61, "learning_rate": 1.7248718334717222e-06, "loss": 0.9014, "step": 32456 }, { "epoch": 0.61, "learning_rate": 1.7247265976950913e-06, "loss": 1.1613, "step": 32457 }, { "epoch": 0.61, "learning_rate": 1.7245813648133083e-06, "loss": 0.9409, "step": 32458 }, { "epoch": 0.61, "learning_rate": 1.724436134826915e-06, "loss": 0.984, "step": 32459 }, { "epoch": 0.61, "learning_rate": 1.724290907736453e-06, "loss": 0.5921, "step": 32460 }, { "epoch": 0.61, "learning_rate": 1.7241456835424653e-06, "loss": 0.859, "step": 32461 }, { "epoch": 0.61, "learning_rate": 1.7240004622454936e-06, "loss": 1.063, "step": 32462 }, { "epoch": 0.61, "learning_rate": 1.72385524384608e-06, "loss": 0.8963, "step": 32463 }, { "epoch": 0.61, "learning_rate": 1.7237100283447677e-06, "loss": 0.711, "step": 32464 }, { "epoch": 0.61, "learning_rate": 1.7235648157420981e-06, "loss": 0.8694, "step": 32465 }, { "epoch": 0.61, "learning_rate": 1.7234196060386133e-06, "loss": 0.5928, "step": 32466 }, { "epoch": 0.61, "learning_rate": 1.7232743992348567e-06, "loss": 0.7425, "step": 32467 }, { "epoch": 0.61, "learning_rate": 1.7231291953313697e-06, "loss": 1.0707, "step": 32468 }, { "epoch": 0.61, "learning_rate": 1.7229839943286935e-06, "loss": 1.2697, "step": 32469 }, { "epoch": 0.61, "learning_rate": 1.7228387962273722e-06, "loss": 0.9763, "step": 32470 }, { "epoch": 0.61, "learning_rate": 1.7226936010279466e-06, "loss": 0.9118, "step": 32471 }, { "epoch": 0.61, "learning_rate": 1.722548408730959e-06, "loss": 0.8575, "step": 32472 }, { "epoch": 0.61, "learning_rate": 1.722403219336952e-06, "loss": 0.716, "step": 32473 }, { "epoch": 0.61, "learning_rate": 1.722258032846468e-06, "loss": 1.0578, "step": 32474 }, { "epoch": 0.61, "learning_rate": 1.7221128492600475e-06, "loss": 1.0616, "step": 32475 }, { "epoch": 0.61, "learning_rate": 1.721967668578235e-06, "loss": 1.0569, "step": 32476 }, { "epoch": 0.61, "learning_rate": 1.7218224908015712e-06, "loss": 0.8185, "step": 32477 }, { "epoch": 0.61, "learning_rate": 1.7216773159305978e-06, "loss": 0.9268, "step": 32478 }, { "epoch": 0.61, "learning_rate": 1.7215321439658572e-06, "loss": 0.8137, "step": 32479 }, { "epoch": 0.61, "learning_rate": 1.7213869749078926e-06, "loss": 0.994, "step": 32480 }, { "epoch": 0.61, "learning_rate": 1.7212418087572445e-06, "loss": 1.0461, "step": 32481 }, { "epoch": 0.61, "learning_rate": 1.7210966455144562e-06, "loss": 1.2542, "step": 32482 }, { "epoch": 0.61, "learning_rate": 1.720951485180069e-06, "loss": 0.7411, "step": 32483 }, { "epoch": 0.61, "learning_rate": 1.7208063277546245e-06, "loss": 0.9008, "step": 32484 }, { "epoch": 0.61, "learning_rate": 1.7206611732386661e-06, "loss": 0.8452, "step": 32485 }, { "epoch": 0.61, "learning_rate": 1.7205160216327343e-06, "loss": 1.0231, "step": 32486 }, { "epoch": 0.61, "learning_rate": 1.7203708729373714e-06, "loss": 0.9511, "step": 32487 }, { "epoch": 0.61, "learning_rate": 1.7202257271531208e-06, "loss": 0.9473, "step": 32488 }, { "epoch": 0.61, "learning_rate": 1.7200805842805235e-06, "loss": 0.8247, "step": 32489 }, { "epoch": 0.61, "learning_rate": 1.7199354443201205e-06, "loss": 0.966, "step": 32490 }, { "epoch": 0.61, "learning_rate": 1.7197903072724553e-06, "loss": 0.7907, "step": 32491 }, { "epoch": 0.61, "learning_rate": 1.7196451731380686e-06, "loss": 0.8634, "step": 32492 }, { "epoch": 0.61, "learning_rate": 1.7195000419175034e-06, "loss": 0.9417, "step": 32493 }, { "epoch": 0.61, "learning_rate": 1.7193549136113007e-06, "loss": 1.0621, "step": 32494 }, { "epoch": 0.61, "learning_rate": 1.7192097882200034e-06, "loss": 0.9985, "step": 32495 }, { "epoch": 0.61, "learning_rate": 1.7190646657441517e-06, "loss": 0.9727, "step": 32496 }, { "epoch": 0.61, "learning_rate": 1.71891954618429e-06, "loss": 0.8906, "step": 32497 }, { "epoch": 0.61, "learning_rate": 1.7187744295409587e-06, "loss": 0.8486, "step": 32498 }, { "epoch": 0.61, "learning_rate": 1.7186293158146982e-06, "loss": 0.9984, "step": 32499 }, { "epoch": 0.61, "learning_rate": 1.718484205006053e-06, "loss": 1.0928, "step": 32500 }, { "epoch": 0.61, "learning_rate": 1.7183390971155639e-06, "loss": 0.8181, "step": 32501 }, { "epoch": 0.61, "learning_rate": 1.7181939921437717e-06, "loss": 0.9702, "step": 32502 }, { "epoch": 0.61, "learning_rate": 1.7180488900912202e-06, "loss": 0.9506, "step": 32503 }, { "epoch": 0.61, "learning_rate": 1.71790379095845e-06, "loss": 0.7539, "step": 32504 }, { "epoch": 0.61, "learning_rate": 1.7177586947460022e-06, "loss": 0.8494, "step": 32505 }, { "epoch": 0.61, "learning_rate": 1.7176136014544204e-06, "loss": 0.9461, "step": 32506 }, { "epoch": 0.61, "learning_rate": 1.7174685110842454e-06, "loss": 0.9136, "step": 32507 }, { "epoch": 0.61, "learning_rate": 1.7173234236360182e-06, "loss": 0.9279, "step": 32508 }, { "epoch": 0.61, "learning_rate": 1.7171783391102824e-06, "loss": 0.897, "step": 32509 }, { "epoch": 0.61, "learning_rate": 1.7170332575075782e-06, "loss": 0.7265, "step": 32510 }, { "epoch": 0.61, "learning_rate": 1.7168881788284475e-06, "loss": 0.8514, "step": 32511 }, { "epoch": 0.61, "learning_rate": 1.7167431030734327e-06, "loss": 0.9619, "step": 32512 }, { "epoch": 0.61, "learning_rate": 1.7165980302430752e-06, "loss": 0.7541, "step": 32513 }, { "epoch": 0.61, "learning_rate": 1.7164529603379158e-06, "loss": 0.8109, "step": 32514 }, { "epoch": 0.61, "learning_rate": 1.7163078933584981e-06, "loss": 0.8859, "step": 32515 }, { "epoch": 0.61, "learning_rate": 1.7161628293053625e-06, "loss": 0.9043, "step": 32516 }, { "epoch": 0.61, "learning_rate": 1.71601776817905e-06, "loss": 0.7011, "step": 32517 }, { "epoch": 0.61, "learning_rate": 1.7158727099801043e-06, "loss": 1.2163, "step": 32518 }, { "epoch": 0.61, "learning_rate": 1.7157276547090651e-06, "loss": 1.0959, "step": 32519 }, { "epoch": 0.61, "learning_rate": 1.715582602366475e-06, "loss": 0.8551, "step": 32520 }, { "epoch": 0.61, "learning_rate": 1.7154375529528754e-06, "loss": 0.9368, "step": 32521 }, { "epoch": 0.61, "learning_rate": 1.7152925064688084e-06, "loss": 0.8641, "step": 32522 }, { "epoch": 0.61, "learning_rate": 1.7151474629148141e-06, "loss": 0.8318, "step": 32523 }, { "epoch": 0.61, "learning_rate": 1.7150024222914359e-06, "loss": 1.2184, "step": 32524 }, { "epoch": 0.61, "learning_rate": 1.7148573845992147e-06, "loss": 0.853, "step": 32525 }, { "epoch": 0.61, "learning_rate": 1.714712349838691e-06, "loss": 0.8326, "step": 32526 }, { "epoch": 0.61, "learning_rate": 1.7145673180104078e-06, "loss": 0.7064, "step": 32527 }, { "epoch": 0.61, "learning_rate": 1.7144222891149067e-06, "loss": 0.8415, "step": 32528 }, { "epoch": 0.61, "learning_rate": 1.7142772631527277e-06, "loss": 0.9929, "step": 32529 }, { "epoch": 0.61, "learning_rate": 1.7141322401244142e-06, "loss": 0.7818, "step": 32530 }, { "epoch": 0.61, "learning_rate": 1.7139872200305068e-06, "loss": 1.1932, "step": 32531 }, { "epoch": 0.61, "learning_rate": 1.7138422028715463e-06, "loss": 1.0188, "step": 32532 }, { "epoch": 0.61, "learning_rate": 1.7136971886480757e-06, "loss": 0.9638, "step": 32533 }, { "epoch": 0.61, "learning_rate": 1.7135521773606351e-06, "loss": 0.8892, "step": 32534 }, { "epoch": 0.61, "learning_rate": 1.7134071690097665e-06, "loss": 0.8893, "step": 32535 }, { "epoch": 0.61, "learning_rate": 1.7132621635960118e-06, "loss": 0.9482, "step": 32536 }, { "epoch": 0.61, "learning_rate": 1.7131171611199124e-06, "loss": 1.0522, "step": 32537 }, { "epoch": 0.61, "learning_rate": 1.7129721615820083e-06, "loss": 1.0166, "step": 32538 }, { "epoch": 0.61, "learning_rate": 1.7128271649828432e-06, "loss": 1.0225, "step": 32539 }, { "epoch": 0.61, "learning_rate": 1.7126821713229567e-06, "loss": 0.8065, "step": 32540 }, { "epoch": 0.61, "learning_rate": 1.7125371806028906e-06, "loss": 0.7692, "step": 32541 }, { "epoch": 0.61, "learning_rate": 1.7123921928231868e-06, "loss": 0.8302, "step": 32542 }, { "epoch": 0.61, "learning_rate": 1.7122472079843869e-06, "loss": 1.0597, "step": 32543 }, { "epoch": 0.61, "learning_rate": 1.7121022260870306e-06, "loss": 1.0737, "step": 32544 }, { "epoch": 0.61, "learning_rate": 1.7119572471316614e-06, "loss": 0.8083, "step": 32545 }, { "epoch": 0.61, "learning_rate": 1.71181227111882e-06, "loss": 0.972, "step": 32546 }, { "epoch": 0.61, "learning_rate": 1.7116672980490462e-06, "loss": 0.8111, "step": 32547 }, { "epoch": 0.61, "learning_rate": 1.711522327922883e-06, "loss": 0.8271, "step": 32548 }, { "epoch": 0.61, "learning_rate": 1.7113773607408718e-06, "loss": 1.0439, "step": 32549 }, { "epoch": 0.61, "learning_rate": 1.7112323965035526e-06, "loss": 0.9207, "step": 32550 }, { "epoch": 0.61, "learning_rate": 1.7110874352114682e-06, "loss": 1.0303, "step": 32551 }, { "epoch": 0.61, "learning_rate": 1.7109424768651592e-06, "loss": 0.8778, "step": 32552 }, { "epoch": 0.61, "learning_rate": 1.7107975214651657e-06, "loss": 0.9438, "step": 32553 }, { "epoch": 0.61, "learning_rate": 1.7106525690120312e-06, "loss": 0.7953, "step": 32554 }, { "epoch": 0.61, "learning_rate": 1.7105076195062953e-06, "loss": 0.8502, "step": 32555 }, { "epoch": 0.61, "learning_rate": 1.7103626729485002e-06, "loss": 1.0319, "step": 32556 }, { "epoch": 0.61, "learning_rate": 1.7102177293391852e-06, "loss": 0.9794, "step": 32557 }, { "epoch": 0.61, "learning_rate": 1.710072788678895e-06, "loss": 0.8339, "step": 32558 }, { "epoch": 0.61, "learning_rate": 1.7099278509681677e-06, "loss": 0.8032, "step": 32559 }, { "epoch": 0.61, "learning_rate": 1.7097829162075453e-06, "loss": 0.8802, "step": 32560 }, { "epoch": 0.61, "learning_rate": 1.7096379843975694e-06, "loss": 0.8537, "step": 32561 }, { "epoch": 0.61, "learning_rate": 1.7094930555387818e-06, "loss": 1.1829, "step": 32562 }, { "epoch": 0.61, "learning_rate": 1.7093481296317215e-06, "loss": 1.196, "step": 32563 }, { "epoch": 0.61, "learning_rate": 1.7092032066769327e-06, "loss": 0.8778, "step": 32564 }, { "epoch": 0.61, "learning_rate": 1.7090582866749543e-06, "loss": 1.0049, "step": 32565 }, { "epoch": 0.61, "learning_rate": 1.7089133696263272e-06, "loss": 0.9173, "step": 32566 }, { "epoch": 0.61, "learning_rate": 1.7087684555315941e-06, "loss": 1.0123, "step": 32567 }, { "epoch": 0.61, "learning_rate": 1.7086235443912952e-06, "loss": 1.0052, "step": 32568 }, { "epoch": 0.61, "learning_rate": 1.7084786362059711e-06, "loss": 1.2078, "step": 32569 }, { "epoch": 0.61, "learning_rate": 1.7083337309761644e-06, "loss": 1.067, "step": 32570 }, { "epoch": 0.61, "learning_rate": 1.7081888287024156e-06, "loss": 0.8248, "step": 32571 }, { "epoch": 0.61, "learning_rate": 1.708043929385264e-06, "loss": 0.7059, "step": 32572 }, { "epoch": 0.61, "learning_rate": 1.7078990330252532e-06, "loss": 0.8833, "step": 32573 }, { "epoch": 0.61, "learning_rate": 1.7077541396229228e-06, "loss": 0.8521, "step": 32574 }, { "epoch": 0.61, "learning_rate": 1.7076092491788141e-06, "loss": 1.046, "step": 32575 }, { "epoch": 0.61, "learning_rate": 1.707464361693468e-06, "loss": 0.9738, "step": 32576 }, { "epoch": 0.61, "learning_rate": 1.7073194771674262e-06, "loss": 1.0204, "step": 32577 }, { "epoch": 0.61, "learning_rate": 1.7071745956012284e-06, "loss": 0.9696, "step": 32578 }, { "epoch": 0.61, "learning_rate": 1.707029716995417e-06, "loss": 0.7819, "step": 32579 }, { "epoch": 0.61, "learning_rate": 1.7068848413505328e-06, "loss": 0.7988, "step": 32580 }, { "epoch": 0.61, "learning_rate": 1.706739968667115e-06, "loss": 1.1497, "step": 32581 }, { "epoch": 0.61, "learning_rate": 1.7065950989457065e-06, "loss": 1.1171, "step": 32582 }, { "epoch": 0.61, "learning_rate": 1.7064502321868476e-06, "loss": 0.8696, "step": 32583 }, { "epoch": 0.61, "learning_rate": 1.7063053683910786e-06, "loss": 0.9032, "step": 32584 }, { "epoch": 0.61, "learning_rate": 1.706160507558942e-06, "loss": 0.8431, "step": 32585 }, { "epoch": 0.61, "learning_rate": 1.7060156496909777e-06, "loss": 0.9166, "step": 32586 }, { "epoch": 0.61, "learning_rate": 1.7058707947877256e-06, "loss": 1.1579, "step": 32587 }, { "epoch": 0.61, "learning_rate": 1.7057259428497285e-06, "loss": 1.0157, "step": 32588 }, { "epoch": 0.61, "learning_rate": 1.7055810938775259e-06, "loss": 0.9806, "step": 32589 }, { "epoch": 0.61, "learning_rate": 1.7054362478716588e-06, "loss": 0.9134, "step": 32590 }, { "epoch": 0.61, "learning_rate": 1.7052914048326691e-06, "loss": 0.8526, "step": 32591 }, { "epoch": 0.61, "learning_rate": 1.7051465647610973e-06, "loss": 0.9244, "step": 32592 }, { "epoch": 0.61, "learning_rate": 1.7050017276574826e-06, "loss": 1.0446, "step": 32593 }, { "epoch": 0.61, "learning_rate": 1.704856893522368e-06, "loss": 0.9736, "step": 32594 }, { "epoch": 0.61, "learning_rate": 1.7047120623562933e-06, "loss": 0.7415, "step": 32595 }, { "epoch": 0.61, "learning_rate": 1.704567234159799e-06, "loss": 0.7765, "step": 32596 }, { "epoch": 0.62, "learning_rate": 1.7044224089334266e-06, "loss": 0.8654, "step": 32597 }, { "epoch": 0.62, "learning_rate": 1.7042775866777167e-06, "loss": 0.9033, "step": 32598 }, { "epoch": 0.62, "learning_rate": 1.704132767393209e-06, "loss": 0.9514, "step": 32599 }, { "epoch": 0.62, "learning_rate": 1.703987951080446e-06, "loss": 1.2036, "step": 32600 }, { "epoch": 0.62, "learning_rate": 1.7038431377399678e-06, "loss": 0.9759, "step": 32601 }, { "epoch": 0.62, "learning_rate": 1.703698327372314e-06, "loss": 0.7932, "step": 32602 }, { "epoch": 0.62, "learning_rate": 1.7035535199780265e-06, "loss": 0.8381, "step": 32603 }, { "epoch": 0.62, "learning_rate": 1.7034087155576463e-06, "loss": 0.8394, "step": 32604 }, { "epoch": 0.62, "learning_rate": 1.7032639141117125e-06, "loss": 0.9162, "step": 32605 }, { "epoch": 0.62, "learning_rate": 1.7031191156407678e-06, "loss": 1.0549, "step": 32606 }, { "epoch": 0.62, "learning_rate": 1.702974320145352e-06, "loss": 0.4567, "step": 32607 }, { "epoch": 0.62, "learning_rate": 1.7028295276260047e-06, "loss": 0.8656, "step": 32608 }, { "epoch": 0.62, "learning_rate": 1.7026847380832683e-06, "loss": 0.8833, "step": 32609 }, { "epoch": 0.62, "learning_rate": 1.7025399515176822e-06, "loss": 0.7473, "step": 32610 }, { "epoch": 0.62, "learning_rate": 1.702395167929787e-06, "loss": 0.9754, "step": 32611 }, { "epoch": 0.62, "learning_rate": 1.7022503873201246e-06, "loss": 0.9122, "step": 32612 }, { "epoch": 0.62, "learning_rate": 1.7021056096892353e-06, "loss": 0.9294, "step": 32613 }, { "epoch": 0.62, "learning_rate": 1.7019608350376577e-06, "loss": 0.9714, "step": 32614 }, { "epoch": 0.62, "learning_rate": 1.7018160633659353e-06, "loss": 0.6496, "step": 32615 }, { "epoch": 0.62, "learning_rate": 1.701671294674606e-06, "loss": 0.7982, "step": 32616 }, { "epoch": 0.62, "learning_rate": 1.7015265289642124e-06, "loss": 0.828, "step": 32617 }, { "epoch": 0.62, "learning_rate": 1.7013817662352937e-06, "loss": 1.0813, "step": 32618 }, { "epoch": 0.62, "learning_rate": 1.701237006488392e-06, "loss": 0.9133, "step": 32619 }, { "epoch": 0.62, "learning_rate": 1.7010922497240457e-06, "loss": 0.963, "step": 32620 }, { "epoch": 0.62, "learning_rate": 1.7009474959427973e-06, "loss": 0.8078, "step": 32621 }, { "epoch": 0.62, "learning_rate": 1.7008027451451863e-06, "loss": 0.8801, "step": 32622 }, { "epoch": 0.62, "learning_rate": 1.7006579973317528e-06, "loss": 0.7371, "step": 32623 }, { "epoch": 0.62, "learning_rate": 1.700513252503038e-06, "loss": 1.0132, "step": 32624 }, { "epoch": 0.62, "learning_rate": 1.7003685106595826e-06, "loss": 0.9939, "step": 32625 }, { "epoch": 0.62, "learning_rate": 1.700223771801926e-06, "loss": 0.9316, "step": 32626 }, { "epoch": 0.62, "learning_rate": 1.7000790359306102e-06, "loss": 0.7515, "step": 32627 }, { "epoch": 0.62, "learning_rate": 1.6999343030461746e-06, "loss": 0.9122, "step": 32628 }, { "epoch": 0.62, "learning_rate": 1.6997895731491587e-06, "loss": 0.9969, "step": 32629 }, { "epoch": 0.62, "learning_rate": 1.6996448462401055e-06, "loss": 0.9487, "step": 32630 }, { "epoch": 0.62, "learning_rate": 1.699500122319553e-06, "loss": 1.4031, "step": 32631 }, { "epoch": 0.62, "learning_rate": 1.699355401388042e-06, "loss": 0.941, "step": 32632 }, { "epoch": 0.62, "learning_rate": 1.6992106834461145e-06, "loss": 0.7348, "step": 32633 }, { "epoch": 0.62, "learning_rate": 1.6990659684943098e-06, "loss": 0.8351, "step": 32634 }, { "epoch": 0.62, "learning_rate": 1.698921256533167e-06, "loss": 0.9854, "step": 32635 }, { "epoch": 0.62, "learning_rate": 1.698776547563229e-06, "loss": 0.8959, "step": 32636 }, { "epoch": 0.62, "learning_rate": 1.698631841585034e-06, "loss": 1.0045, "step": 32637 }, { "epoch": 0.62, "learning_rate": 1.698487138599123e-06, "loss": 0.9023, "step": 32638 }, { "epoch": 0.62, "learning_rate": 1.6983424386060371e-06, "loss": 0.8232, "step": 32639 }, { "epoch": 0.62, "learning_rate": 1.6981977416063158e-06, "loss": 1.0652, "step": 32640 }, { "epoch": 0.62, "learning_rate": 1.6980530476004988e-06, "loss": 0.8531, "step": 32641 }, { "epoch": 0.62, "learning_rate": 1.697908356589128e-06, "loss": 0.8701, "step": 32642 }, { "epoch": 0.62, "learning_rate": 1.6977636685727433e-06, "loss": 0.9622, "step": 32643 }, { "epoch": 0.62, "learning_rate": 1.697618983551883e-06, "loss": 0.9819, "step": 32644 }, { "epoch": 0.62, "learning_rate": 1.6974743015270894e-06, "loss": 0.8633, "step": 32645 }, { "epoch": 0.62, "learning_rate": 1.6973296224989027e-06, "loss": 0.7847, "step": 32646 }, { "epoch": 0.62, "learning_rate": 1.6971849464678615e-06, "loss": 0.8377, "step": 32647 }, { "epoch": 0.62, "learning_rate": 1.697040273434508e-06, "loss": 0.8346, "step": 32648 }, { "epoch": 0.62, "learning_rate": 1.6968956033993816e-06, "loss": 0.9481, "step": 32649 }, { "epoch": 0.62, "learning_rate": 1.6967509363630213e-06, "loss": 1.1597, "step": 32650 }, { "epoch": 0.62, "learning_rate": 1.6966062723259697e-06, "loss": 0.9283, "step": 32651 }, { "epoch": 0.62, "learning_rate": 1.696461611288765e-06, "loss": 0.8743, "step": 32652 }, { "epoch": 0.62, "learning_rate": 1.6963169532519474e-06, "loss": 0.906, "step": 32653 }, { "epoch": 0.62, "learning_rate": 1.6961722982160589e-06, "loss": 0.7611, "step": 32654 }, { "epoch": 0.62, "learning_rate": 1.6960276461816382e-06, "loss": 1.1591, "step": 32655 }, { "epoch": 0.62, "learning_rate": 1.6958829971492247e-06, "loss": 1.1253, "step": 32656 }, { "epoch": 0.62, "learning_rate": 1.6957383511193603e-06, "loss": 1.0486, "step": 32657 }, { "epoch": 0.62, "learning_rate": 1.6955937080925838e-06, "loss": 0.8395, "step": 32658 }, { "epoch": 0.62, "learning_rate": 1.6954490680694357e-06, "loss": 0.9636, "step": 32659 }, { "epoch": 0.62, "learning_rate": 1.695304431050456e-06, "loss": 0.8908, "step": 32660 }, { "epoch": 0.62, "learning_rate": 1.6951597970361855e-06, "loss": 0.838, "step": 32661 }, { "epoch": 0.62, "learning_rate": 1.6950151660271627e-06, "loss": 1.0344, "step": 32662 }, { "epoch": 0.62, "learning_rate": 1.6948705380239295e-06, "loss": 1.0803, "step": 32663 }, { "epoch": 0.62, "learning_rate": 1.694725913027025e-06, "loss": 1.1925, "step": 32664 }, { "epoch": 0.62, "learning_rate": 1.6945812910369885e-06, "loss": 0.9418, "step": 32665 }, { "epoch": 0.62, "learning_rate": 1.694436672054361e-06, "loss": 0.791, "step": 32666 }, { "epoch": 0.62, "learning_rate": 1.6942920560796827e-06, "loss": 0.9504, "step": 32667 }, { "epoch": 0.62, "learning_rate": 1.6941474431134925e-06, "loss": 0.9952, "step": 32668 }, { "epoch": 0.62, "learning_rate": 1.6940028331563318e-06, "loss": 1.0131, "step": 32669 }, { "epoch": 0.62, "learning_rate": 1.69385822620874e-06, "loss": 0.8229, "step": 32670 }, { "epoch": 0.62, "learning_rate": 1.6937136222712558e-06, "loss": 0.8432, "step": 32671 }, { "epoch": 0.62, "learning_rate": 1.693569021344421e-06, "loss": 0.7534, "step": 32672 }, { "epoch": 0.62, "learning_rate": 1.6934244234287744e-06, "loss": 0.6501, "step": 32673 }, { "epoch": 0.62, "learning_rate": 1.6932798285248558e-06, "loss": 1.3236, "step": 32674 }, { "epoch": 0.62, "learning_rate": 1.6931352366332065e-06, "loss": 0.9132, "step": 32675 }, { "epoch": 0.62, "learning_rate": 1.6929906477543656e-06, "loss": 1.0626, "step": 32676 }, { "epoch": 0.62, "learning_rate": 1.6928460618888717e-06, "loss": 0.8814, "step": 32677 }, { "epoch": 0.62, "learning_rate": 1.692701479037267e-06, "loss": 1.0227, "step": 32678 }, { "epoch": 0.62, "learning_rate": 1.6925568992000897e-06, "loss": 0.805, "step": 32679 }, { "epoch": 0.62, "learning_rate": 1.6924123223778801e-06, "loss": 0.7941, "step": 32680 }, { "epoch": 0.62, "learning_rate": 1.6922677485711782e-06, "loss": 1.3435, "step": 32681 }, { "epoch": 0.62, "learning_rate": 1.6921231777805245e-06, "loss": 0.6992, "step": 32682 }, { "epoch": 0.62, "learning_rate": 1.6919786100064567e-06, "loss": 1.0558, "step": 32683 }, { "epoch": 0.62, "learning_rate": 1.6918340452495173e-06, "loss": 0.8983, "step": 32684 }, { "epoch": 0.62, "learning_rate": 1.6916894835102445e-06, "loss": 0.8816, "step": 32685 }, { "epoch": 0.62, "learning_rate": 1.6915449247891774e-06, "loss": 0.9342, "step": 32686 }, { "epoch": 0.62, "learning_rate": 1.6914003690868575e-06, "loss": 0.9562, "step": 32687 }, { "epoch": 0.62, "learning_rate": 1.6912558164038243e-06, "loss": 0.9718, "step": 32688 }, { "epoch": 0.62, "learning_rate": 1.691111266740616e-06, "loss": 0.944, "step": 32689 }, { "epoch": 0.62, "learning_rate": 1.6909667200977745e-06, "loss": 0.9212, "step": 32690 }, { "epoch": 0.62, "learning_rate": 1.6908221764758385e-06, "loss": 0.9547, "step": 32691 }, { "epoch": 0.62, "learning_rate": 1.6906776358753463e-06, "loss": 0.6916, "step": 32692 }, { "epoch": 0.62, "learning_rate": 1.6905330982968405e-06, "loss": 1.0829, "step": 32693 }, { "epoch": 0.62, "learning_rate": 1.6903885637408585e-06, "loss": 1.0435, "step": 32694 }, { "epoch": 0.62, "learning_rate": 1.6902440322079402e-06, "loss": 0.9875, "step": 32695 }, { "epoch": 0.62, "learning_rate": 1.6900995036986274e-06, "loss": 0.8044, "step": 32696 }, { "epoch": 0.62, "learning_rate": 1.6899549782134575e-06, "loss": 0.8976, "step": 32697 }, { "epoch": 0.62, "learning_rate": 1.6898104557529702e-06, "loss": 1.0201, "step": 32698 }, { "epoch": 0.62, "learning_rate": 1.689665936317707e-06, "loss": 0.9283, "step": 32699 }, { "epoch": 0.62, "learning_rate": 1.6895214199082054e-06, "loss": 1.1031, "step": 32700 }, { "epoch": 0.62, "learning_rate": 1.6893769065250064e-06, "loss": 1.0927, "step": 32701 }, { "epoch": 0.62, "learning_rate": 1.6892323961686492e-06, "loss": 0.8573, "step": 32702 }, { "epoch": 0.62, "learning_rate": 1.6890878888396732e-06, "loss": 0.8436, "step": 32703 }, { "epoch": 0.62, "learning_rate": 1.6889433845386177e-06, "loss": 0.7184, "step": 32704 }, { "epoch": 0.62, "learning_rate": 1.688798883266024e-06, "loss": 0.9143, "step": 32705 }, { "epoch": 0.62, "learning_rate": 1.68865438502243e-06, "loss": 1.0766, "step": 32706 }, { "epoch": 0.62, "learning_rate": 1.6885098898083746e-06, "loss": 0.941, "step": 32707 }, { "epoch": 0.62, "learning_rate": 1.6883653976243992e-06, "loss": 1.0035, "step": 32708 }, { "epoch": 0.62, "learning_rate": 1.6882209084710427e-06, "loss": 0.7548, "step": 32709 }, { "epoch": 0.62, "learning_rate": 1.6880764223488435e-06, "loss": 0.9708, "step": 32710 }, { "epoch": 0.62, "learning_rate": 1.6879319392583432e-06, "loss": 1.012, "step": 32711 }, { "epoch": 0.62, "learning_rate": 1.68778745920008e-06, "loss": 1.1305, "step": 32712 }, { "epoch": 0.62, "learning_rate": 1.6876429821745926e-06, "loss": 1.1277, "step": 32713 }, { "epoch": 0.62, "learning_rate": 1.6874985081824223e-06, "loss": 0.9001, "step": 32714 }, { "epoch": 0.62, "learning_rate": 1.6873540372241073e-06, "loss": 0.932, "step": 32715 }, { "epoch": 0.62, "learning_rate": 1.687209569300187e-06, "loss": 0.9076, "step": 32716 }, { "epoch": 0.62, "learning_rate": 1.6870651044112018e-06, "loss": 0.9346, "step": 32717 }, { "epoch": 0.62, "learning_rate": 1.6869206425576912e-06, "loss": 0.8962, "step": 32718 }, { "epoch": 0.62, "learning_rate": 1.6867761837401924e-06, "loss": 0.9305, "step": 32719 }, { "epoch": 0.62, "learning_rate": 1.6866317279592477e-06, "loss": 0.7164, "step": 32720 }, { "epoch": 0.62, "learning_rate": 1.686487275215395e-06, "loss": 0.7435, "step": 32721 }, { "epoch": 0.62, "learning_rate": 1.6863428255091732e-06, "loss": 0.7348, "step": 32722 }, { "epoch": 0.62, "learning_rate": 1.6861983788411229e-06, "loss": 0.755, "step": 32723 }, { "epoch": 0.62, "learning_rate": 1.686053935211783e-06, "loss": 0.9514, "step": 32724 }, { "epoch": 0.62, "learning_rate": 1.6859094946216919e-06, "loss": 1.1022, "step": 32725 }, { "epoch": 0.62, "learning_rate": 1.6857650570713907e-06, "loss": 0.8782, "step": 32726 }, { "epoch": 0.62, "learning_rate": 1.685620622561418e-06, "loss": 0.8536, "step": 32727 }, { "epoch": 0.62, "learning_rate": 1.6854761910923117e-06, "loss": 1.0908, "step": 32728 }, { "epoch": 0.62, "learning_rate": 1.6853317626646132e-06, "loss": 0.7788, "step": 32729 }, { "epoch": 0.62, "learning_rate": 1.6851873372788613e-06, "loss": 0.9963, "step": 32730 }, { "epoch": 0.62, "learning_rate": 1.6850429149355934e-06, "loss": 1.1405, "step": 32731 }, { "epoch": 0.62, "learning_rate": 1.6848984956353521e-06, "loss": 0.9456, "step": 32732 }, { "epoch": 0.62, "learning_rate": 1.6847540793786743e-06, "loss": 0.7148, "step": 32733 }, { "epoch": 0.62, "learning_rate": 1.6846096661660988e-06, "loss": 0.795, "step": 32734 }, { "epoch": 0.62, "learning_rate": 1.6844652559981667e-06, "loss": 0.8473, "step": 32735 }, { "epoch": 0.62, "learning_rate": 1.684320848875416e-06, "loss": 0.8485, "step": 32736 }, { "epoch": 0.62, "learning_rate": 1.6841764447983857e-06, "loss": 1.0066, "step": 32737 }, { "epoch": 0.62, "learning_rate": 1.6840320437676166e-06, "loss": 1.0148, "step": 32738 }, { "epoch": 0.62, "learning_rate": 1.6838876457836468e-06, "loss": 0.7857, "step": 32739 }, { "epoch": 0.62, "learning_rate": 1.6837432508470144e-06, "loss": 0.6901, "step": 32740 }, { "epoch": 0.62, "learning_rate": 1.6835988589582608e-06, "loss": 0.8107, "step": 32741 }, { "epoch": 0.62, "learning_rate": 1.6834544701179234e-06, "loss": 0.9162, "step": 32742 }, { "epoch": 0.62, "learning_rate": 1.683310084326542e-06, "loss": 1.1606, "step": 32743 }, { "epoch": 0.62, "learning_rate": 1.6831657015846558e-06, "loss": 1.0134, "step": 32744 }, { "epoch": 0.62, "learning_rate": 1.6830213218928047e-06, "loss": 0.9184, "step": 32745 }, { "epoch": 0.62, "learning_rate": 1.6828769452515253e-06, "loss": 0.9355, "step": 32746 }, { "epoch": 0.62, "learning_rate": 1.6827325716613596e-06, "loss": 0.8742, "step": 32747 }, { "epoch": 0.62, "learning_rate": 1.6825882011228457e-06, "loss": 0.8916, "step": 32748 }, { "epoch": 0.62, "learning_rate": 1.682443833636521e-06, "loss": 0.9156, "step": 32749 }, { "epoch": 0.62, "learning_rate": 1.6822994692029265e-06, "loss": 0.995, "step": 32750 }, { "epoch": 0.62, "learning_rate": 1.6821551078226012e-06, "loss": 0.8491, "step": 32751 }, { "epoch": 0.62, "learning_rate": 1.6820107494960827e-06, "loss": 0.7151, "step": 32752 }, { "epoch": 0.62, "learning_rate": 1.6818663942239121e-06, "loss": 0.9001, "step": 32753 }, { "epoch": 0.62, "learning_rate": 1.6817220420066272e-06, "loss": 0.8837, "step": 32754 }, { "epoch": 0.62, "learning_rate": 1.6815776928447662e-06, "loss": 1.0996, "step": 32755 }, { "epoch": 0.62, "learning_rate": 1.68143334673887e-06, "loss": 1.0643, "step": 32756 }, { "epoch": 0.62, "learning_rate": 1.6812890036894758e-06, "loss": 0.9521, "step": 32757 }, { "epoch": 0.62, "learning_rate": 1.681144663697123e-06, "loss": 0.7973, "step": 32758 }, { "epoch": 0.62, "learning_rate": 1.681000326762352e-06, "loss": 1.1074, "step": 32759 }, { "epoch": 0.62, "learning_rate": 1.6808559928857005e-06, "loss": 0.7567, "step": 32760 }, { "epoch": 0.62, "learning_rate": 1.6807116620677067e-06, "loss": 0.9895, "step": 32761 }, { "epoch": 0.62, "learning_rate": 1.6805673343089118e-06, "loss": 1.0791, "step": 32762 }, { "epoch": 0.62, "learning_rate": 1.6804230096098523e-06, "loss": 0.9653, "step": 32763 }, { "epoch": 0.62, "learning_rate": 1.6802786879710685e-06, "loss": 0.9271, "step": 32764 }, { "epoch": 0.62, "learning_rate": 1.6801343693930987e-06, "loss": 1.0165, "step": 32765 }, { "epoch": 0.62, "learning_rate": 1.6799900538764826e-06, "loss": 0.954, "step": 32766 }, { "epoch": 0.62, "learning_rate": 1.6798457414217578e-06, "loss": 0.8181, "step": 32767 }, { "epoch": 0.62, "learning_rate": 1.6797014320294648e-06, "loss": 1.1303, "step": 32768 }, { "epoch": 0.62, "learning_rate": 1.679557125700141e-06, "loss": 0.87, "step": 32769 }, { "epoch": 0.62, "learning_rate": 1.6794128224343251e-06, "loss": 0.8797, "step": 32770 }, { "epoch": 0.62, "learning_rate": 1.6792685222325568e-06, "loss": 0.8554, "step": 32771 }, { "epoch": 0.62, "learning_rate": 1.6791242250953755e-06, "loss": 0.8271, "step": 32772 }, { "epoch": 0.62, "learning_rate": 1.6789799310233178e-06, "loss": 0.7957, "step": 32773 }, { "epoch": 0.62, "learning_rate": 1.6788356400169254e-06, "loss": 0.8634, "step": 32774 }, { "epoch": 0.62, "learning_rate": 1.6786913520767353e-06, "loss": 0.9317, "step": 32775 }, { "epoch": 0.62, "learning_rate": 1.6785470672032854e-06, "loss": 1.165, "step": 32776 }, { "epoch": 0.62, "learning_rate": 1.678402785397117e-06, "loss": 0.9963, "step": 32777 }, { "epoch": 0.62, "learning_rate": 1.6782585066587662e-06, "loss": 0.8729, "step": 32778 }, { "epoch": 0.62, "learning_rate": 1.6781142309887727e-06, "loss": 0.9331, "step": 32779 }, { "epoch": 0.62, "learning_rate": 1.6779699583876765e-06, "loss": 0.9812, "step": 32780 }, { "epoch": 0.62, "learning_rate": 1.6778256888560154e-06, "loss": 1.2278, "step": 32781 }, { "epoch": 0.62, "learning_rate": 1.6776814223943269e-06, "loss": 1.1115, "step": 32782 }, { "epoch": 0.62, "learning_rate": 1.6775371590031519e-06, "loss": 0.8762, "step": 32783 }, { "epoch": 0.62, "learning_rate": 1.6773928986830273e-06, "loss": 1.0554, "step": 32784 }, { "epoch": 0.62, "learning_rate": 1.6772486414344925e-06, "loss": 0.9311, "step": 32785 }, { "epoch": 0.62, "learning_rate": 1.6771043872580856e-06, "loss": 0.9027, "step": 32786 }, { "epoch": 0.62, "learning_rate": 1.6769601361543464e-06, "loss": 1.1929, "step": 32787 }, { "epoch": 0.62, "learning_rate": 1.6768158881238123e-06, "loss": 1.0729, "step": 32788 }, { "epoch": 0.62, "learning_rate": 1.6766716431670227e-06, "loss": 0.8184, "step": 32789 }, { "epoch": 0.62, "learning_rate": 1.6765274012845164e-06, "loss": 1.0874, "step": 32790 }, { "epoch": 0.62, "learning_rate": 1.676383162476831e-06, "loss": 0.8202, "step": 32791 }, { "epoch": 0.62, "learning_rate": 1.676238926744505e-06, "loss": 1.1584, "step": 32792 }, { "epoch": 0.62, "learning_rate": 1.6760946940880785e-06, "loss": 0.9465, "step": 32793 }, { "epoch": 0.62, "learning_rate": 1.6759504645080893e-06, "loss": 1.0497, "step": 32794 }, { "epoch": 0.62, "learning_rate": 1.6758062380050749e-06, "loss": 1.1293, "step": 32795 }, { "epoch": 0.62, "learning_rate": 1.6756620145795757e-06, "loss": 0.7924, "step": 32796 }, { "epoch": 0.62, "learning_rate": 1.6755177942321288e-06, "loss": 0.9849, "step": 32797 }, { "epoch": 0.62, "learning_rate": 1.675373576963273e-06, "loss": 0.7642, "step": 32798 }, { "epoch": 0.62, "learning_rate": 1.675229362773547e-06, "loss": 0.8484, "step": 32799 }, { "epoch": 0.62, "learning_rate": 1.6750851516634897e-06, "loss": 1.1639, "step": 32800 }, { "epoch": 0.62, "learning_rate": 1.6749409436336383e-06, "loss": 0.9992, "step": 32801 }, { "epoch": 0.62, "learning_rate": 1.6747967386845331e-06, "loss": 1.1198, "step": 32802 }, { "epoch": 0.62, "learning_rate": 1.6746525368167115e-06, "loss": 0.7929, "step": 32803 }, { "epoch": 0.62, "learning_rate": 1.674508338030711e-06, "loss": 0.6545, "step": 32804 }, { "epoch": 0.62, "learning_rate": 1.6743641423270718e-06, "loss": 0.8677, "step": 32805 }, { "epoch": 0.62, "learning_rate": 1.6742199497063321e-06, "loss": 1.0973, "step": 32806 }, { "epoch": 0.62, "learning_rate": 1.6740757601690283e-06, "loss": 0.8027, "step": 32807 }, { "epoch": 0.62, "learning_rate": 1.673931573715702e-06, "loss": 0.9616, "step": 32808 }, { "epoch": 0.62, "learning_rate": 1.6737873903468894e-06, "loss": 0.9035, "step": 32809 }, { "epoch": 0.62, "learning_rate": 1.6736432100631283e-06, "loss": 0.8596, "step": 32810 }, { "epoch": 0.62, "learning_rate": 1.6734990328649592e-06, "loss": 0.8393, "step": 32811 }, { "epoch": 0.62, "learning_rate": 1.6733548587529192e-06, "loss": 1.1493, "step": 32812 }, { "epoch": 0.62, "learning_rate": 1.6732106877275457e-06, "loss": 0.7639, "step": 32813 }, { "epoch": 0.62, "learning_rate": 1.6730665197893798e-06, "loss": 0.7758, "step": 32814 }, { "epoch": 0.62, "learning_rate": 1.6729223549389575e-06, "loss": 0.9728, "step": 32815 }, { "epoch": 0.62, "learning_rate": 1.6727781931768172e-06, "loss": 0.7823, "step": 32816 }, { "epoch": 0.62, "learning_rate": 1.6726340345034985e-06, "loss": 0.7661, "step": 32817 }, { "epoch": 0.62, "learning_rate": 1.6724898789195388e-06, "loss": 1.1893, "step": 32818 }, { "epoch": 0.62, "learning_rate": 1.672345726425476e-06, "loss": 1.1375, "step": 32819 }, { "epoch": 0.62, "learning_rate": 1.6722015770218494e-06, "loss": 0.847, "step": 32820 }, { "epoch": 0.62, "learning_rate": 1.6720574307091972e-06, "loss": 0.8675, "step": 32821 }, { "epoch": 0.62, "learning_rate": 1.6719132874880558e-06, "loss": 0.9772, "step": 32822 }, { "epoch": 0.62, "learning_rate": 1.6717691473589662e-06, "loss": 0.7549, "step": 32823 }, { "epoch": 0.62, "learning_rate": 1.6716250103224651e-06, "loss": 0.9293, "step": 32824 }, { "epoch": 0.62, "learning_rate": 1.6714808763790897e-06, "loss": 1.0411, "step": 32825 }, { "epoch": 0.62, "learning_rate": 1.6713367455293797e-06, "loss": 0.7979, "step": 32826 }, { "epoch": 0.62, "learning_rate": 1.6711926177738736e-06, "loss": 0.9954, "step": 32827 }, { "epoch": 0.62, "learning_rate": 1.6710484931131077e-06, "loss": 0.9232, "step": 32828 }, { "epoch": 0.62, "learning_rate": 1.6709043715476225e-06, "loss": 0.6743, "step": 32829 }, { "epoch": 0.62, "learning_rate": 1.6707602530779549e-06, "loss": 0.6657, "step": 32830 }, { "epoch": 0.62, "learning_rate": 1.6706161377046418e-06, "loss": 0.8933, "step": 32831 }, { "epoch": 0.62, "learning_rate": 1.6704720254282238e-06, "loss": 0.8232, "step": 32832 }, { "epoch": 0.62, "learning_rate": 1.6703279162492375e-06, "loss": 0.749, "step": 32833 }, { "epoch": 0.62, "learning_rate": 1.6701838101682206e-06, "loss": 1.0813, "step": 32834 }, { "epoch": 0.62, "learning_rate": 1.670039707185713e-06, "loss": 0.8096, "step": 32835 }, { "epoch": 0.62, "learning_rate": 1.6698956073022516e-06, "loss": 0.9709, "step": 32836 }, { "epoch": 0.62, "learning_rate": 1.6697515105183737e-06, "loss": 1.2039, "step": 32837 }, { "epoch": 0.62, "learning_rate": 1.6696074168346193e-06, "loss": 1.0557, "step": 32838 }, { "epoch": 0.62, "learning_rate": 1.6694633262515245e-06, "loss": 0.7704, "step": 32839 }, { "epoch": 0.62, "learning_rate": 1.6693192387696283e-06, "loss": 0.9492, "step": 32840 }, { "epoch": 0.62, "learning_rate": 1.6691751543894686e-06, "loss": 0.8411, "step": 32841 }, { "epoch": 0.62, "learning_rate": 1.669031073111584e-06, "loss": 0.8661, "step": 32842 }, { "epoch": 0.62, "learning_rate": 1.668886994936511e-06, "loss": 0.976, "step": 32843 }, { "epoch": 0.62, "learning_rate": 1.6687429198647892e-06, "loss": 0.8502, "step": 32844 }, { "epoch": 0.62, "learning_rate": 1.6685988478969562e-06, "loss": 0.89, "step": 32845 }, { "epoch": 0.62, "learning_rate": 1.6684547790335482e-06, "loss": 1.0015, "step": 32846 }, { "epoch": 0.62, "learning_rate": 1.6683107132751053e-06, "loss": 0.8433, "step": 32847 }, { "epoch": 0.62, "learning_rate": 1.668166650622165e-06, "loss": 0.7383, "step": 32848 }, { "epoch": 0.62, "learning_rate": 1.668022591075264e-06, "loss": 0.9258, "step": 32849 }, { "epoch": 0.62, "learning_rate": 1.6678785346349425e-06, "loss": 1.053, "step": 32850 }, { "epoch": 0.62, "learning_rate": 1.6677344813017366e-06, "loss": 0.7823, "step": 32851 }, { "epoch": 0.62, "learning_rate": 1.6675904310761837e-06, "loss": 1.0103, "step": 32852 }, { "epoch": 0.62, "learning_rate": 1.6674463839588236e-06, "loss": 0.887, "step": 32853 }, { "epoch": 0.62, "learning_rate": 1.667302339950193e-06, "loss": 0.8729, "step": 32854 }, { "epoch": 0.62, "learning_rate": 1.6671582990508289e-06, "loss": 0.9966, "step": 32855 }, { "epoch": 0.62, "learning_rate": 1.6670142612612716e-06, "loss": 1.1755, "step": 32856 }, { "epoch": 0.62, "learning_rate": 1.6668702265820574e-06, "loss": 0.895, "step": 32857 }, { "epoch": 0.62, "learning_rate": 1.6667261950137231e-06, "loss": 0.9728, "step": 32858 }, { "epoch": 0.62, "learning_rate": 1.666582166556809e-06, "loss": 0.9769, "step": 32859 }, { "epoch": 0.62, "learning_rate": 1.6664381412118506e-06, "loss": 0.8262, "step": 32860 }, { "epoch": 0.62, "learning_rate": 1.6662941189793868e-06, "loss": 0.8052, "step": 32861 }, { "epoch": 0.62, "learning_rate": 1.666150099859955e-06, "loss": 0.9736, "step": 32862 }, { "epoch": 0.62, "learning_rate": 1.666006083854094e-06, "loss": 1.0826, "step": 32863 }, { "epoch": 0.62, "learning_rate": 1.6658620709623396e-06, "loss": 0.9453, "step": 32864 }, { "epoch": 0.62, "learning_rate": 1.6657180611852315e-06, "loss": 0.8233, "step": 32865 }, { "epoch": 0.62, "learning_rate": 1.6655740545233068e-06, "loss": 0.7093, "step": 32866 }, { "epoch": 0.62, "learning_rate": 1.6654300509771018e-06, "loss": 0.7992, "step": 32867 }, { "epoch": 0.62, "learning_rate": 1.665286050547156e-06, "loss": 0.8436, "step": 32868 }, { "epoch": 0.62, "learning_rate": 1.6651420532340068e-06, "loss": 1.0281, "step": 32869 }, { "epoch": 0.62, "learning_rate": 1.6649980590381908e-06, "loss": 1.175, "step": 32870 }, { "epoch": 0.62, "learning_rate": 1.6648540679602477e-06, "loss": 0.9129, "step": 32871 }, { "epoch": 0.62, "learning_rate": 1.6647100800007135e-06, "loss": 0.8188, "step": 32872 }, { "epoch": 0.62, "learning_rate": 1.6645660951601253e-06, "loss": 0.8017, "step": 32873 }, { "epoch": 0.62, "learning_rate": 1.6644221134390226e-06, "loss": 1.0696, "step": 32874 }, { "epoch": 0.62, "learning_rate": 1.664278134837942e-06, "loss": 0.9294, "step": 32875 }, { "epoch": 0.62, "learning_rate": 1.6641341593574204e-06, "loss": 1.0069, "step": 32876 }, { "epoch": 0.62, "learning_rate": 1.6639901869979974e-06, "loss": 1.1194, "step": 32877 }, { "epoch": 0.62, "learning_rate": 1.6638462177602094e-06, "loss": 0.9691, "step": 32878 }, { "epoch": 0.62, "learning_rate": 1.6637022516445928e-06, "loss": 0.8347, "step": 32879 }, { "epoch": 0.62, "learning_rate": 1.6635582886516874e-06, "loss": 0.9592, "step": 32880 }, { "epoch": 0.62, "learning_rate": 1.6634143287820292e-06, "loss": 1.0601, "step": 32881 }, { "epoch": 0.62, "learning_rate": 1.6632703720361566e-06, "loss": 0.8348, "step": 32882 }, { "epoch": 0.62, "learning_rate": 1.6631264184146062e-06, "loss": 0.8599, "step": 32883 }, { "epoch": 0.62, "learning_rate": 1.662982467917917e-06, "loss": 1.0172, "step": 32884 }, { "epoch": 0.62, "learning_rate": 1.662838520546624e-06, "loss": 0.8079, "step": 32885 }, { "epoch": 0.62, "learning_rate": 1.662694576301268e-06, "loss": 0.8724, "step": 32886 }, { "epoch": 0.62, "learning_rate": 1.6625506351823846e-06, "loss": 1.0928, "step": 32887 }, { "epoch": 0.62, "learning_rate": 1.6624066971905104e-06, "loss": 0.8346, "step": 32888 }, { "epoch": 0.62, "learning_rate": 1.6622627623261845e-06, "loss": 0.8215, "step": 32889 }, { "epoch": 0.62, "learning_rate": 1.662118830589944e-06, "loss": 0.7758, "step": 32890 }, { "epoch": 0.62, "learning_rate": 1.6619749019823253e-06, "loss": 0.7045, "step": 32891 }, { "epoch": 0.62, "learning_rate": 1.6618309765038675e-06, "loss": 0.813, "step": 32892 }, { "epoch": 0.62, "learning_rate": 1.6616870541551071e-06, "loss": 0.7964, "step": 32893 }, { "epoch": 0.62, "learning_rate": 1.6615431349365807e-06, "loss": 1.0856, "step": 32894 }, { "epoch": 0.62, "learning_rate": 1.6613992188488276e-06, "loss": 0.9276, "step": 32895 }, { "epoch": 0.62, "learning_rate": 1.6612553058923836e-06, "loss": 0.819, "step": 32896 }, { "epoch": 0.62, "learning_rate": 1.661111396067786e-06, "loss": 0.9549, "step": 32897 }, { "epoch": 0.62, "learning_rate": 1.6609674893755737e-06, "loss": 0.6237, "step": 32898 }, { "epoch": 0.62, "learning_rate": 1.660823585816283e-06, "loss": 0.8285, "step": 32899 }, { "epoch": 0.62, "learning_rate": 1.6606796853904504e-06, "loss": 1.0699, "step": 32900 }, { "epoch": 0.62, "learning_rate": 1.660535788098615e-06, "loss": 1.0381, "step": 32901 }, { "epoch": 0.62, "learning_rate": 1.6603918939413127e-06, "loss": 0.9198, "step": 32902 }, { "epoch": 0.62, "learning_rate": 1.6602480029190814e-06, "loss": 0.7976, "step": 32903 }, { "epoch": 0.62, "learning_rate": 1.6601041150324585e-06, "loss": 0.8103, "step": 32904 }, { "epoch": 0.62, "learning_rate": 1.6599602302819814e-06, "loss": 0.9956, "step": 32905 }, { "epoch": 0.62, "learning_rate": 1.6598163486681862e-06, "loss": 1.0038, "step": 32906 }, { "epoch": 0.62, "learning_rate": 1.6596724701916116e-06, "loss": 0.8929, "step": 32907 }, { "epoch": 0.62, "learning_rate": 1.6595285948527946e-06, "loss": 0.7564, "step": 32908 }, { "epoch": 0.62, "learning_rate": 1.6593847226522709e-06, "loss": 0.9897, "step": 32909 }, { "epoch": 0.62, "learning_rate": 1.6592408535905795e-06, "loss": 0.7941, "step": 32910 }, { "epoch": 0.62, "learning_rate": 1.6590969876682572e-06, "loss": 1.0336, "step": 32911 }, { "epoch": 0.62, "learning_rate": 1.6589531248858403e-06, "loss": 0.9447, "step": 32912 }, { "epoch": 0.62, "learning_rate": 1.6588092652438675e-06, "loss": 1.0608, "step": 32913 }, { "epoch": 0.62, "learning_rate": 1.658665408742875e-06, "loss": 0.9119, "step": 32914 }, { "epoch": 0.62, "learning_rate": 1.6585215553833993e-06, "loss": 0.8756, "step": 32915 }, { "epoch": 0.62, "learning_rate": 1.6583777051659795e-06, "loss": 0.8565, "step": 32916 }, { "epoch": 0.62, "learning_rate": 1.6582338580911506e-06, "loss": 0.8149, "step": 32917 }, { "epoch": 0.62, "learning_rate": 1.6580900141594502e-06, "loss": 1.1204, "step": 32918 }, { "epoch": 0.62, "learning_rate": 1.6579461733714169e-06, "loss": 0.9254, "step": 32919 }, { "epoch": 0.62, "learning_rate": 1.6578023357275868e-06, "loss": 1.0281, "step": 32920 }, { "epoch": 0.62, "learning_rate": 1.6576585012284962e-06, "loss": 0.9684, "step": 32921 }, { "epoch": 0.62, "learning_rate": 1.6575146698746837e-06, "loss": 0.8253, "step": 32922 }, { "epoch": 0.62, "learning_rate": 1.657370841666685e-06, "loss": 0.8918, "step": 32923 }, { "epoch": 0.62, "learning_rate": 1.6572270166050381e-06, "loss": 1.0268, "step": 32924 }, { "epoch": 0.62, "learning_rate": 1.6570831946902793e-06, "loss": 1.2715, "step": 32925 }, { "epoch": 0.62, "learning_rate": 1.6569393759229465e-06, "loss": 0.9076, "step": 32926 }, { "epoch": 0.62, "learning_rate": 1.6567955603035755e-06, "loss": 0.848, "step": 32927 }, { "epoch": 0.62, "learning_rate": 1.656651747832705e-06, "loss": 0.8923, "step": 32928 }, { "epoch": 0.62, "learning_rate": 1.6565079385108707e-06, "loss": 0.9765, "step": 32929 }, { "epoch": 0.62, "learning_rate": 1.6563641323386093e-06, "loss": 0.9974, "step": 32930 }, { "epoch": 0.62, "learning_rate": 1.6562203293164586e-06, "loss": 1.1344, "step": 32931 }, { "epoch": 0.62, "learning_rate": 1.656076529444956e-06, "loss": 0.8501, "step": 32932 }, { "epoch": 0.62, "learning_rate": 1.6559327327246365e-06, "loss": 1.0411, "step": 32933 }, { "epoch": 0.62, "learning_rate": 1.6557889391560395e-06, "loss": 0.6413, "step": 32934 }, { "epoch": 0.62, "learning_rate": 1.6556451487397007e-06, "loss": 0.7461, "step": 32935 }, { "epoch": 0.62, "learning_rate": 1.6555013614761562e-06, "loss": 0.8589, "step": 32936 }, { "epoch": 0.62, "learning_rate": 1.655357577365944e-06, "loss": 1.2041, "step": 32937 }, { "epoch": 0.62, "learning_rate": 1.655213796409601e-06, "loss": 0.7802, "step": 32938 }, { "epoch": 0.62, "learning_rate": 1.6550700186076628e-06, "loss": 0.9207, "step": 32939 }, { "epoch": 0.62, "learning_rate": 1.6549262439606686e-06, "loss": 0.8366, "step": 32940 }, { "epoch": 0.62, "learning_rate": 1.654782472469154e-06, "loss": 0.7234, "step": 32941 }, { "epoch": 0.62, "learning_rate": 1.6546387041336542e-06, "loss": 0.9439, "step": 32942 }, { "epoch": 0.62, "learning_rate": 1.6544949389547089e-06, "loss": 1.1564, "step": 32943 }, { "epoch": 0.62, "learning_rate": 1.654351176932853e-06, "loss": 0.8777, "step": 32944 }, { "epoch": 0.62, "learning_rate": 1.654207418068624e-06, "loss": 0.9819, "step": 32945 }, { "epoch": 0.62, "learning_rate": 1.6540636623625583e-06, "loss": 0.9098, "step": 32946 }, { "epoch": 0.62, "learning_rate": 1.6539199098151937e-06, "loss": 0.7762, "step": 32947 }, { "epoch": 0.62, "learning_rate": 1.6537761604270652e-06, "loss": 0.7849, "step": 32948 }, { "epoch": 0.62, "learning_rate": 1.6536324141987114e-06, "loss": 0.9773, "step": 32949 }, { "epoch": 0.62, "learning_rate": 1.6534886711306686e-06, "loss": 1.0553, "step": 32950 }, { "epoch": 0.62, "learning_rate": 1.6533449312234718e-06, "loss": 0.6311, "step": 32951 }, { "epoch": 0.62, "learning_rate": 1.6532011944776595e-06, "loss": 0.8521, "step": 32952 }, { "epoch": 0.62, "learning_rate": 1.6530574608937686e-06, "loss": 0.8659, "step": 32953 }, { "epoch": 0.62, "learning_rate": 1.652913730472334e-06, "loss": 0.6663, "step": 32954 }, { "epoch": 0.62, "learning_rate": 1.6527700032138949e-06, "loss": 0.9446, "step": 32955 }, { "epoch": 0.62, "learning_rate": 1.6526262791189865e-06, "loss": 0.8981, "step": 32956 }, { "epoch": 0.62, "learning_rate": 1.6524825581881445e-06, "loss": 1.0057, "step": 32957 }, { "epoch": 0.62, "learning_rate": 1.6523388404219077e-06, "loss": 0.9063, "step": 32958 }, { "epoch": 0.62, "learning_rate": 1.6521951258208114e-06, "loss": 0.9243, "step": 32959 }, { "epoch": 0.62, "learning_rate": 1.6520514143853917e-06, "loss": 1.0958, "step": 32960 }, { "epoch": 0.62, "learning_rate": 1.651907706116187e-06, "loss": 0.9602, "step": 32961 }, { "epoch": 0.62, "learning_rate": 1.6517640010137331e-06, "loss": 1.0161, "step": 32962 }, { "epoch": 0.62, "learning_rate": 1.651620299078565e-06, "loss": 1.0579, "step": 32963 }, { "epoch": 0.62, "learning_rate": 1.6514766003112224e-06, "loss": 0.8522, "step": 32964 }, { "epoch": 0.62, "learning_rate": 1.6513329047122392e-06, "loss": 0.8816, "step": 32965 }, { "epoch": 0.62, "learning_rate": 1.6511892122821532e-06, "loss": 0.8586, "step": 32966 }, { "epoch": 0.62, "learning_rate": 1.6510455230215003e-06, "loss": 0.9327, "step": 32967 }, { "epoch": 0.62, "learning_rate": 1.650901836930818e-06, "loss": 0.8004, "step": 32968 }, { "epoch": 0.62, "learning_rate": 1.6507581540106412e-06, "loss": 1.0097, "step": 32969 }, { "epoch": 0.62, "learning_rate": 1.6506144742615088e-06, "loss": 0.8844, "step": 32970 }, { "epoch": 0.62, "learning_rate": 1.6504707976839553e-06, "loss": 0.8933, "step": 32971 }, { "epoch": 0.62, "learning_rate": 1.6503271242785172e-06, "loss": 0.8287, "step": 32972 }, { "epoch": 0.62, "learning_rate": 1.6501834540457317e-06, "loss": 0.648, "step": 32973 }, { "epoch": 0.62, "learning_rate": 1.6500397869861363e-06, "loss": 1.1185, "step": 32974 }, { "epoch": 0.62, "learning_rate": 1.6498961231002647e-06, "loss": 0.9933, "step": 32975 }, { "epoch": 0.62, "learning_rate": 1.649752462388656e-06, "loss": 0.8141, "step": 32976 }, { "epoch": 0.62, "learning_rate": 1.6496088048518456e-06, "loss": 0.68, "step": 32977 }, { "epoch": 0.62, "learning_rate": 1.6494651504903686e-06, "loss": 0.9691, "step": 32978 }, { "epoch": 0.62, "learning_rate": 1.6493214993047641e-06, "loss": 0.8928, "step": 32979 }, { "epoch": 0.62, "learning_rate": 1.6491778512955665e-06, "loss": 1.0169, "step": 32980 }, { "epoch": 0.62, "learning_rate": 1.649034206463312e-06, "loss": 0.9839, "step": 32981 }, { "epoch": 0.62, "learning_rate": 1.6488905648085386e-06, "loss": 0.9385, "step": 32982 }, { "epoch": 0.62, "learning_rate": 1.6487469263317817e-06, "loss": 0.9535, "step": 32983 }, { "epoch": 0.62, "learning_rate": 1.648603291033577e-06, "loss": 0.8289, "step": 32984 }, { "epoch": 0.62, "learning_rate": 1.6484596589144624e-06, "loss": 0.6519, "step": 32985 }, { "epoch": 0.62, "learning_rate": 1.6483160299749728e-06, "loss": 0.9873, "step": 32986 }, { "epoch": 0.62, "learning_rate": 1.6481724042156449e-06, "loss": 1.2216, "step": 32987 }, { "epoch": 0.62, "learning_rate": 1.6480287816370152e-06, "loss": 1.0112, "step": 32988 }, { "epoch": 0.62, "learning_rate": 1.6478851622396204e-06, "loss": 0.8508, "step": 32989 }, { "epoch": 0.62, "learning_rate": 1.6477415460239954e-06, "loss": 0.7271, "step": 32990 }, { "epoch": 0.62, "learning_rate": 1.6475979329906783e-06, "loss": 0.92, "step": 32991 }, { "epoch": 0.62, "learning_rate": 1.6474543231402044e-06, "loss": 0.7433, "step": 32992 }, { "epoch": 0.62, "learning_rate": 1.647310716473109e-06, "loss": 1.1092, "step": 32993 }, { "epoch": 0.62, "learning_rate": 1.647167112989929e-06, "loss": 0.9541, "step": 32994 }, { "epoch": 0.62, "learning_rate": 1.647023512691202e-06, "loss": 0.9602, "step": 32995 }, { "epoch": 0.62, "learning_rate": 1.6468799155774623e-06, "loss": 0.9049, "step": 32996 }, { "epoch": 0.62, "learning_rate": 1.6467363216492478e-06, "loss": 0.9329, "step": 32997 }, { "epoch": 0.62, "learning_rate": 1.646592730907093e-06, "loss": 0.9936, "step": 32998 }, { "epoch": 0.62, "learning_rate": 1.6464491433515344e-06, "loss": 1.2051, "step": 32999 }, { "epoch": 0.62, "learning_rate": 1.6463055589831095e-06, "loss": 1.0242, "step": 33000 }, { "epoch": 0.62, "learning_rate": 1.6461619778023526e-06, "loss": 0.8004, "step": 33001 }, { "epoch": 0.62, "learning_rate": 1.6460183998098007e-06, "loss": 0.6924, "step": 33002 }, { "epoch": 0.62, "learning_rate": 1.6458748250059903e-06, "loss": 0.7804, "step": 33003 }, { "epoch": 0.62, "learning_rate": 1.6457312533914577e-06, "loss": 0.8829, "step": 33004 }, { "epoch": 0.62, "learning_rate": 1.6455876849667369e-06, "loss": 0.9429, "step": 33005 }, { "epoch": 0.62, "learning_rate": 1.6454441197323667e-06, "loss": 1.0134, "step": 33006 }, { "epoch": 0.62, "learning_rate": 1.6453005576888815e-06, "loss": 0.9147, "step": 33007 }, { "epoch": 0.62, "learning_rate": 1.645156998836818e-06, "loss": 0.7547, "step": 33008 }, { "epoch": 0.62, "learning_rate": 1.6450134431767117e-06, "loss": 0.8442, "step": 33009 }, { "epoch": 0.62, "learning_rate": 1.6448698907091e-06, "loss": 0.7227, "step": 33010 }, { "epoch": 0.62, "learning_rate": 1.6447263414345163e-06, "loss": 1.0113, "step": 33011 }, { "epoch": 0.62, "learning_rate": 1.6445827953534993e-06, "loss": 0.8308, "step": 33012 }, { "epoch": 0.62, "learning_rate": 1.6444392524665842e-06, "loss": 1.088, "step": 33013 }, { "epoch": 0.62, "learning_rate": 1.6442957127743056e-06, "loss": 0.6852, "step": 33014 }, { "epoch": 0.62, "learning_rate": 1.644152176277201e-06, "loss": 0.9811, "step": 33015 }, { "epoch": 0.62, "learning_rate": 1.6440086429758068e-06, "loss": 1.0129, "step": 33016 }, { "epoch": 0.62, "learning_rate": 1.6438651128706564e-06, "loss": 0.8145, "step": 33017 }, { "epoch": 0.62, "learning_rate": 1.643721585962289e-06, "loss": 1.0007, "step": 33018 }, { "epoch": 0.62, "learning_rate": 1.6435780622512387e-06, "loss": 0.8611, "step": 33019 }, { "epoch": 0.62, "learning_rate": 1.6434345417380406e-06, "loss": 0.9254, "step": 33020 }, { "epoch": 0.62, "learning_rate": 1.6432910244232328e-06, "loss": 0.9144, "step": 33021 }, { "epoch": 0.62, "learning_rate": 1.6431475103073497e-06, "loss": 0.8497, "step": 33022 }, { "epoch": 0.62, "learning_rate": 1.6430039993909277e-06, "loss": 1.0373, "step": 33023 }, { "epoch": 0.62, "learning_rate": 1.6428604916745018e-06, "loss": 0.9969, "step": 33024 }, { "epoch": 0.62, "learning_rate": 1.642716987158609e-06, "loss": 0.9803, "step": 33025 }, { "epoch": 0.62, "learning_rate": 1.6425734858437852e-06, "loss": 0.9548, "step": 33026 }, { "epoch": 0.62, "learning_rate": 1.6424299877305644e-06, "loss": 0.8332, "step": 33027 }, { "epoch": 0.62, "learning_rate": 1.6422864928194845e-06, "loss": 1.0822, "step": 33028 }, { "epoch": 0.62, "learning_rate": 1.6421430011110811e-06, "loss": 0.7612, "step": 33029 }, { "epoch": 0.62, "learning_rate": 1.641999512605888e-06, "loss": 0.8329, "step": 33030 }, { "epoch": 0.62, "learning_rate": 1.6418560273044437e-06, "loss": 1.0158, "step": 33031 }, { "epoch": 0.62, "learning_rate": 1.641712545207283e-06, "loss": 0.908, "step": 33032 }, { "epoch": 0.62, "learning_rate": 1.6415690663149397e-06, "loss": 0.8996, "step": 33033 }, { "epoch": 0.62, "learning_rate": 1.6414255906279525e-06, "loss": 0.9437, "step": 33034 }, { "epoch": 0.62, "learning_rate": 1.6412821181468552e-06, "loss": 0.8583, "step": 33035 }, { "epoch": 0.62, "learning_rate": 1.641138648872184e-06, "loss": 0.7506, "step": 33036 }, { "epoch": 0.62, "learning_rate": 1.6409951828044754e-06, "loss": 0.9172, "step": 33037 }, { "epoch": 0.62, "learning_rate": 1.6408517199442648e-06, "loss": 1.0388, "step": 33038 }, { "epoch": 0.62, "learning_rate": 1.6407082602920859e-06, "loss": 0.9627, "step": 33039 }, { "epoch": 0.62, "learning_rate": 1.6405648038484775e-06, "loss": 0.9941, "step": 33040 }, { "epoch": 0.62, "learning_rate": 1.6404213506139733e-06, "loss": 0.6772, "step": 33041 }, { "epoch": 0.62, "learning_rate": 1.6402779005891092e-06, "loss": 0.8294, "step": 33042 }, { "epoch": 0.62, "learning_rate": 1.6401344537744212e-06, "loss": 1.0691, "step": 33043 }, { "epoch": 0.62, "learning_rate": 1.6399910101704452e-06, "loss": 1.1019, "step": 33044 }, { "epoch": 0.62, "learning_rate": 1.6398475697777156e-06, "loss": 0.8734, "step": 33045 }, { "epoch": 0.62, "learning_rate": 1.6397041325967693e-06, "loss": 0.7833, "step": 33046 }, { "epoch": 0.62, "learning_rate": 1.639560698628142e-06, "loss": 0.7614, "step": 33047 }, { "epoch": 0.62, "learning_rate": 1.6394172678723675e-06, "loss": 0.8987, "step": 33048 }, { "epoch": 0.62, "learning_rate": 1.6392738403299827e-06, "loss": 1.1042, "step": 33049 }, { "epoch": 0.62, "learning_rate": 1.6391304160015237e-06, "loss": 0.9351, "step": 33050 }, { "epoch": 0.62, "learning_rate": 1.6389869948875242e-06, "loss": 0.8761, "step": 33051 }, { "epoch": 0.62, "learning_rate": 1.6388435769885222e-06, "loss": 0.7843, "step": 33052 }, { "epoch": 0.62, "learning_rate": 1.6387001623050515e-06, "loss": 0.9047, "step": 33053 }, { "epoch": 0.62, "learning_rate": 1.6385567508376473e-06, "loss": 0.7911, "step": 33054 }, { "epoch": 0.62, "learning_rate": 1.6384133425868468e-06, "loss": 0.8266, "step": 33055 }, { "epoch": 0.62, "learning_rate": 1.6382699375531836e-06, "loss": 1.0615, "step": 33056 }, { "epoch": 0.62, "learning_rate": 1.638126535737194e-06, "loss": 0.9613, "step": 33057 }, { "epoch": 0.62, "learning_rate": 1.637983137139414e-06, "loss": 0.8885, "step": 33058 }, { "epoch": 0.62, "learning_rate": 1.637839741760379e-06, "loss": 0.8489, "step": 33059 }, { "epoch": 0.62, "learning_rate": 1.6376963496006226e-06, "loss": 0.8716, "step": 33060 }, { "epoch": 0.62, "learning_rate": 1.6375529606606828e-06, "loss": 0.8613, "step": 33061 }, { "epoch": 0.62, "learning_rate": 1.6374095749410934e-06, "loss": 1.0986, "step": 33062 }, { "epoch": 0.62, "learning_rate": 1.63726619244239e-06, "loss": 1.0814, "step": 33063 }, { "epoch": 0.62, "learning_rate": 1.637122813165108e-06, "loss": 1.0264, "step": 33064 }, { "epoch": 0.62, "learning_rate": 1.636979437109784e-06, "loss": 0.9021, "step": 33065 }, { "epoch": 0.62, "learning_rate": 1.6368360642769509e-06, "loss": 0.9362, "step": 33066 }, { "epoch": 0.62, "learning_rate": 1.6366926946671463e-06, "loss": 0.7491, "step": 33067 }, { "epoch": 0.62, "learning_rate": 1.6365493282809053e-06, "loss": 1.1251, "step": 33068 }, { "epoch": 0.62, "learning_rate": 1.6364059651187613e-06, "loss": 1.0052, "step": 33069 }, { "epoch": 0.62, "learning_rate": 1.6362626051812514e-06, "loss": 0.8827, "step": 33070 }, { "epoch": 0.62, "learning_rate": 1.636119248468911e-06, "loss": 0.8922, "step": 33071 }, { "epoch": 0.62, "learning_rate": 1.6359758949822737e-06, "loss": 0.8005, "step": 33072 }, { "epoch": 0.62, "learning_rate": 1.635832544721877e-06, "loss": 0.9206, "step": 33073 }, { "epoch": 0.62, "learning_rate": 1.6356891976882555e-06, "loss": 1.0242, "step": 33074 }, { "epoch": 0.62, "learning_rate": 1.6355458538819424e-06, "loss": 0.9894, "step": 33075 }, { "epoch": 0.62, "learning_rate": 1.6354025133034762e-06, "loss": 0.8267, "step": 33076 }, { "epoch": 0.62, "learning_rate": 1.6352591759533894e-06, "loss": 0.8193, "step": 33077 }, { "epoch": 0.62, "learning_rate": 1.6351158418322183e-06, "loss": 0.9824, "step": 33078 }, { "epoch": 0.62, "learning_rate": 1.634972510940499e-06, "loss": 0.6543, "step": 33079 }, { "epoch": 0.62, "learning_rate": 1.6348291832787654e-06, "loss": 0.7968, "step": 33080 }, { "epoch": 0.62, "learning_rate": 1.6346858588475528e-06, "loss": 0.9473, "step": 33081 }, { "epoch": 0.62, "learning_rate": 1.6345425376473972e-06, "loss": 0.9913, "step": 33082 }, { "epoch": 0.62, "learning_rate": 1.6343992196788327e-06, "loss": 0.8415, "step": 33083 }, { "epoch": 0.62, "learning_rate": 1.634255904942395e-06, "loss": 1.0494, "step": 33084 }, { "epoch": 0.62, "learning_rate": 1.6341125934386195e-06, "loss": 0.8286, "step": 33085 }, { "epoch": 0.62, "learning_rate": 1.6339692851680414e-06, "loss": 0.6561, "step": 33086 }, { "epoch": 0.62, "learning_rate": 1.6338259801311945e-06, "loss": 1.1475, "step": 33087 }, { "epoch": 0.62, "learning_rate": 1.6336826783286157e-06, "loss": 1.1436, "step": 33088 }, { "epoch": 0.62, "learning_rate": 1.6335393797608392e-06, "loss": 0.9037, "step": 33089 }, { "epoch": 0.62, "learning_rate": 1.633396084428399e-06, "loss": 1.021, "step": 33090 }, { "epoch": 0.62, "learning_rate": 1.6332527923318319e-06, "loss": 0.8502, "step": 33091 }, { "epoch": 0.62, "learning_rate": 1.633109503471673e-06, "loss": 1.0333, "step": 33092 }, { "epoch": 0.62, "learning_rate": 1.6329662178484551e-06, "loss": 1.1248, "step": 33093 }, { "epoch": 0.62, "learning_rate": 1.6328229354627162e-06, "loss": 1.0142, "step": 33094 }, { "epoch": 0.62, "learning_rate": 1.63267965631499e-06, "loss": 0.9022, "step": 33095 }, { "epoch": 0.62, "learning_rate": 1.63253638040581e-06, "loss": 0.996, "step": 33096 }, { "epoch": 0.62, "learning_rate": 1.6323931077357137e-06, "loss": 0.952, "step": 33097 }, { "epoch": 0.62, "learning_rate": 1.6322498383052342e-06, "loss": 0.7625, "step": 33098 }, { "epoch": 0.62, "learning_rate": 1.6321065721149071e-06, "loss": 1.0225, "step": 33099 }, { "epoch": 0.62, "learning_rate": 1.6319633091652682e-06, "loss": 1.1696, "step": 33100 }, { "epoch": 0.62, "learning_rate": 1.6318200494568516e-06, "loss": 0.7677, "step": 33101 }, { "epoch": 0.62, "learning_rate": 1.6316767929901918e-06, "loss": 1.0254, "step": 33102 }, { "epoch": 0.62, "learning_rate": 1.6315335397658247e-06, "loss": 0.8299, "step": 33103 }, { "epoch": 0.62, "learning_rate": 1.6313902897842845e-06, "loss": 0.8381, "step": 33104 }, { "epoch": 0.62, "learning_rate": 1.6312470430461064e-06, "loss": 0.8776, "step": 33105 }, { "epoch": 0.62, "learning_rate": 1.6311037995518247e-06, "loss": 1.0239, "step": 33106 }, { "epoch": 0.62, "learning_rate": 1.6309605593019758e-06, "loss": 1.1248, "step": 33107 }, { "epoch": 0.62, "learning_rate": 1.6308173222970924e-06, "loss": 0.8197, "step": 33108 }, { "epoch": 0.62, "learning_rate": 1.6306740885377115e-06, "loss": 0.8836, "step": 33109 }, { "epoch": 0.62, "learning_rate": 1.6305308580243668e-06, "loss": 0.9126, "step": 33110 }, { "epoch": 0.62, "learning_rate": 1.6303876307575923e-06, "loss": 0.8724, "step": 33111 }, { "epoch": 0.62, "learning_rate": 1.630244406737924e-06, "loss": 0.9789, "step": 33112 }, { "epoch": 0.62, "learning_rate": 1.6301011859658971e-06, "loss": 0.8889, "step": 33113 }, { "epoch": 0.62, "learning_rate": 1.6299579684420447e-06, "loss": 0.6806, "step": 33114 }, { "epoch": 0.62, "learning_rate": 1.6298147541669034e-06, "loss": 0.6866, "step": 33115 }, { "epoch": 0.62, "learning_rate": 1.6296715431410075e-06, "loss": 0.7722, "step": 33116 }, { "epoch": 0.62, "learning_rate": 1.62952833536489e-06, "loss": 0.8624, "step": 33117 }, { "epoch": 0.62, "learning_rate": 1.6293851308390879e-06, "loss": 1.046, "step": 33118 }, { "epoch": 0.62, "learning_rate": 1.6292419295641353e-06, "loss": 1.1155, "step": 33119 }, { "epoch": 0.62, "learning_rate": 1.6290987315405654e-06, "loss": 0.8505, "step": 33120 }, { "epoch": 0.62, "learning_rate": 1.6289555367689156e-06, "loss": 0.8536, "step": 33121 }, { "epoch": 0.62, "learning_rate": 1.628812345249719e-06, "loss": 1.1262, "step": 33122 }, { "epoch": 0.62, "learning_rate": 1.628669156983509e-06, "loss": 0.8205, "step": 33123 }, { "epoch": 0.62, "learning_rate": 1.628525971970823e-06, "loss": 1.0282, "step": 33124 }, { "epoch": 0.62, "learning_rate": 1.6283827902121938e-06, "loss": 1.0247, "step": 33125 }, { "epoch": 0.62, "learning_rate": 1.628239611708156e-06, "loss": 0.9998, "step": 33126 }, { "epoch": 0.63, "learning_rate": 1.6280964364592455e-06, "loss": 0.859, "step": 33127 }, { "epoch": 0.63, "learning_rate": 1.6279532644659964e-06, "loss": 0.796, "step": 33128 }, { "epoch": 0.63, "learning_rate": 1.6278100957289421e-06, "loss": 0.7857, "step": 33129 }, { "epoch": 0.63, "learning_rate": 1.6276669302486192e-06, "loss": 0.916, "step": 33130 }, { "epoch": 0.63, "learning_rate": 1.6275237680255606e-06, "loss": 0.931, "step": 33131 }, { "epoch": 0.63, "learning_rate": 1.6273806090603017e-06, "loss": 0.821, "step": 33132 }, { "epoch": 0.63, "learning_rate": 1.6272374533533767e-06, "loss": 0.9626, "step": 33133 }, { "epoch": 0.63, "learning_rate": 1.6270943009053208e-06, "loss": 1.0078, "step": 33134 }, { "epoch": 0.63, "learning_rate": 1.626951151716667e-06, "loss": 0.8223, "step": 33135 }, { "epoch": 0.63, "learning_rate": 1.6268080057879517e-06, "loss": 1.0025, "step": 33136 }, { "epoch": 0.63, "learning_rate": 1.6266648631197088e-06, "loss": 1.2456, "step": 33137 }, { "epoch": 0.63, "learning_rate": 1.6265217237124713e-06, "loss": 1.0975, "step": 33138 }, { "epoch": 0.63, "learning_rate": 1.6263785875667757e-06, "loss": 0.9479, "step": 33139 }, { "epoch": 0.63, "learning_rate": 1.626235454683156e-06, "loss": 0.792, "step": 33140 }, { "epoch": 0.63, "learning_rate": 1.626092325062145e-06, "loss": 0.9771, "step": 33141 }, { "epoch": 0.63, "learning_rate": 1.62594919870428e-06, "loss": 0.7466, "step": 33142 }, { "epoch": 0.63, "learning_rate": 1.6258060756100936e-06, "loss": 0.9399, "step": 33143 }, { "epoch": 0.63, "learning_rate": 1.6256629557801196e-06, "loss": 1.1665, "step": 33144 }, { "epoch": 0.63, "learning_rate": 1.6255198392148944e-06, "loss": 1.1224, "step": 33145 }, { "epoch": 0.63, "learning_rate": 1.6253767259149505e-06, "loss": 0.7593, "step": 33146 }, { "epoch": 0.63, "learning_rate": 1.625233615880823e-06, "loss": 0.9261, "step": 33147 }, { "epoch": 0.63, "learning_rate": 1.625090509113047e-06, "loss": 1.04, "step": 33148 }, { "epoch": 0.63, "learning_rate": 1.6249474056121564e-06, "loss": 1.1418, "step": 33149 }, { "epoch": 0.63, "learning_rate": 1.6248043053786844e-06, "loss": 1.239, "step": 33150 }, { "epoch": 0.63, "learning_rate": 1.6246612084131672e-06, "loss": 1.0584, "step": 33151 }, { "epoch": 0.63, "learning_rate": 1.6245181147161377e-06, "loss": 0.7773, "step": 33152 }, { "epoch": 0.63, "learning_rate": 1.6243750242881306e-06, "loss": 0.8866, "step": 33153 }, { "epoch": 0.63, "learning_rate": 1.6242319371296805e-06, "loss": 1.0144, "step": 33154 }, { "epoch": 0.63, "learning_rate": 1.6240888532413218e-06, "loss": 1.0225, "step": 33155 }, { "epoch": 0.63, "learning_rate": 1.6239457726235876e-06, "loss": 0.8376, "step": 33156 }, { "epoch": 0.63, "learning_rate": 1.6238026952770142e-06, "loss": 0.9435, "step": 33157 }, { "epoch": 0.63, "learning_rate": 1.6236596212021344e-06, "loss": 0.9397, "step": 33158 }, { "epoch": 0.63, "learning_rate": 1.6235165503994818e-06, "loss": 0.8459, "step": 33159 }, { "epoch": 0.63, "learning_rate": 1.6233734828695921e-06, "loss": 0.8258, "step": 33160 }, { "epoch": 0.63, "learning_rate": 1.6232304186129994e-06, "loss": 1.1218, "step": 33161 }, { "epoch": 0.63, "learning_rate": 1.6230873576302363e-06, "loss": 1.1541, "step": 33162 }, { "epoch": 0.63, "learning_rate": 1.6229442999218391e-06, "loss": 0.9007, "step": 33163 }, { "epoch": 0.63, "learning_rate": 1.6228012454883413e-06, "loss": 0.9911, "step": 33164 }, { "epoch": 0.63, "learning_rate": 1.6226581943302754e-06, "loss": 0.8636, "step": 33165 }, { "epoch": 0.63, "learning_rate": 1.622515146448178e-06, "loss": 0.7768, "step": 33166 }, { "epoch": 0.63, "learning_rate": 1.622372101842582e-06, "loss": 0.8127, "step": 33167 }, { "epoch": 0.63, "learning_rate": 1.6222290605140205e-06, "loss": 1.1212, "step": 33168 }, { "epoch": 0.63, "learning_rate": 1.6220860224630306e-06, "loss": 1.1031, "step": 33169 }, { "epoch": 0.63, "learning_rate": 1.621942987690144e-06, "loss": 0.8045, "step": 33170 }, { "epoch": 0.63, "learning_rate": 1.6217999561958945e-06, "loss": 0.8004, "step": 33171 }, { "epoch": 0.63, "learning_rate": 1.621656927980818e-06, "loss": 0.9092, "step": 33172 }, { "epoch": 0.63, "learning_rate": 1.6215139030454471e-06, "loss": 0.8851, "step": 33173 }, { "epoch": 0.63, "learning_rate": 1.6213708813903164e-06, "loss": 0.9534, "step": 33174 }, { "epoch": 0.63, "learning_rate": 1.62122786301596e-06, "loss": 1.0342, "step": 33175 }, { "epoch": 0.63, "learning_rate": 1.6210848479229119e-06, "loss": 0.7245, "step": 33176 }, { "epoch": 0.63, "learning_rate": 1.6209418361117054e-06, "loss": 0.6655, "step": 33177 }, { "epoch": 0.63, "learning_rate": 1.6207988275828763e-06, "loss": 0.8589, "step": 33178 }, { "epoch": 0.63, "learning_rate": 1.620655822336957e-06, "loss": 0.8644, "step": 33179 }, { "epoch": 0.63, "learning_rate": 1.620512820374481e-06, "loss": 0.7965, "step": 33180 }, { "epoch": 0.63, "learning_rate": 1.6203698216959838e-06, "loss": 0.8687, "step": 33181 }, { "epoch": 0.63, "learning_rate": 1.620226826301999e-06, "loss": 0.9761, "step": 33182 }, { "epoch": 0.63, "learning_rate": 1.6200838341930593e-06, "loss": 0.755, "step": 33183 }, { "epoch": 0.63, "learning_rate": 1.6199408453697009e-06, "loss": 0.8538, "step": 33184 }, { "epoch": 0.63, "learning_rate": 1.619797859832456e-06, "loss": 0.9024, "step": 33185 }, { "epoch": 0.63, "learning_rate": 1.6196548775818583e-06, "loss": 0.8224, "step": 33186 }, { "epoch": 0.63, "learning_rate": 1.619511898618443e-06, "loss": 0.9947, "step": 33187 }, { "epoch": 0.63, "learning_rate": 1.6193689229427428e-06, "loss": 0.9401, "step": 33188 }, { "epoch": 0.63, "learning_rate": 1.6192259505552915e-06, "loss": 0.9661, "step": 33189 }, { "epoch": 0.63, "learning_rate": 1.6190829814566247e-06, "loss": 0.9756, "step": 33190 }, { "epoch": 0.63, "learning_rate": 1.6189400156472751e-06, "loss": 1.0728, "step": 33191 }, { "epoch": 0.63, "learning_rate": 1.6187970531277752e-06, "loss": 0.7914, "step": 33192 }, { "epoch": 0.63, "learning_rate": 1.6186540938986612e-06, "loss": 0.8634, "step": 33193 }, { "epoch": 0.63, "learning_rate": 1.6185111379604652e-06, "loss": 1.0475, "step": 33194 }, { "epoch": 0.63, "learning_rate": 1.6183681853137217e-06, "loss": 0.9651, "step": 33195 }, { "epoch": 0.63, "learning_rate": 1.6182252359589643e-06, "loss": 0.9566, "step": 33196 }, { "epoch": 0.63, "learning_rate": 1.6180822898967274e-06, "loss": 0.6591, "step": 33197 }, { "epoch": 0.63, "learning_rate": 1.617939347127543e-06, "loss": 0.7229, "step": 33198 }, { "epoch": 0.63, "learning_rate": 1.6177964076519473e-06, "loss": 0.9122, "step": 33199 }, { "epoch": 0.63, "learning_rate": 1.6176534714704729e-06, "loss": 0.9562, "step": 33200 }, { "epoch": 0.63, "learning_rate": 1.6175105385836517e-06, "loss": 1.0417, "step": 33201 }, { "epoch": 0.63, "learning_rate": 1.6173676089920202e-06, "loss": 0.8777, "step": 33202 }, { "epoch": 0.63, "learning_rate": 1.6172246826961113e-06, "loss": 0.8442, "step": 33203 }, { "epoch": 0.63, "learning_rate": 1.6170817596964571e-06, "loss": 0.9039, "step": 33204 }, { "epoch": 0.63, "learning_rate": 1.6169388399935939e-06, "loss": 0.908, "step": 33205 }, { "epoch": 0.63, "learning_rate": 1.616795923588054e-06, "loss": 0.9682, "step": 33206 }, { "epoch": 0.63, "learning_rate": 1.6166530104803699e-06, "loss": 1.1561, "step": 33207 }, { "epoch": 0.63, "learning_rate": 1.6165101006710776e-06, "loss": 0.7313, "step": 33208 }, { "epoch": 0.63, "learning_rate": 1.6163671941607087e-06, "loss": 0.9863, "step": 33209 }, { "epoch": 0.63, "learning_rate": 1.6162242909497972e-06, "loss": 0.8797, "step": 33210 }, { "epoch": 0.63, "learning_rate": 1.6160813910388782e-06, "loss": 1.0735, "step": 33211 }, { "epoch": 0.63, "learning_rate": 1.6159384944284838e-06, "loss": 1.0074, "step": 33212 }, { "epoch": 0.63, "learning_rate": 1.6157956011191476e-06, "loss": 1.0052, "step": 33213 }, { "epoch": 0.63, "learning_rate": 1.615652711111404e-06, "loss": 0.8934, "step": 33214 }, { "epoch": 0.63, "learning_rate": 1.615509824405786e-06, "loss": 0.891, "step": 33215 }, { "epoch": 0.63, "learning_rate": 1.6153669410028266e-06, "loss": 0.7784, "step": 33216 }, { "epoch": 0.63, "learning_rate": 1.6152240609030604e-06, "loss": 0.8156, "step": 33217 }, { "epoch": 0.63, "learning_rate": 1.6150811841070209e-06, "loss": 1.014, "step": 33218 }, { "epoch": 0.63, "learning_rate": 1.6149383106152399e-06, "loss": 0.8815, "step": 33219 }, { "epoch": 0.63, "learning_rate": 1.6147954404282533e-06, "loss": 0.7541, "step": 33220 }, { "epoch": 0.63, "learning_rate": 1.6146525735465935e-06, "loss": 0.908, "step": 33221 }, { "epoch": 0.63, "learning_rate": 1.6145097099707924e-06, "loss": 0.9084, "step": 33222 }, { "epoch": 0.63, "learning_rate": 1.6143668497013857e-06, "loss": 0.8892, "step": 33223 }, { "epoch": 0.63, "learning_rate": 1.6142239927389064e-06, "loss": 0.9403, "step": 33224 }, { "epoch": 0.63, "learning_rate": 1.6140811390838868e-06, "loss": 1.0142, "step": 33225 }, { "epoch": 0.63, "learning_rate": 1.6139382887368616e-06, "loss": 0.8991, "step": 33226 }, { "epoch": 0.63, "learning_rate": 1.6137954416983643e-06, "loss": 0.8748, "step": 33227 }, { "epoch": 0.63, "learning_rate": 1.613652597968926e-06, "loss": 0.9194, "step": 33228 }, { "epoch": 0.63, "learning_rate": 1.6135097575490832e-06, "loss": 0.821, "step": 33229 }, { "epoch": 0.63, "learning_rate": 1.613366920439367e-06, "loss": 0.8456, "step": 33230 }, { "epoch": 0.63, "learning_rate": 1.613224086640311e-06, "loss": 1.2907, "step": 33231 }, { "epoch": 0.63, "learning_rate": 1.6130812561524503e-06, "loss": 0.9857, "step": 33232 }, { "epoch": 0.63, "learning_rate": 1.612938428976317e-06, "loss": 0.9541, "step": 33233 }, { "epoch": 0.63, "learning_rate": 1.6127956051124433e-06, "loss": 0.8897, "step": 33234 }, { "epoch": 0.63, "learning_rate": 1.6126527845613646e-06, "loss": 0.789, "step": 33235 }, { "epoch": 0.63, "learning_rate": 1.6125099673236128e-06, "loss": 0.9713, "step": 33236 }, { "epoch": 0.63, "learning_rate": 1.6123671533997216e-06, "loss": 1.1884, "step": 33237 }, { "epoch": 0.63, "learning_rate": 1.612224342790224e-06, "loss": 0.9413, "step": 33238 }, { "epoch": 0.63, "learning_rate": 1.612081535495654e-06, "loss": 0.8953, "step": 33239 }, { "epoch": 0.63, "learning_rate": 1.6119387315165435e-06, "loss": 0.9345, "step": 33240 }, { "epoch": 0.63, "learning_rate": 1.6117959308534276e-06, "loss": 0.8161, "step": 33241 }, { "epoch": 0.63, "learning_rate": 1.6116531335068381e-06, "loss": 0.8165, "step": 33242 }, { "epoch": 0.63, "learning_rate": 1.611510339477308e-06, "loss": 0.9149, "step": 33243 }, { "epoch": 0.63, "learning_rate": 1.6113675487653713e-06, "loss": 1.1925, "step": 33244 }, { "epoch": 0.63, "learning_rate": 1.6112247613715614e-06, "loss": 0.9863, "step": 33245 }, { "epoch": 0.63, "learning_rate": 1.6110819772964101e-06, "loss": 0.7314, "step": 33246 }, { "epoch": 0.63, "learning_rate": 1.6109391965404525e-06, "loss": 1.0086, "step": 33247 }, { "epoch": 0.63, "learning_rate": 1.6107964191042206e-06, "loss": 0.9459, "step": 33248 }, { "epoch": 0.63, "learning_rate": 1.6106536449882465e-06, "loss": 0.9742, "step": 33249 }, { "epoch": 0.63, "learning_rate": 1.6105108741930656e-06, "loss": 1.116, "step": 33250 }, { "epoch": 0.63, "learning_rate": 1.6103681067192093e-06, "loss": 1.0894, "step": 33251 }, { "epoch": 0.63, "learning_rate": 1.6102253425672104e-06, "loss": 0.8323, "step": 33252 }, { "epoch": 0.63, "learning_rate": 1.6100825817376042e-06, "loss": 0.9306, "step": 33253 }, { "epoch": 0.63, "learning_rate": 1.6099398242309222e-06, "loss": 0.8008, "step": 33254 }, { "epoch": 0.63, "learning_rate": 1.6097970700476966e-06, "loss": 0.9507, "step": 33255 }, { "epoch": 0.63, "learning_rate": 1.6096543191884625e-06, "loss": 0.8635, "step": 33256 }, { "epoch": 0.63, "learning_rate": 1.6095115716537512e-06, "loss": 1.0029, "step": 33257 }, { "epoch": 0.63, "learning_rate": 1.6093688274440971e-06, "loss": 0.918, "step": 33258 }, { "epoch": 0.63, "learning_rate": 1.6092260865600315e-06, "loss": 0.9965, "step": 33259 }, { "epoch": 0.63, "learning_rate": 1.609083349002089e-06, "loss": 0.8156, "step": 33260 }, { "epoch": 0.63, "learning_rate": 1.6089406147708026e-06, "loss": 0.6969, "step": 33261 }, { "epoch": 0.63, "learning_rate": 1.6087978838667032e-06, "loss": 0.9237, "step": 33262 }, { "epoch": 0.63, "learning_rate": 1.6086551562903264e-06, "loss": 0.9478, "step": 33263 }, { "epoch": 0.63, "learning_rate": 1.608512432042203e-06, "loss": 0.9771, "step": 33264 }, { "epoch": 0.63, "learning_rate": 1.6083697111228668e-06, "loss": 0.6356, "step": 33265 }, { "epoch": 0.63, "learning_rate": 1.6082269935328516e-06, "loss": 0.7951, "step": 33266 }, { "epoch": 0.63, "learning_rate": 1.608084279272689e-06, "loss": 0.789, "step": 33267 }, { "epoch": 0.63, "learning_rate": 1.6079415683429123e-06, "loss": 0.9776, "step": 33268 }, { "epoch": 0.63, "learning_rate": 1.6077988607440547e-06, "loss": 1.0989, "step": 33269 }, { "epoch": 0.63, "learning_rate": 1.6076561564766486e-06, "loss": 0.79, "step": 33270 }, { "epoch": 0.63, "learning_rate": 1.607513455541227e-06, "loss": 0.772, "step": 33271 }, { "epoch": 0.63, "learning_rate": 1.6073707579383227e-06, "loss": 0.7529, "step": 33272 }, { "epoch": 0.63, "learning_rate": 1.6072280636684692e-06, "loss": 1.0434, "step": 33273 }, { "epoch": 0.63, "learning_rate": 1.6070853727321979e-06, "loss": 0.748, "step": 33274 }, { "epoch": 0.63, "learning_rate": 1.606942685130043e-06, "loss": 0.9264, "step": 33275 }, { "epoch": 0.63, "learning_rate": 1.6068000008625373e-06, "loss": 0.7043, "step": 33276 }, { "epoch": 0.63, "learning_rate": 1.6066573199302117e-06, "loss": 0.7906, "step": 33277 }, { "epoch": 0.63, "learning_rate": 1.6065146423336007e-06, "loss": 0.8419, "step": 33278 }, { "epoch": 0.63, "learning_rate": 1.606371968073237e-06, "loss": 0.8898, "step": 33279 }, { "epoch": 0.63, "learning_rate": 1.6062292971496523e-06, "loss": 1.014, "step": 33280 }, { "epoch": 0.63, "learning_rate": 1.606086629563381e-06, "loss": 1.2192, "step": 33281 }, { "epoch": 0.63, "learning_rate": 1.6059439653149545e-06, "loss": 0.8403, "step": 33282 }, { "epoch": 0.63, "learning_rate": 1.6058013044049053e-06, "loss": 0.8118, "step": 33283 }, { "epoch": 0.63, "learning_rate": 1.605658646833767e-06, "loss": 1.0271, "step": 33284 }, { "epoch": 0.63, "learning_rate": 1.605515992602072e-06, "loss": 0.8089, "step": 33285 }, { "epoch": 0.63, "learning_rate": 1.605373341710352e-06, "loss": 0.8062, "step": 33286 }, { "epoch": 0.63, "learning_rate": 1.6052306941591417e-06, "loss": 0.889, "step": 33287 }, { "epoch": 0.63, "learning_rate": 1.6050880499489724e-06, "loss": 0.8687, "step": 33288 }, { "epoch": 0.63, "learning_rate": 1.604945409080376e-06, "loss": 0.9666, "step": 33289 }, { "epoch": 0.63, "learning_rate": 1.604802771553887e-06, "loss": 0.9006, "step": 33290 }, { "epoch": 0.63, "learning_rate": 1.6046601373700363e-06, "loss": 1.0679, "step": 33291 }, { "epoch": 0.63, "learning_rate": 1.6045175065293573e-06, "loss": 0.7618, "step": 33292 }, { "epoch": 0.63, "learning_rate": 1.6043748790323826e-06, "loss": 0.96, "step": 33293 }, { "epoch": 0.63, "learning_rate": 1.6042322548796451e-06, "loss": 1.0387, "step": 33294 }, { "epoch": 0.63, "learning_rate": 1.6040896340716758e-06, "loss": 0.942, "step": 33295 }, { "epoch": 0.63, "learning_rate": 1.6039470166090094e-06, "loss": 0.9181, "step": 33296 }, { "epoch": 0.63, "learning_rate": 1.6038044024921773e-06, "loss": 0.971, "step": 33297 }, { "epoch": 0.63, "learning_rate": 1.6036617917217112e-06, "loss": 0.7349, "step": 33298 }, { "epoch": 0.63, "learning_rate": 1.603519184298145e-06, "loss": 0.713, "step": 33299 }, { "epoch": 0.63, "learning_rate": 1.6033765802220109e-06, "loss": 1.0291, "step": 33300 }, { "epoch": 0.63, "learning_rate": 1.6032339794938406e-06, "loss": 0.8696, "step": 33301 }, { "epoch": 0.63, "learning_rate": 1.6030913821141678e-06, "loss": 0.7816, "step": 33302 }, { "epoch": 0.63, "learning_rate": 1.6029487880835243e-06, "loss": 0.998, "step": 33303 }, { "epoch": 0.63, "learning_rate": 1.6028061974024417e-06, "loss": 0.8068, "step": 33304 }, { "epoch": 0.63, "learning_rate": 1.602663610071454e-06, "loss": 0.8788, "step": 33305 }, { "epoch": 0.63, "learning_rate": 1.6025210260910926e-06, "loss": 1.0103, "step": 33306 }, { "epoch": 0.63, "learning_rate": 1.6023784454618896e-06, "loss": 1.063, "step": 33307 }, { "epoch": 0.63, "learning_rate": 1.602235868184379e-06, "loss": 0.9754, "step": 33308 }, { "epoch": 0.63, "learning_rate": 1.602093294259092e-06, "loss": 0.905, "step": 33309 }, { "epoch": 0.63, "learning_rate": 1.60195072368656e-06, "loss": 0.7892, "step": 33310 }, { "epoch": 0.63, "learning_rate": 1.6018081564673176e-06, "loss": 0.8023, "step": 33311 }, { "epoch": 0.63, "learning_rate": 1.6016655926018959e-06, "loss": 0.9266, "step": 33312 }, { "epoch": 0.63, "learning_rate": 1.6015230320908269e-06, "loss": 0.9632, "step": 33313 }, { "epoch": 0.63, "learning_rate": 1.6013804749346434e-06, "loss": 0.9188, "step": 33314 }, { "epoch": 0.63, "learning_rate": 1.601237921133878e-06, "loss": 0.9628, "step": 33315 }, { "epoch": 0.63, "learning_rate": 1.6010953706890619e-06, "loss": 0.7392, "step": 33316 }, { "epoch": 0.63, "learning_rate": 1.6009528236007294e-06, "loss": 1.0785, "step": 33317 }, { "epoch": 0.63, "learning_rate": 1.6008102798694108e-06, "loss": 1.0723, "step": 33318 }, { "epoch": 0.63, "learning_rate": 1.6006677394956385e-06, "loss": 1.3005, "step": 33319 }, { "epoch": 0.63, "learning_rate": 1.6005252024799455e-06, "loss": 0.9767, "step": 33320 }, { "epoch": 0.63, "learning_rate": 1.6003826688228645e-06, "loss": 1.0814, "step": 33321 }, { "epoch": 0.63, "learning_rate": 1.600240138524926e-06, "loss": 0.8199, "step": 33322 }, { "epoch": 0.63, "learning_rate": 1.6000976115866646e-06, "loss": 0.8771, "step": 33323 }, { "epoch": 0.63, "learning_rate": 1.5999550880086106e-06, "loss": 1.1768, "step": 33324 }, { "epoch": 0.63, "learning_rate": 1.5998125677912961e-06, "loss": 1.1141, "step": 33325 }, { "epoch": 0.63, "learning_rate": 1.5996700509352547e-06, "loss": 1.1132, "step": 33326 }, { "epoch": 0.63, "learning_rate": 1.5995275374410172e-06, "loss": 0.9481, "step": 33327 }, { "epoch": 0.63, "learning_rate": 1.5993850273091155e-06, "loss": 0.7959, "step": 33328 }, { "epoch": 0.63, "learning_rate": 1.599242520540084e-06, "loss": 0.7632, "step": 33329 }, { "epoch": 0.63, "learning_rate": 1.5991000171344527e-06, "loss": 0.9843, "step": 33330 }, { "epoch": 0.63, "learning_rate": 1.5989575170927541e-06, "loss": 0.9878, "step": 33331 }, { "epoch": 0.63, "learning_rate": 1.5988150204155212e-06, "loss": 0.9089, "step": 33332 }, { "epoch": 0.63, "learning_rate": 1.5986725271032847e-06, "loss": 0.9394, "step": 33333 }, { "epoch": 0.63, "learning_rate": 1.5985300371565773e-06, "loss": 1.0634, "step": 33334 }, { "epoch": 0.63, "learning_rate": 1.5983875505759311e-06, "loss": 0.7541, "step": 33335 }, { "epoch": 0.63, "learning_rate": 1.5982450673618788e-06, "loss": 0.8124, "step": 33336 }, { "epoch": 0.63, "learning_rate": 1.5981025875149509e-06, "loss": 1.061, "step": 33337 }, { "epoch": 0.63, "learning_rate": 1.597960111035681e-06, "loss": 1.0057, "step": 33338 }, { "epoch": 0.63, "learning_rate": 1.5978176379246007e-06, "loss": 0.8643, "step": 33339 }, { "epoch": 0.63, "learning_rate": 1.5976751681822403e-06, "loss": 0.7663, "step": 33340 }, { "epoch": 0.63, "learning_rate": 1.5975327018091338e-06, "loss": 0.9547, "step": 33341 }, { "epoch": 0.63, "learning_rate": 1.5973902388058133e-06, "loss": 0.8686, "step": 33342 }, { "epoch": 0.63, "learning_rate": 1.5972477791728086e-06, "loss": 0.9789, "step": 33343 }, { "epoch": 0.63, "learning_rate": 1.5971053229106542e-06, "loss": 0.9531, "step": 33344 }, { "epoch": 0.63, "learning_rate": 1.5969628700198808e-06, "loss": 0.8572, "step": 33345 }, { "epoch": 0.63, "learning_rate": 1.5968204205010194e-06, "loss": 0.8159, "step": 33346 }, { "epoch": 0.63, "learning_rate": 1.5966779743546038e-06, "loss": 0.9184, "step": 33347 }, { "epoch": 0.63, "learning_rate": 1.5965355315811642e-06, "loss": 0.8088, "step": 33348 }, { "epoch": 0.63, "learning_rate": 1.596393092181233e-06, "loss": 0.9238, "step": 33349 }, { "epoch": 0.63, "learning_rate": 1.5962506561553433e-06, "loss": 0.845, "step": 33350 }, { "epoch": 0.63, "learning_rate": 1.596108223504026e-06, "loss": 0.9219, "step": 33351 }, { "epoch": 0.63, "learning_rate": 1.5959657942278117e-06, "loss": 0.6638, "step": 33352 }, { "epoch": 0.63, "learning_rate": 1.5958233683272345e-06, "loss": 0.7368, "step": 33353 }, { "epoch": 0.63, "learning_rate": 1.5956809458028246e-06, "loss": 1.0555, "step": 33354 }, { "epoch": 0.63, "learning_rate": 1.5955385266551143e-06, "loss": 0.9761, "step": 33355 }, { "epoch": 0.63, "learning_rate": 1.5953961108846356e-06, "loss": 1.0477, "step": 33356 }, { "epoch": 0.63, "learning_rate": 1.5952536984919203e-06, "loss": 0.9351, "step": 33357 }, { "epoch": 0.63, "learning_rate": 1.5951112894774991e-06, "loss": 0.7664, "step": 33358 }, { "epoch": 0.63, "learning_rate": 1.594968883841906e-06, "loss": 0.841, "step": 33359 }, { "epoch": 0.63, "learning_rate": 1.5948264815856708e-06, "loss": 0.8788, "step": 33360 }, { "epoch": 0.63, "learning_rate": 1.5946840827093247e-06, "loss": 0.7596, "step": 33361 }, { "epoch": 0.63, "learning_rate": 1.5945416872134011e-06, "loss": 1.001, "step": 33362 }, { "epoch": 0.63, "learning_rate": 1.5943992950984316e-06, "loss": 0.8795, "step": 33363 }, { "epoch": 0.63, "learning_rate": 1.5942569063649466e-06, "loss": 1.1497, "step": 33364 }, { "epoch": 0.63, "learning_rate": 1.5941145210134792e-06, "loss": 1.0004, "step": 33365 }, { "epoch": 0.63, "learning_rate": 1.5939721390445607e-06, "loss": 0.8561, "step": 33366 }, { "epoch": 0.63, "learning_rate": 1.5938297604587211e-06, "loss": 0.7804, "step": 33367 }, { "epoch": 0.63, "learning_rate": 1.5936873852564949e-06, "loss": 0.929, "step": 33368 }, { "epoch": 0.63, "learning_rate": 1.5935450134384111e-06, "loss": 1.0162, "step": 33369 }, { "epoch": 0.63, "learning_rate": 1.5934026450050022e-06, "loss": 1.1748, "step": 33370 }, { "epoch": 0.63, "learning_rate": 1.593260279956801e-06, "loss": 0.731, "step": 33371 }, { "epoch": 0.63, "learning_rate": 1.5931179182943385e-06, "loss": 0.8355, "step": 33372 }, { "epoch": 0.63, "learning_rate": 1.5929755600181446e-06, "loss": 0.7617, "step": 33373 }, { "epoch": 0.63, "learning_rate": 1.5928332051287531e-06, "loss": 1.1016, "step": 33374 }, { "epoch": 0.63, "learning_rate": 1.5926908536266938e-06, "loss": 1.071, "step": 33375 }, { "epoch": 0.63, "learning_rate": 1.5925485055124995e-06, "loss": 1.0546, "step": 33376 }, { "epoch": 0.63, "learning_rate": 1.5924061607867012e-06, "loss": 1.0106, "step": 33377 }, { "epoch": 0.63, "learning_rate": 1.5922638194498307e-06, "loss": 0.9561, "step": 33378 }, { "epoch": 0.63, "learning_rate": 1.5921214815024185e-06, "loss": 0.835, "step": 33379 }, { "epoch": 0.63, "learning_rate": 1.591979146944998e-06, "loss": 0.8435, "step": 33380 }, { "epoch": 0.63, "learning_rate": 1.5918368157780993e-06, "loss": 1.1486, "step": 33381 }, { "epoch": 0.63, "learning_rate": 1.5916944880022527e-06, "loss": 0.8284, "step": 33382 }, { "epoch": 0.63, "learning_rate": 1.591552163617992e-06, "loss": 0.9638, "step": 33383 }, { "epoch": 0.63, "learning_rate": 1.5914098426258483e-06, "loss": 0.9632, "step": 33384 }, { "epoch": 0.63, "learning_rate": 1.591267525026351e-06, "loss": 0.8011, "step": 33385 }, { "epoch": 0.63, "learning_rate": 1.5911252108200343e-06, "loss": 0.767, "step": 33386 }, { "epoch": 0.63, "learning_rate": 1.5909829000074277e-06, "loss": 0.9907, "step": 33387 }, { "epoch": 0.63, "learning_rate": 1.5908405925890624e-06, "loss": 1.0137, "step": 33388 }, { "epoch": 0.63, "learning_rate": 1.5906982885654716e-06, "loss": 0.9503, "step": 33389 }, { "epoch": 0.63, "learning_rate": 1.5905559879371848e-06, "loss": 0.9446, "step": 33390 }, { "epoch": 0.63, "learning_rate": 1.5904136907047335e-06, "loss": 0.8477, "step": 33391 }, { "epoch": 0.63, "learning_rate": 1.5902713968686505e-06, "loss": 0.9268, "step": 33392 }, { "epoch": 0.63, "learning_rate": 1.5901291064294666e-06, "loss": 0.9425, "step": 33393 }, { "epoch": 0.63, "learning_rate": 1.5899868193877115e-06, "loss": 0.9237, "step": 33394 }, { "epoch": 0.63, "learning_rate": 1.5898445357439188e-06, "loss": 0.9438, "step": 33395 }, { "epoch": 0.63, "learning_rate": 1.589702255498618e-06, "loss": 0.8044, "step": 33396 }, { "epoch": 0.63, "learning_rate": 1.5895599786523414e-06, "loss": 1.06, "step": 33397 }, { "epoch": 0.63, "learning_rate": 1.5894177052056197e-06, "loss": 0.8745, "step": 33398 }, { "epoch": 0.63, "learning_rate": 1.5892754351589848e-06, "loss": 0.9344, "step": 33399 }, { "epoch": 0.63, "learning_rate": 1.5891331685129665e-06, "loss": 0.8311, "step": 33400 }, { "epoch": 0.63, "learning_rate": 1.5889909052680983e-06, "loss": 1.0521, "step": 33401 }, { "epoch": 0.63, "learning_rate": 1.5888486454249097e-06, "loss": 0.6582, "step": 33402 }, { "epoch": 0.63, "learning_rate": 1.5887063889839315e-06, "loss": 0.8086, "step": 33403 }, { "epoch": 0.63, "learning_rate": 1.5885641359456966e-06, "loss": 0.9982, "step": 33404 }, { "epoch": 0.63, "learning_rate": 1.5884218863107354e-06, "loss": 0.8238, "step": 33405 }, { "epoch": 0.63, "learning_rate": 1.5882796400795778e-06, "loss": 1.0044, "step": 33406 }, { "epoch": 0.63, "learning_rate": 1.5881373972527573e-06, "loss": 0.9172, "step": 33407 }, { "epoch": 0.63, "learning_rate": 1.5879951578308036e-06, "loss": 0.8504, "step": 33408 }, { "epoch": 0.63, "learning_rate": 1.5878529218142471e-06, "loss": 0.912, "step": 33409 }, { "epoch": 0.63, "learning_rate": 1.587710689203621e-06, "loss": 0.9206, "step": 33410 }, { "epoch": 0.63, "learning_rate": 1.5875684599994545e-06, "loss": 0.7667, "step": 33411 }, { "epoch": 0.63, "learning_rate": 1.587426234202279e-06, "loss": 1.068, "step": 33412 }, { "epoch": 0.63, "learning_rate": 1.587284011812627e-06, "loss": 1.0622, "step": 33413 }, { "epoch": 0.63, "learning_rate": 1.5871417928310285e-06, "loss": 1.0825, "step": 33414 }, { "epoch": 0.63, "learning_rate": 1.5869995772580133e-06, "loss": 1.1063, "step": 33415 }, { "epoch": 0.63, "learning_rate": 1.586857365094115e-06, "loss": 0.7566, "step": 33416 }, { "epoch": 0.63, "learning_rate": 1.5867151563398626e-06, "loss": 0.8478, "step": 33417 }, { "epoch": 0.63, "learning_rate": 1.5865729509957877e-06, "loss": 1.1995, "step": 33418 }, { "epoch": 0.63, "learning_rate": 1.5864307490624221e-06, "loss": 0.9218, "step": 33419 }, { "epoch": 0.63, "learning_rate": 1.5862885505402958e-06, "loss": 0.8074, "step": 33420 }, { "epoch": 0.63, "learning_rate": 1.5861463554299394e-06, "loss": 0.942, "step": 33421 }, { "epoch": 0.63, "learning_rate": 1.586004163731885e-06, "loss": 0.7374, "step": 33422 }, { "epoch": 0.63, "learning_rate": 1.5858619754466637e-06, "loss": 0.9276, "step": 33423 }, { "epoch": 0.63, "learning_rate": 1.5857197905748045e-06, "loss": 0.9794, "step": 33424 }, { "epoch": 0.63, "learning_rate": 1.58557760911684e-06, "loss": 1.0654, "step": 33425 }, { "epoch": 0.63, "learning_rate": 1.5854354310733012e-06, "loss": 0.899, "step": 33426 }, { "epoch": 0.63, "learning_rate": 1.5852932564447177e-06, "loss": 0.7942, "step": 33427 }, { "epoch": 0.63, "learning_rate": 1.5851510852316218e-06, "loss": 0.7751, "step": 33428 }, { "epoch": 0.63, "learning_rate": 1.5850089174345437e-06, "loss": 0.7183, "step": 33429 }, { "epoch": 0.63, "learning_rate": 1.5848667530540134e-06, "loss": 0.8812, "step": 33430 }, { "epoch": 0.63, "learning_rate": 1.5847245920905636e-06, "loss": 1.0731, "step": 33431 }, { "epoch": 0.63, "learning_rate": 1.5845824345447236e-06, "loss": 0.9768, "step": 33432 }, { "epoch": 0.63, "learning_rate": 1.584440280417024e-06, "loss": 0.9172, "step": 33433 }, { "epoch": 0.63, "learning_rate": 1.5842981297079977e-06, "loss": 0.9675, "step": 33434 }, { "epoch": 0.63, "learning_rate": 1.5841559824181738e-06, "loss": 0.852, "step": 33435 }, { "epoch": 0.63, "learning_rate": 1.5840138385480824e-06, "loss": 0.8424, "step": 33436 }, { "epoch": 0.63, "learning_rate": 1.5838716980982565e-06, "loss": 0.9728, "step": 33437 }, { "epoch": 0.63, "learning_rate": 1.583729561069225e-06, "loss": 0.9423, "step": 33438 }, { "epoch": 0.63, "learning_rate": 1.583587427461519e-06, "loss": 0.7958, "step": 33439 }, { "epoch": 0.63, "learning_rate": 1.5834452972756695e-06, "loss": 0.8924, "step": 33440 }, { "epoch": 0.63, "learning_rate": 1.5833031705122076e-06, "loss": 0.5732, "step": 33441 }, { "epoch": 0.63, "learning_rate": 1.583161047171663e-06, "loss": 0.7639, "step": 33442 }, { "epoch": 0.63, "learning_rate": 1.5830189272545676e-06, "loss": 0.6987, "step": 33443 }, { "epoch": 0.63, "learning_rate": 1.5828768107614514e-06, "loss": 1.1161, "step": 33444 }, { "epoch": 0.63, "learning_rate": 1.5827346976928442e-06, "loss": 0.9456, "step": 33445 }, { "epoch": 0.63, "learning_rate": 1.582592588049278e-06, "loss": 0.9655, "step": 33446 }, { "epoch": 0.63, "learning_rate": 1.582450481831283e-06, "loss": 0.7637, "step": 33447 }, { "epoch": 0.63, "learning_rate": 1.5823083790393894e-06, "loss": 0.7136, "step": 33448 }, { "epoch": 0.63, "learning_rate": 1.5821662796741288e-06, "loss": 1.0457, "step": 33449 }, { "epoch": 0.63, "learning_rate": 1.5820241837360314e-06, "loss": 1.0322, "step": 33450 }, { "epoch": 0.63, "learning_rate": 1.5818820912256267e-06, "loss": 1.0075, "step": 33451 }, { "epoch": 0.63, "learning_rate": 1.5817400021434464e-06, "loss": 0.9323, "step": 33452 }, { "epoch": 0.63, "learning_rate": 1.5815979164900207e-06, "loss": 0.7369, "step": 33453 }, { "epoch": 0.63, "learning_rate": 1.5814558342658802e-06, "loss": 0.9202, "step": 33454 }, { "epoch": 0.63, "learning_rate": 1.5813137554715558e-06, "loss": 1.0889, "step": 33455 }, { "epoch": 0.63, "learning_rate": 1.581171680107578e-06, "loss": 0.9772, "step": 33456 }, { "epoch": 0.63, "learning_rate": 1.5810296081744759e-06, "loss": 0.8638, "step": 33457 }, { "epoch": 0.63, "learning_rate": 1.580887539672782e-06, "loss": 1.0226, "step": 33458 }, { "epoch": 0.63, "learning_rate": 1.5807454746030254e-06, "loss": 1.0451, "step": 33459 }, { "epoch": 0.63, "learning_rate": 1.5806034129657368e-06, "loss": 1.1111, "step": 33460 }, { "epoch": 0.63, "learning_rate": 1.5804613547614472e-06, "loss": 0.8572, "step": 33461 }, { "epoch": 0.63, "learning_rate": 1.580319299990687e-06, "loss": 0.8466, "step": 33462 }, { "epoch": 0.63, "learning_rate": 1.5801772486539854e-06, "loss": 1.015, "step": 33463 }, { "epoch": 0.63, "learning_rate": 1.5800352007518748e-06, "loss": 1.0547, "step": 33464 }, { "epoch": 0.63, "learning_rate": 1.5798931562848846e-06, "loss": 0.7197, "step": 33465 }, { "epoch": 0.63, "learning_rate": 1.5797511152535438e-06, "loss": 0.7646, "step": 33466 }, { "epoch": 0.63, "learning_rate": 1.579609077658385e-06, "loss": 0.9693, "step": 33467 }, { "epoch": 0.63, "learning_rate": 1.5794670434999382e-06, "loss": 1.0615, "step": 33468 }, { "epoch": 0.63, "learning_rate": 1.5793250127787318e-06, "loss": 0.9932, "step": 33469 }, { "epoch": 0.63, "learning_rate": 1.579182985495299e-06, "loss": 0.8108, "step": 33470 }, { "epoch": 0.63, "learning_rate": 1.5790409616501684e-06, "loss": 0.8798, "step": 33471 }, { "epoch": 0.63, "learning_rate": 1.5788989412438698e-06, "loss": 1.0041, "step": 33472 }, { "epoch": 0.63, "learning_rate": 1.5787569242769354e-06, "loss": 0.9489, "step": 33473 }, { "epoch": 0.63, "learning_rate": 1.5786149107498938e-06, "loss": 1.1196, "step": 33474 }, { "epoch": 0.63, "learning_rate": 1.5784729006632755e-06, "loss": 1.0178, "step": 33475 }, { "epoch": 0.63, "learning_rate": 1.5783308940176118e-06, "loss": 0.9216, "step": 33476 }, { "epoch": 0.63, "learning_rate": 1.5781888908134323e-06, "loss": 0.9178, "step": 33477 }, { "epoch": 0.63, "learning_rate": 1.5780468910512666e-06, "loss": 1.0275, "step": 33478 }, { "epoch": 0.63, "learning_rate": 1.5779048947316464e-06, "loss": 0.8014, "step": 33479 }, { "epoch": 0.63, "learning_rate": 1.5777629018551005e-06, "loss": 0.992, "step": 33480 }, { "epoch": 0.63, "learning_rate": 1.5776209124221597e-06, "loss": 0.8755, "step": 33481 }, { "epoch": 0.63, "learning_rate": 1.577478926433354e-06, "loss": 0.9255, "step": 33482 }, { "epoch": 0.63, "learning_rate": 1.5773369438892143e-06, "loss": 0.7956, "step": 33483 }, { "epoch": 0.63, "learning_rate": 1.577194964790269e-06, "loss": 0.8521, "step": 33484 }, { "epoch": 0.63, "learning_rate": 1.5770529891370507e-06, "loss": 0.9413, "step": 33485 }, { "epoch": 0.63, "learning_rate": 1.576911016930088e-06, "loss": 0.9288, "step": 33486 }, { "epoch": 0.63, "learning_rate": 1.5767690481699104e-06, "loss": 1.0585, "step": 33487 }, { "epoch": 0.63, "learning_rate": 1.5766270828570494e-06, "loss": 0.8251, "step": 33488 }, { "epoch": 0.63, "learning_rate": 1.576485120992035e-06, "loss": 0.8447, "step": 33489 }, { "epoch": 0.63, "learning_rate": 1.5763431625753966e-06, "loss": 0.8446, "step": 33490 }, { "epoch": 0.63, "learning_rate": 1.5762012076076638e-06, "loss": 0.7505, "step": 33491 }, { "epoch": 0.63, "learning_rate": 1.5760592560893684e-06, "loss": 0.9311, "step": 33492 }, { "epoch": 0.63, "learning_rate": 1.5759173080210387e-06, "loss": 1.0692, "step": 33493 }, { "epoch": 0.63, "learning_rate": 1.5757753634032056e-06, "loss": 1.0236, "step": 33494 }, { "epoch": 0.63, "learning_rate": 1.575633422236399e-06, "loss": 0.8986, "step": 33495 }, { "epoch": 0.63, "learning_rate": 1.575491484521149e-06, "loss": 1.1661, "step": 33496 }, { "epoch": 0.63, "learning_rate": 1.5753495502579846e-06, "loss": 0.8228, "step": 33497 }, { "epoch": 0.63, "learning_rate": 1.5752076194474381e-06, "loss": 0.7548, "step": 33498 }, { "epoch": 0.63, "learning_rate": 1.5750656920900375e-06, "loss": 0.9366, "step": 33499 }, { "epoch": 0.63, "learning_rate": 1.5749237681863123e-06, "loss": 1.0171, "step": 33500 }, { "epoch": 0.63, "learning_rate": 1.5747818477367938e-06, "loss": 0.8756, "step": 33501 }, { "epoch": 0.63, "learning_rate": 1.5746399307420124e-06, "loss": 0.8803, "step": 33502 }, { "epoch": 0.63, "learning_rate": 1.574498017202496e-06, "loss": 0.9587, "step": 33503 }, { "epoch": 0.63, "learning_rate": 1.5743561071187763e-06, "loss": 0.8289, "step": 33504 }, { "epoch": 0.63, "learning_rate": 1.574214200491383e-06, "loss": 0.953, "step": 33505 }, { "epoch": 0.63, "learning_rate": 1.5740722973208439e-06, "loss": 1.0054, "step": 33506 }, { "epoch": 0.63, "learning_rate": 1.5739303976076918e-06, "loss": 1.0483, "step": 33507 }, { "epoch": 0.63, "learning_rate": 1.5737885013524548e-06, "loss": 0.7644, "step": 33508 }, { "epoch": 0.63, "learning_rate": 1.5736466085556622e-06, "loss": 0.8837, "step": 33509 }, { "epoch": 0.63, "learning_rate": 1.5735047192178466e-06, "loss": 0.829, "step": 33510 }, { "epoch": 0.63, "learning_rate": 1.573362833339535e-06, "loss": 1.0614, "step": 33511 }, { "epoch": 0.63, "learning_rate": 1.5732209509212578e-06, "loss": 0.9971, "step": 33512 }, { "epoch": 0.63, "learning_rate": 1.5730790719635457e-06, "loss": 0.9516, "step": 33513 }, { "epoch": 0.63, "learning_rate": 1.5729371964669282e-06, "loss": 0.7507, "step": 33514 }, { "epoch": 0.63, "learning_rate": 1.572795324431934e-06, "loss": 0.9595, "step": 33515 }, { "epoch": 0.63, "learning_rate": 1.5726534558590939e-06, "loss": 1.0881, "step": 33516 }, { "epoch": 0.63, "learning_rate": 1.572511590748938e-06, "loss": 0.5923, "step": 33517 }, { "epoch": 0.63, "learning_rate": 1.5723697291019944e-06, "loss": 0.8526, "step": 33518 }, { "epoch": 0.63, "learning_rate": 1.5722278709187943e-06, "loss": 1.0711, "step": 33519 }, { "epoch": 0.63, "learning_rate": 1.5720860161998674e-06, "loss": 0.8873, "step": 33520 }, { "epoch": 0.63, "learning_rate": 1.5719441649457418e-06, "loss": 0.813, "step": 33521 }, { "epoch": 0.63, "learning_rate": 1.5718023171569486e-06, "loss": 0.9299, "step": 33522 }, { "epoch": 0.63, "learning_rate": 1.5716604728340175e-06, "loss": 0.6938, "step": 33523 }, { "epoch": 0.63, "learning_rate": 1.571518631977477e-06, "loss": 0.9437, "step": 33524 }, { "epoch": 0.63, "learning_rate": 1.5713767945878582e-06, "loss": 1.1345, "step": 33525 }, { "epoch": 0.63, "learning_rate": 1.5712349606656902e-06, "loss": 1.0635, "step": 33526 }, { "epoch": 0.63, "learning_rate": 1.5710931302115013e-06, "loss": 0.7137, "step": 33527 }, { "epoch": 0.63, "learning_rate": 1.5709513032258231e-06, "loss": 0.9417, "step": 33528 }, { "epoch": 0.63, "learning_rate": 1.5708094797091839e-06, "loss": 0.7325, "step": 33529 }, { "epoch": 0.63, "learning_rate": 1.570667659662113e-06, "loss": 0.8365, "step": 33530 }, { "epoch": 0.63, "learning_rate": 1.5705258430851413e-06, "loss": 0.9906, "step": 33531 }, { "epoch": 0.63, "learning_rate": 1.570384029978798e-06, "loss": 1.0119, "step": 33532 }, { "epoch": 0.63, "learning_rate": 1.5702422203436113e-06, "loss": 0.8669, "step": 33533 }, { "epoch": 0.63, "learning_rate": 1.5701004141801125e-06, "loss": 0.963, "step": 33534 }, { "epoch": 0.63, "learning_rate": 1.5699586114888294e-06, "loss": 0.9743, "step": 33535 }, { "epoch": 0.63, "learning_rate": 1.5698168122702929e-06, "loss": 0.9879, "step": 33536 }, { "epoch": 0.63, "learning_rate": 1.5696750165250312e-06, "loss": 1.0039, "step": 33537 }, { "epoch": 0.63, "learning_rate": 1.5695332242535754e-06, "loss": 1.1077, "step": 33538 }, { "epoch": 0.63, "learning_rate": 1.5693914354564533e-06, "loss": 0.8855, "step": 33539 }, { "epoch": 0.63, "learning_rate": 1.5692496501341955e-06, "loss": 0.7925, "step": 33540 }, { "epoch": 0.63, "learning_rate": 1.5691078682873313e-06, "loss": 0.9265, "step": 33541 }, { "epoch": 0.63, "learning_rate": 1.5689660899163887e-06, "loss": 0.8767, "step": 33542 }, { "epoch": 0.63, "learning_rate": 1.5688243150218985e-06, "loss": 0.8893, "step": 33543 }, { "epoch": 0.63, "learning_rate": 1.5686825436043906e-06, "loss": 1.2067, "step": 33544 }, { "epoch": 0.63, "learning_rate": 1.5685407756643922e-06, "loss": 0.6843, "step": 33545 }, { "epoch": 0.63, "learning_rate": 1.5683990112024352e-06, "loss": 0.9339, "step": 33546 }, { "epoch": 0.63, "learning_rate": 1.5682572502190476e-06, "loss": 0.7502, "step": 33547 }, { "epoch": 0.63, "learning_rate": 1.568115492714758e-06, "loss": 0.8095, "step": 33548 }, { "epoch": 0.63, "learning_rate": 1.5679737386900975e-06, "loss": 1.1463, "step": 33549 }, { "epoch": 0.63, "learning_rate": 1.567831988145594e-06, "loss": 1.0863, "step": 33550 }, { "epoch": 0.63, "learning_rate": 1.567690241081777e-06, "loss": 0.8661, "step": 33551 }, { "epoch": 0.63, "learning_rate": 1.5675484974991767e-06, "loss": 0.9872, "step": 33552 }, { "epoch": 0.63, "learning_rate": 1.5674067573983216e-06, "loss": 0.7989, "step": 33553 }, { "epoch": 0.63, "learning_rate": 1.5672650207797402e-06, "loss": 0.7632, "step": 33554 }, { "epoch": 0.63, "learning_rate": 1.567123287643964e-06, "loss": 1.006, "step": 33555 }, { "epoch": 0.63, "learning_rate": 1.56698155799152e-06, "loss": 1.1536, "step": 33556 }, { "epoch": 0.63, "learning_rate": 1.5668398318229384e-06, "loss": 0.9429, "step": 33557 }, { "epoch": 0.63, "learning_rate": 1.5666981091387478e-06, "loss": 0.6434, "step": 33558 }, { "epoch": 0.63, "learning_rate": 1.566556389939479e-06, "loss": 0.8823, "step": 33559 }, { "epoch": 0.63, "learning_rate": 1.5664146742256587e-06, "loss": 0.965, "step": 33560 }, { "epoch": 0.63, "learning_rate": 1.5662729619978184e-06, "loss": 0.8155, "step": 33561 }, { "epoch": 0.63, "learning_rate": 1.5661312532564863e-06, "loss": 1.0217, "step": 33562 }, { "epoch": 0.63, "learning_rate": 1.5659895480021903e-06, "loss": 1.0104, "step": 33563 }, { "epoch": 0.63, "learning_rate": 1.5658478462354614e-06, "loss": 0.8342, "step": 33564 }, { "epoch": 0.63, "learning_rate": 1.5657061479568286e-06, "loss": 0.9372, "step": 33565 }, { "epoch": 0.63, "learning_rate": 1.5655644531668191e-06, "loss": 0.9424, "step": 33566 }, { "epoch": 0.63, "learning_rate": 1.5654227618659643e-06, "loss": 0.9331, "step": 33567 }, { "epoch": 0.63, "learning_rate": 1.5652810740547925e-06, "loss": 1.156, "step": 33568 }, { "epoch": 0.63, "learning_rate": 1.5651393897338313e-06, "loss": 0.9057, "step": 33569 }, { "epoch": 0.63, "learning_rate": 1.564997708903612e-06, "loss": 0.8923, "step": 33570 }, { "epoch": 0.63, "learning_rate": 1.5648560315646621e-06, "loss": 0.8033, "step": 33571 }, { "epoch": 0.63, "learning_rate": 1.5647143577175105e-06, "loss": 0.8661, "step": 33572 }, { "epoch": 0.63, "learning_rate": 1.564572687362688e-06, "loss": 0.8073, "step": 33573 }, { "epoch": 0.63, "learning_rate": 1.5644310205007223e-06, "loss": 0.8885, "step": 33574 }, { "epoch": 0.63, "learning_rate": 1.5642893571321416e-06, "loss": 1.0809, "step": 33575 }, { "epoch": 0.63, "learning_rate": 1.5641476972574765e-06, "loss": 0.9858, "step": 33576 }, { "epoch": 0.63, "learning_rate": 1.5640060408772547e-06, "loss": 0.9207, "step": 33577 }, { "epoch": 0.63, "learning_rate": 1.5638643879920059e-06, "loss": 0.9491, "step": 33578 }, { "epoch": 0.63, "learning_rate": 1.5637227386022585e-06, "loss": 0.9434, "step": 33579 }, { "epoch": 0.63, "learning_rate": 1.5635810927085426e-06, "loss": 0.921, "step": 33580 }, { "epoch": 0.63, "learning_rate": 1.5634394503113849e-06, "loss": 1.0788, "step": 33581 }, { "epoch": 0.63, "learning_rate": 1.5632978114113168e-06, "loss": 1.0667, "step": 33582 }, { "epoch": 0.63, "learning_rate": 1.5631561760088657e-06, "loss": 0.8766, "step": 33583 }, { "epoch": 0.63, "learning_rate": 1.5630145441045596e-06, "loss": 0.901, "step": 33584 }, { "epoch": 0.63, "learning_rate": 1.5628729156989292e-06, "loss": 0.8421, "step": 33585 }, { "epoch": 0.63, "learning_rate": 1.562731290792503e-06, "loss": 0.6423, "step": 33586 }, { "epoch": 0.63, "learning_rate": 1.5625896693858087e-06, "loss": 0.9816, "step": 33587 }, { "epoch": 0.63, "learning_rate": 1.5624480514793766e-06, "loss": 0.9398, "step": 33588 }, { "epoch": 0.63, "learning_rate": 1.5623064370737344e-06, "loss": 0.7829, "step": 33589 }, { "epoch": 0.63, "learning_rate": 1.5621648261694108e-06, "loss": 1.0756, "step": 33590 }, { "epoch": 0.63, "learning_rate": 1.5620232187669356e-06, "loss": 0.8806, "step": 33591 }, { "epoch": 0.63, "learning_rate": 1.5618816148668366e-06, "loss": 0.7496, "step": 33592 }, { "epoch": 0.63, "learning_rate": 1.5617400144696426e-06, "loss": 1.0154, "step": 33593 }, { "epoch": 0.63, "learning_rate": 1.5615984175758834e-06, "loss": 0.9827, "step": 33594 }, { "epoch": 0.63, "learning_rate": 1.5614568241860867e-06, "loss": 1.0331, "step": 33595 }, { "epoch": 0.63, "learning_rate": 1.561315234300781e-06, "loss": 0.9129, "step": 33596 }, { "epoch": 0.63, "learning_rate": 1.5611736479204959e-06, "loss": 0.8275, "step": 33597 }, { "epoch": 0.63, "learning_rate": 1.5610320650457594e-06, "loss": 1.0015, "step": 33598 }, { "epoch": 0.63, "learning_rate": 1.5608904856771002e-06, "loss": 0.9184, "step": 33599 }, { "epoch": 0.63, "learning_rate": 1.560748909815047e-06, "loss": 1.0875, "step": 33600 }, { "epoch": 0.63, "learning_rate": 1.5606073374601294e-06, "loss": 0.9067, "step": 33601 }, { "epoch": 0.63, "learning_rate": 1.5604657686128743e-06, "loss": 0.8276, "step": 33602 }, { "epoch": 0.63, "learning_rate": 1.560324203273812e-06, "loss": 0.9138, "step": 33603 }, { "epoch": 0.63, "learning_rate": 1.5601826414434702e-06, "loss": 0.9918, "step": 33604 }, { "epoch": 0.63, "learning_rate": 1.5600410831223767e-06, "loss": 0.9037, "step": 33605 }, { "epoch": 0.63, "learning_rate": 1.5598995283110615e-06, "loss": 0.8061, "step": 33606 }, { "epoch": 0.63, "learning_rate": 1.5597579770100532e-06, "loss": 0.7852, "step": 33607 }, { "epoch": 0.63, "learning_rate": 1.5596164292198788e-06, "loss": 1.0115, "step": 33608 }, { "epoch": 0.63, "learning_rate": 1.5594748849410686e-06, "loss": 0.9137, "step": 33609 }, { "epoch": 0.63, "learning_rate": 1.5593333441741505e-06, "loss": 1.1127, "step": 33610 }, { "epoch": 0.63, "learning_rate": 1.559191806919652e-06, "loss": 0.9608, "step": 33611 }, { "epoch": 0.63, "learning_rate": 1.5590502731781032e-06, "loss": 0.9769, "step": 33612 }, { "epoch": 0.63, "learning_rate": 1.5589087429500315e-06, "loss": 0.8306, "step": 33613 }, { "epoch": 0.63, "learning_rate": 1.5587672162359653e-06, "loss": 0.8036, "step": 33614 }, { "epoch": 0.63, "learning_rate": 1.558625693036434e-06, "loss": 1.047, "step": 33615 }, { "epoch": 0.63, "learning_rate": 1.5584841733519658e-06, "loss": 0.7732, "step": 33616 }, { "epoch": 0.63, "learning_rate": 1.5583426571830879e-06, "loss": 1.2855, "step": 33617 }, { "epoch": 0.63, "learning_rate": 1.5582011445303302e-06, "loss": 1.211, "step": 33618 }, { "epoch": 0.63, "learning_rate": 1.5580596353942207e-06, "loss": 0.9177, "step": 33619 }, { "epoch": 0.63, "learning_rate": 1.557918129775287e-06, "loss": 0.8756, "step": 33620 }, { "epoch": 0.63, "learning_rate": 1.5577766276740586e-06, "loss": 0.7487, "step": 33621 }, { "epoch": 0.63, "learning_rate": 1.5576351290910639e-06, "loss": 0.7137, "step": 33622 }, { "epoch": 0.63, "learning_rate": 1.5574936340268297e-06, "loss": 0.7904, "step": 33623 }, { "epoch": 0.63, "learning_rate": 1.557352142481886e-06, "loss": 0.8174, "step": 33624 }, { "epoch": 0.63, "learning_rate": 1.5572106544567608e-06, "loss": 1.2714, "step": 33625 }, { "epoch": 0.63, "learning_rate": 1.5570691699519811e-06, "loss": 0.8971, "step": 33626 }, { "epoch": 0.63, "learning_rate": 1.5569276889680769e-06, "loss": 0.8239, "step": 33627 }, { "epoch": 0.63, "learning_rate": 1.5567862115055759e-06, "loss": 1.0348, "step": 33628 }, { "epoch": 0.63, "learning_rate": 1.556644737565005e-06, "loss": 0.9518, "step": 33629 }, { "epoch": 0.63, "learning_rate": 1.5565032671468956e-06, "loss": 0.8777, "step": 33630 }, { "epoch": 0.63, "learning_rate": 1.5563618002517733e-06, "loss": 0.9191, "step": 33631 }, { "epoch": 0.63, "learning_rate": 1.5562203368801664e-06, "loss": 1.0301, "step": 33632 }, { "epoch": 0.63, "learning_rate": 1.5560788770326052e-06, "loss": 0.8453, "step": 33633 }, { "epoch": 0.63, "learning_rate": 1.5559374207096156e-06, "loss": 0.8706, "step": 33634 }, { "epoch": 0.63, "learning_rate": 1.5557959679117262e-06, "loss": 0.8352, "step": 33635 }, { "epoch": 0.63, "learning_rate": 1.5556545186394666e-06, "loss": 0.9735, "step": 33636 }, { "epoch": 0.63, "learning_rate": 1.5555130728933645e-06, "loss": 0.9294, "step": 33637 }, { "epoch": 0.63, "learning_rate": 1.5553716306739464e-06, "loss": 0.9933, "step": 33638 }, { "epoch": 0.63, "learning_rate": 1.5552301919817428e-06, "loss": 0.8773, "step": 33639 }, { "epoch": 0.63, "learning_rate": 1.55508875681728e-06, "loss": 0.8156, "step": 33640 }, { "epoch": 0.63, "learning_rate": 1.5549473251810871e-06, "loss": 0.8889, "step": 33641 }, { "epoch": 0.63, "learning_rate": 1.5548058970736915e-06, "loss": 0.7922, "step": 33642 }, { "epoch": 0.63, "learning_rate": 1.5546644724956223e-06, "loss": 0.8598, "step": 33643 }, { "epoch": 0.63, "learning_rate": 1.5545230514474064e-06, "loss": 1.009, "step": 33644 }, { "epoch": 0.63, "learning_rate": 1.554381633929573e-06, "loss": 1.092, "step": 33645 }, { "epoch": 0.63, "learning_rate": 1.5542402199426496e-06, "loss": 0.9207, "step": 33646 }, { "epoch": 0.63, "learning_rate": 1.5540988094871635e-06, "loss": 0.8016, "step": 33647 }, { "epoch": 0.63, "learning_rate": 1.5539574025636436e-06, "loss": 0.8304, "step": 33648 }, { "epoch": 0.63, "learning_rate": 1.5538159991726185e-06, "loss": 0.9267, "step": 33649 }, { "epoch": 0.63, "learning_rate": 1.553674599314614e-06, "loss": 1.0304, "step": 33650 }, { "epoch": 0.63, "learning_rate": 1.5535332029901612e-06, "loss": 0.9691, "step": 33651 }, { "epoch": 0.63, "learning_rate": 1.553391810199786e-06, "loss": 0.812, "step": 33652 }, { "epoch": 0.63, "learning_rate": 1.5532504209440158e-06, "loss": 0.6934, "step": 33653 }, { "epoch": 0.63, "learning_rate": 1.5531090352233806e-06, "loss": 0.8546, "step": 33654 }, { "epoch": 0.63, "learning_rate": 1.5529676530384069e-06, "loss": 1.0215, "step": 33655 }, { "epoch": 0.63, "learning_rate": 1.5528262743896222e-06, "loss": 1.2563, "step": 33656 }, { "epoch": 0.64, "learning_rate": 1.5526848992775561e-06, "loss": 1.0219, "step": 33657 }, { "epoch": 0.64, "learning_rate": 1.5525435277027356e-06, "loss": 0.9542, "step": 33658 }, { "epoch": 0.64, "learning_rate": 1.5524021596656875e-06, "loss": 0.9487, "step": 33659 }, { "epoch": 0.64, "learning_rate": 1.5522607951669416e-06, "loss": 0.7832, "step": 33660 }, { "epoch": 0.64, "learning_rate": 1.5521194342070245e-06, "loss": 0.7422, "step": 33661 }, { "epoch": 0.64, "learning_rate": 1.5519780767864646e-06, "loss": 1.0786, "step": 33662 }, { "epoch": 0.64, "learning_rate": 1.551836722905789e-06, "loss": 1.0527, "step": 33663 }, { "epoch": 0.64, "learning_rate": 1.5516953725655267e-06, "loss": 0.8588, "step": 33664 }, { "epoch": 0.64, "learning_rate": 1.5515540257662036e-06, "loss": 1.0839, "step": 33665 }, { "epoch": 0.64, "learning_rate": 1.5514126825083504e-06, "loss": 0.8948, "step": 33666 }, { "epoch": 0.64, "learning_rate": 1.5512713427924924e-06, "loss": 0.8589, "step": 33667 }, { "epoch": 0.64, "learning_rate": 1.5511300066191576e-06, "loss": 1.0953, "step": 33668 }, { "epoch": 0.64, "learning_rate": 1.5509886739888747e-06, "loss": 1.2325, "step": 33669 }, { "epoch": 0.64, "learning_rate": 1.550847344902171e-06, "loss": 0.9291, "step": 33670 }, { "epoch": 0.64, "learning_rate": 1.5507060193595735e-06, "loss": 0.7289, "step": 33671 }, { "epoch": 0.64, "learning_rate": 1.5505646973616117e-06, "loss": 0.9348, "step": 33672 }, { "epoch": 0.64, "learning_rate": 1.5504233789088125e-06, "loss": 1.0555, "step": 33673 }, { "epoch": 0.64, "learning_rate": 1.5502820640017019e-06, "loss": 0.9756, "step": 33674 }, { "epoch": 0.64, "learning_rate": 1.5501407526408099e-06, "loss": 1.1903, "step": 33675 }, { "epoch": 0.64, "learning_rate": 1.5499994448266627e-06, "loss": 0.9807, "step": 33676 }, { "epoch": 0.64, "learning_rate": 1.5498581405597884e-06, "loss": 0.9714, "step": 33677 }, { "epoch": 0.64, "learning_rate": 1.5497168398407153e-06, "loss": 0.7528, "step": 33678 }, { "epoch": 0.64, "learning_rate": 1.5495755426699704e-06, "loss": 0.7482, "step": 33679 }, { "epoch": 0.64, "learning_rate": 1.5494342490480801e-06, "loss": 1.0538, "step": 33680 }, { "epoch": 0.64, "learning_rate": 1.5492929589755744e-06, "loss": 1.0844, "step": 33681 }, { "epoch": 0.64, "learning_rate": 1.5491516724529792e-06, "loss": 0.8612, "step": 33682 }, { "epoch": 0.64, "learning_rate": 1.5490103894808225e-06, "loss": 1.0505, "step": 33683 }, { "epoch": 0.64, "learning_rate": 1.5488691100596318e-06, "loss": 0.7568, "step": 33684 }, { "epoch": 0.64, "learning_rate": 1.5487278341899353e-06, "loss": 0.8633, "step": 33685 }, { "epoch": 0.64, "learning_rate": 1.5485865618722584e-06, "loss": 0.9105, "step": 33686 }, { "epoch": 0.64, "learning_rate": 1.5484452931071316e-06, "loss": 1.1212, "step": 33687 }, { "epoch": 0.64, "learning_rate": 1.5483040278950808e-06, "loss": 0.8268, "step": 33688 }, { "epoch": 0.64, "learning_rate": 1.5481627662366327e-06, "loss": 0.8248, "step": 33689 }, { "epoch": 0.64, "learning_rate": 1.5480215081323158e-06, "loss": 0.8055, "step": 33690 }, { "epoch": 0.64, "learning_rate": 1.5478802535826582e-06, "loss": 0.8295, "step": 33691 }, { "epoch": 0.64, "learning_rate": 1.5477390025881854e-06, "loss": 0.9811, "step": 33692 }, { "epoch": 0.64, "learning_rate": 1.547597755149427e-06, "loss": 0.8979, "step": 33693 }, { "epoch": 0.64, "learning_rate": 1.5474565112669093e-06, "loss": 1.1901, "step": 33694 }, { "epoch": 0.64, "learning_rate": 1.547315270941159e-06, "loss": 0.8776, "step": 33695 }, { "epoch": 0.64, "learning_rate": 1.5471740341727052e-06, "loss": 0.6909, "step": 33696 }, { "epoch": 0.64, "learning_rate": 1.547032800962074e-06, "loss": 0.916, "step": 33697 }, { "epoch": 0.64, "learning_rate": 1.5468915713097921e-06, "loss": 0.7637, "step": 33698 }, { "epoch": 0.64, "learning_rate": 1.5467503452163891e-06, "loss": 1.0335, "step": 33699 }, { "epoch": 0.64, "learning_rate": 1.546609122682391e-06, "loss": 0.9945, "step": 33700 }, { "epoch": 0.64, "learning_rate": 1.5464679037083244e-06, "loss": 0.8909, "step": 33701 }, { "epoch": 0.64, "learning_rate": 1.5463266882947183e-06, "loss": 0.8543, "step": 33702 }, { "epoch": 0.64, "learning_rate": 1.5461854764420986e-06, "loss": 0.8547, "step": 33703 }, { "epoch": 0.64, "learning_rate": 1.5460442681509933e-06, "loss": 0.6945, "step": 33704 }, { "epoch": 0.64, "learning_rate": 1.545903063421929e-06, "loss": 0.983, "step": 33705 }, { "epoch": 0.64, "learning_rate": 1.5457618622554342e-06, "loss": 1.0109, "step": 33706 }, { "epoch": 0.64, "learning_rate": 1.5456206646520344e-06, "loss": 0.9467, "step": 33707 }, { "epoch": 0.64, "learning_rate": 1.5454794706122588e-06, "loss": 0.8378, "step": 33708 }, { "epoch": 0.64, "learning_rate": 1.5453382801366334e-06, "loss": 0.7242, "step": 33709 }, { "epoch": 0.64, "learning_rate": 1.545197093225685e-06, "loss": 0.8218, "step": 33710 }, { "epoch": 0.64, "learning_rate": 1.5450559098799413e-06, "loss": 0.873, "step": 33711 }, { "epoch": 0.64, "learning_rate": 1.5449147300999303e-06, "loss": 0.9588, "step": 33712 }, { "epoch": 0.64, "learning_rate": 1.5447735538861774e-06, "loss": 1.1479, "step": 33713 }, { "epoch": 0.64, "learning_rate": 1.5446323812392119e-06, "loss": 0.8784, "step": 33714 }, { "epoch": 0.64, "learning_rate": 1.5444912121595595e-06, "loss": 1.0133, "step": 33715 }, { "epoch": 0.64, "learning_rate": 1.544350046647747e-06, "loss": 0.7128, "step": 33716 }, { "epoch": 0.64, "learning_rate": 1.544208884704303e-06, "loss": 0.6642, "step": 33717 }, { "epoch": 0.64, "learning_rate": 1.5440677263297533e-06, "loss": 0.8969, "step": 33718 }, { "epoch": 0.64, "learning_rate": 1.5439265715246246e-06, "loss": 0.9594, "step": 33719 }, { "epoch": 0.64, "learning_rate": 1.543785420289446e-06, "loss": 0.8912, "step": 33720 }, { "epoch": 0.64, "learning_rate": 1.5436442726247431e-06, "loss": 0.877, "step": 33721 }, { "epoch": 0.64, "learning_rate": 1.5435031285310425e-06, "loss": 0.818, "step": 33722 }, { "epoch": 0.64, "learning_rate": 1.5433619880088723e-06, "loss": 0.8839, "step": 33723 }, { "epoch": 0.64, "learning_rate": 1.5432208510587594e-06, "loss": 0.967, "step": 33724 }, { "epoch": 0.64, "learning_rate": 1.5430797176812306e-06, "loss": 1.1381, "step": 33725 }, { "epoch": 0.64, "learning_rate": 1.5429385878768116e-06, "loss": 1.0635, "step": 33726 }, { "epoch": 0.64, "learning_rate": 1.5427974616460317e-06, "loss": 0.7828, "step": 33727 }, { "epoch": 0.64, "learning_rate": 1.542656338989417e-06, "loss": 1.062, "step": 33728 }, { "epoch": 0.64, "learning_rate": 1.542515219907493e-06, "loss": 0.6785, "step": 33729 }, { "epoch": 0.64, "learning_rate": 1.5423741044007884e-06, "loss": 1.0146, "step": 33730 }, { "epoch": 0.64, "learning_rate": 1.5422329924698298e-06, "loss": 1.2654, "step": 33731 }, { "epoch": 0.64, "learning_rate": 1.5420918841151427e-06, "loss": 1.1077, "step": 33732 }, { "epoch": 0.64, "learning_rate": 1.5419507793372568e-06, "loss": 0.744, "step": 33733 }, { "epoch": 0.64, "learning_rate": 1.5418096781366967e-06, "loss": 0.8803, "step": 33734 }, { "epoch": 0.64, "learning_rate": 1.541668580513989e-06, "loss": 0.9515, "step": 33735 }, { "epoch": 0.64, "learning_rate": 1.5415274864696628e-06, "loss": 0.7709, "step": 33736 }, { "epoch": 0.64, "learning_rate": 1.5413863960042428e-06, "loss": 1.0187, "step": 33737 }, { "epoch": 0.64, "learning_rate": 1.541245309118256e-06, "loss": 1.1409, "step": 33738 }, { "epoch": 0.64, "learning_rate": 1.541104225812231e-06, "loss": 0.7194, "step": 33739 }, { "epoch": 0.64, "learning_rate": 1.5409631460866933e-06, "loss": 1.0551, "step": 33740 }, { "epoch": 0.64, "learning_rate": 1.540822069942169e-06, "loss": 0.926, "step": 33741 }, { "epoch": 0.64, "learning_rate": 1.5406809973791865e-06, "loss": 0.855, "step": 33742 }, { "epoch": 0.64, "learning_rate": 1.5405399283982714e-06, "loss": 0.8664, "step": 33743 }, { "epoch": 0.64, "learning_rate": 1.5403988629999506e-06, "loss": 0.8757, "step": 33744 }, { "epoch": 0.64, "learning_rate": 1.540257801184751e-06, "loss": 0.9844, "step": 33745 }, { "epoch": 0.64, "learning_rate": 1.5401167429531999e-06, "loss": 0.9409, "step": 33746 }, { "epoch": 0.64, "learning_rate": 1.5399756883058225e-06, "loss": 0.8914, "step": 33747 }, { "epoch": 0.64, "learning_rate": 1.5398346372431478e-06, "loss": 1.016, "step": 33748 }, { "epoch": 0.64, "learning_rate": 1.5396935897657006e-06, "loss": 0.8799, "step": 33749 }, { "epoch": 0.64, "learning_rate": 1.5395525458740073e-06, "loss": 1.0051, "step": 33750 }, { "epoch": 0.64, "learning_rate": 1.5394115055685958e-06, "loss": 0.9969, "step": 33751 }, { "epoch": 0.64, "learning_rate": 1.5392704688499927e-06, "loss": 0.7887, "step": 33752 }, { "epoch": 0.64, "learning_rate": 1.5391294357187233e-06, "loss": 1.204, "step": 33753 }, { "epoch": 0.64, "learning_rate": 1.5389884061753162e-06, "loss": 0.9485, "step": 33754 }, { "epoch": 0.64, "learning_rate": 1.5388473802202969e-06, "loss": 1.0291, "step": 33755 }, { "epoch": 0.64, "learning_rate": 1.538706357854191e-06, "loss": 0.9604, "step": 33756 }, { "epoch": 0.64, "learning_rate": 1.5385653390775267e-06, "loss": 0.8907, "step": 33757 }, { "epoch": 0.64, "learning_rate": 1.5384243238908303e-06, "loss": 1.0598, "step": 33758 }, { "epoch": 0.64, "learning_rate": 1.5382833122946266e-06, "loss": 0.9322, "step": 33759 }, { "epoch": 0.64, "learning_rate": 1.538142304289445e-06, "loss": 0.7534, "step": 33760 }, { "epoch": 0.64, "learning_rate": 1.5380012998758106e-06, "loss": 0.6701, "step": 33761 }, { "epoch": 0.64, "learning_rate": 1.5378602990542489e-06, "loss": 0.8684, "step": 33762 }, { "epoch": 0.64, "learning_rate": 1.5377193018252879e-06, "loss": 0.9958, "step": 33763 }, { "epoch": 0.64, "learning_rate": 1.5375783081894535e-06, "loss": 0.9739, "step": 33764 }, { "epoch": 0.64, "learning_rate": 1.5374373181472719e-06, "loss": 0.7804, "step": 33765 }, { "epoch": 0.64, "learning_rate": 1.53729633169927e-06, "loss": 0.9414, "step": 33766 }, { "epoch": 0.64, "learning_rate": 1.5371553488459745e-06, "loss": 0.9371, "step": 33767 }, { "epoch": 0.64, "learning_rate": 1.5370143695879103e-06, "loss": 0.8465, "step": 33768 }, { "epoch": 0.64, "learning_rate": 1.5368733939256058e-06, "loss": 1.0845, "step": 33769 }, { "epoch": 0.64, "learning_rate": 1.5367324218595868e-06, "loss": 0.9548, "step": 33770 }, { "epoch": 0.64, "learning_rate": 1.5365914533903787e-06, "loss": 0.8914, "step": 33771 }, { "epoch": 0.64, "learning_rate": 1.5364504885185082e-06, "loss": 0.9841, "step": 33772 }, { "epoch": 0.64, "learning_rate": 1.5363095272445034e-06, "loss": 0.7679, "step": 33773 }, { "epoch": 0.64, "learning_rate": 1.5361685695688877e-06, "loss": 0.985, "step": 33774 }, { "epoch": 0.64, "learning_rate": 1.5360276154921904e-06, "loss": 1.3429, "step": 33775 }, { "epoch": 0.64, "learning_rate": 1.5358866650149362e-06, "loss": 0.6598, "step": 33776 }, { "epoch": 0.64, "learning_rate": 1.5357457181376507e-06, "loss": 0.8951, "step": 33777 }, { "epoch": 0.64, "learning_rate": 1.5356047748608622e-06, "loss": 0.9021, "step": 33778 }, { "epoch": 0.64, "learning_rate": 1.5354638351850953e-06, "loss": 0.8926, "step": 33779 }, { "epoch": 0.64, "learning_rate": 1.5353228991108765e-06, "loss": 1.1431, "step": 33780 }, { "epoch": 0.64, "learning_rate": 1.5351819666387329e-06, "loss": 1.0593, "step": 33781 }, { "epoch": 0.64, "learning_rate": 1.535041037769191e-06, "loss": 0.9411, "step": 33782 }, { "epoch": 0.64, "learning_rate": 1.534900112502775e-06, "loss": 0.8594, "step": 33783 }, { "epoch": 0.64, "learning_rate": 1.5347591908400133e-06, "loss": 0.935, "step": 33784 }, { "epoch": 0.64, "learning_rate": 1.5346182727814308e-06, "loss": 0.7598, "step": 33785 }, { "epoch": 0.64, "learning_rate": 1.5344773583275537e-06, "loss": 0.768, "step": 33786 }, { "epoch": 0.64, "learning_rate": 1.534336447478909e-06, "loss": 1.1185, "step": 33787 }, { "epoch": 0.64, "learning_rate": 1.5341955402360225e-06, "loss": 1.1321, "step": 33788 }, { "epoch": 0.64, "learning_rate": 1.5340546365994196e-06, "loss": 0.7145, "step": 33789 }, { "epoch": 0.64, "learning_rate": 1.5339137365696276e-06, "loss": 0.9211, "step": 33790 }, { "epoch": 0.64, "learning_rate": 1.5337728401471728e-06, "loss": 1.0316, "step": 33791 }, { "epoch": 0.64, "learning_rate": 1.533631947332579e-06, "loss": 0.9373, "step": 33792 }, { "epoch": 0.64, "learning_rate": 1.5334910581263745e-06, "loss": 1.1581, "step": 33793 }, { "epoch": 0.64, "learning_rate": 1.5333501725290857e-06, "loss": 1.1917, "step": 33794 }, { "epoch": 0.64, "learning_rate": 1.533209290541236e-06, "loss": 0.8503, "step": 33795 }, { "epoch": 0.64, "learning_rate": 1.533068412163355e-06, "loss": 0.7661, "step": 33796 }, { "epoch": 0.64, "learning_rate": 1.5329275373959663e-06, "loss": 1.0406, "step": 33797 }, { "epoch": 0.64, "learning_rate": 1.5327866662395956e-06, "loss": 0.914, "step": 33798 }, { "epoch": 0.64, "learning_rate": 1.5326457986947708e-06, "loss": 1.0229, "step": 33799 }, { "epoch": 0.64, "learning_rate": 1.5325049347620163e-06, "loss": 0.9904, "step": 33800 }, { "epoch": 0.64, "learning_rate": 1.5323640744418586e-06, "loss": 0.9937, "step": 33801 }, { "epoch": 0.64, "learning_rate": 1.5322232177348245e-06, "loss": 0.9531, "step": 33802 }, { "epoch": 0.64, "learning_rate": 1.5320823646414395e-06, "loss": 0.9931, "step": 33803 }, { "epoch": 0.64, "learning_rate": 1.531941515162228e-06, "loss": 0.7537, "step": 33804 }, { "epoch": 0.64, "learning_rate": 1.5318006692977184e-06, "loss": 1.184, "step": 33805 }, { "epoch": 0.64, "learning_rate": 1.5316598270484348e-06, "loss": 0.8256, "step": 33806 }, { "epoch": 0.64, "learning_rate": 1.5315189884149038e-06, "loss": 1.0013, "step": 33807 }, { "epoch": 0.64, "learning_rate": 1.5313781533976514e-06, "loss": 0.8358, "step": 33808 }, { "epoch": 0.64, "learning_rate": 1.5312373219972032e-06, "loss": 0.9508, "step": 33809 }, { "epoch": 0.64, "learning_rate": 1.5310964942140844e-06, "loss": 0.757, "step": 33810 }, { "epoch": 0.64, "learning_rate": 1.5309556700488227e-06, "loss": 0.8951, "step": 33811 }, { "epoch": 0.64, "learning_rate": 1.5308148495019426e-06, "loss": 1.0679, "step": 33812 }, { "epoch": 0.64, "learning_rate": 1.5306740325739695e-06, "loss": 0.946, "step": 33813 }, { "epoch": 0.64, "learning_rate": 1.53053321926543e-06, "loss": 0.9072, "step": 33814 }, { "epoch": 0.64, "learning_rate": 1.5303924095768505e-06, "loss": 0.701, "step": 33815 }, { "epoch": 0.64, "learning_rate": 1.530251603508755e-06, "loss": 0.895, "step": 33816 }, { "epoch": 0.64, "learning_rate": 1.530110801061671e-06, "loss": 0.7552, "step": 33817 }, { "epoch": 0.64, "learning_rate": 1.5299700022361236e-06, "loss": 0.9746, "step": 33818 }, { "epoch": 0.64, "learning_rate": 1.5298292070326376e-06, "loss": 1.0821, "step": 33819 }, { "epoch": 0.64, "learning_rate": 1.5296884154517406e-06, "loss": 0.768, "step": 33820 }, { "epoch": 0.64, "learning_rate": 1.529547627493957e-06, "loss": 0.8206, "step": 33821 }, { "epoch": 0.64, "learning_rate": 1.529406843159812e-06, "loss": 0.9554, "step": 33822 }, { "epoch": 0.64, "learning_rate": 1.529266062449833e-06, "loss": 0.7336, "step": 33823 }, { "epoch": 0.64, "learning_rate": 1.529125285364545e-06, "loss": 1.0671, "step": 33824 }, { "epoch": 0.64, "learning_rate": 1.528984511904472e-06, "loss": 1.0532, "step": 33825 }, { "epoch": 0.64, "learning_rate": 1.5288437420701427e-06, "loss": 1.0426, "step": 33826 }, { "epoch": 0.64, "learning_rate": 1.5287029758620802e-06, "loss": 0.7827, "step": 33827 }, { "epoch": 0.64, "learning_rate": 1.5285622132808108e-06, "loss": 0.9661, "step": 33828 }, { "epoch": 0.64, "learning_rate": 1.528421454326861e-06, "loss": 0.7727, "step": 33829 }, { "epoch": 0.64, "learning_rate": 1.5282806990007556e-06, "loss": 0.9421, "step": 33830 }, { "epoch": 0.64, "learning_rate": 1.5281399473030195e-06, "loss": 1.0869, "step": 33831 }, { "epoch": 0.64, "learning_rate": 1.5279991992341802e-06, "loss": 0.8382, "step": 33832 }, { "epoch": 0.64, "learning_rate": 1.5278584547947618e-06, "loss": 0.9136, "step": 33833 }, { "epoch": 0.64, "learning_rate": 1.5277177139852893e-06, "loss": 0.8005, "step": 33834 }, { "epoch": 0.64, "learning_rate": 1.5275769768062893e-06, "loss": 0.8858, "step": 33835 }, { "epoch": 0.64, "learning_rate": 1.527436243258288e-06, "loss": 0.7471, "step": 33836 }, { "epoch": 0.64, "learning_rate": 1.5272955133418086e-06, "loss": 1.0948, "step": 33837 }, { "epoch": 0.64, "learning_rate": 1.5271547870573788e-06, "loss": 0.9904, "step": 33838 }, { "epoch": 0.64, "learning_rate": 1.5270140644055237e-06, "loss": 0.7905, "step": 33839 }, { "epoch": 0.64, "learning_rate": 1.5268733453867668e-06, "loss": 0.8602, "step": 33840 }, { "epoch": 0.64, "learning_rate": 1.5267326300016362e-06, "loss": 0.8276, "step": 33841 }, { "epoch": 0.64, "learning_rate": 1.5265919182506555e-06, "loss": 0.9996, "step": 33842 }, { "epoch": 0.64, "learning_rate": 1.5264512101343504e-06, "loss": 1.0535, "step": 33843 }, { "epoch": 0.64, "learning_rate": 1.5263105056532473e-06, "loss": 1.0641, "step": 33844 }, { "epoch": 0.64, "learning_rate": 1.5261698048078713e-06, "loss": 0.9822, "step": 33845 }, { "epoch": 0.64, "learning_rate": 1.526029107598746e-06, "loss": 0.8101, "step": 33846 }, { "epoch": 0.64, "learning_rate": 1.5258884140263997e-06, "loss": 0.8619, "step": 33847 }, { "epoch": 0.64, "learning_rate": 1.5257477240913554e-06, "loss": 0.8037, "step": 33848 }, { "epoch": 0.64, "learning_rate": 1.525607037794139e-06, "loss": 1.0167, "step": 33849 }, { "epoch": 0.64, "learning_rate": 1.5254663551352763e-06, "loss": 0.9071, "step": 33850 }, { "epoch": 0.64, "learning_rate": 1.5253256761152928e-06, "loss": 0.9069, "step": 33851 }, { "epoch": 0.64, "learning_rate": 1.5251850007347124e-06, "loss": 0.903, "step": 33852 }, { "epoch": 0.64, "learning_rate": 1.5250443289940623e-06, "loss": 0.7781, "step": 33853 }, { "epoch": 0.64, "learning_rate": 1.5249036608938666e-06, "loss": 0.9707, "step": 33854 }, { "epoch": 0.64, "learning_rate": 1.5247629964346499e-06, "loss": 0.9492, "step": 33855 }, { "epoch": 0.64, "learning_rate": 1.5246223356169388e-06, "loss": 1.1632, "step": 33856 }, { "epoch": 0.64, "learning_rate": 1.5244816784412586e-06, "loss": 1.0151, "step": 33857 }, { "epoch": 0.64, "learning_rate": 1.5243410249081325e-06, "loss": 0.678, "step": 33858 }, { "epoch": 0.64, "learning_rate": 1.5242003750180883e-06, "loss": 0.9169, "step": 33859 }, { "epoch": 0.64, "learning_rate": 1.5240597287716502e-06, "loss": 0.9706, "step": 33860 }, { "epoch": 0.64, "learning_rate": 1.5239190861693421e-06, "loss": 0.8206, "step": 33861 }, { "epoch": 0.64, "learning_rate": 1.5237784472116909e-06, "loss": 1.0859, "step": 33862 }, { "epoch": 0.64, "learning_rate": 1.5236378118992207e-06, "loss": 0.8446, "step": 33863 }, { "epoch": 0.64, "learning_rate": 1.5234971802324566e-06, "loss": 0.9911, "step": 33864 }, { "epoch": 0.64, "learning_rate": 1.5233565522119247e-06, "loss": 0.8826, "step": 33865 }, { "epoch": 0.64, "learning_rate": 1.52321592783815e-06, "loss": 0.8934, "step": 33866 }, { "epoch": 0.64, "learning_rate": 1.5230753071116559e-06, "loss": 0.6149, "step": 33867 }, { "epoch": 0.64, "learning_rate": 1.5229346900329694e-06, "loss": 0.9758, "step": 33868 }, { "epoch": 0.64, "learning_rate": 1.5227940766026146e-06, "loss": 1.1259, "step": 33869 }, { "epoch": 0.64, "learning_rate": 1.5226534668211167e-06, "loss": 0.9627, "step": 33870 }, { "epoch": 0.64, "learning_rate": 1.5225128606890008e-06, "loss": 0.9154, "step": 33871 }, { "epoch": 0.64, "learning_rate": 1.5223722582067923e-06, "loss": 0.9345, "step": 33872 }, { "epoch": 0.64, "learning_rate": 1.5222316593750147e-06, "loss": 0.9613, "step": 33873 }, { "epoch": 0.64, "learning_rate": 1.5220910641941954e-06, "loss": 0.9481, "step": 33874 }, { "epoch": 0.64, "learning_rate": 1.521950472664858e-06, "loss": 1.0148, "step": 33875 }, { "epoch": 0.64, "learning_rate": 1.5218098847875268e-06, "loss": 1.0506, "step": 33876 }, { "epoch": 0.64, "learning_rate": 1.5216693005627276e-06, "loss": 0.8448, "step": 33877 }, { "epoch": 0.64, "learning_rate": 1.5215287199909856e-06, "loss": 0.8257, "step": 33878 }, { "epoch": 0.64, "learning_rate": 1.5213881430728247e-06, "loss": 0.7462, "step": 33879 }, { "epoch": 0.64, "learning_rate": 1.5212475698087714e-06, "loss": 0.9187, "step": 33880 }, { "epoch": 0.64, "learning_rate": 1.5211070001993498e-06, "loss": 1.1108, "step": 33881 }, { "epoch": 0.64, "learning_rate": 1.5209664342450834e-06, "loss": 1.0811, "step": 33882 }, { "epoch": 0.64, "learning_rate": 1.5208258719464994e-06, "loss": 0.8412, "step": 33883 }, { "epoch": 0.64, "learning_rate": 1.5206853133041211e-06, "loss": 1.0979, "step": 33884 }, { "epoch": 0.64, "learning_rate": 1.5205447583184732e-06, "loss": 0.9108, "step": 33885 }, { "epoch": 0.64, "learning_rate": 1.520404206990082e-06, "loss": 0.9567, "step": 33886 }, { "epoch": 0.64, "learning_rate": 1.5202636593194719e-06, "loss": 1.1129, "step": 33887 }, { "epoch": 0.64, "learning_rate": 1.520123115307166e-06, "loss": 1.1139, "step": 33888 }, { "epoch": 0.64, "learning_rate": 1.5199825749536915e-06, "loss": 0.9955, "step": 33889 }, { "epoch": 0.64, "learning_rate": 1.5198420382595714e-06, "loss": 0.8257, "step": 33890 }, { "epoch": 0.64, "learning_rate": 1.5197015052253312e-06, "loss": 0.8621, "step": 33891 }, { "epoch": 0.64, "learning_rate": 1.5195609758514951e-06, "loss": 0.7291, "step": 33892 }, { "epoch": 0.64, "learning_rate": 1.5194204501385893e-06, "loss": 1.1449, "step": 33893 }, { "epoch": 0.64, "learning_rate": 1.5192799280871362e-06, "loss": 1.2233, "step": 33894 }, { "epoch": 0.64, "learning_rate": 1.5191394096976628e-06, "loss": 0.9544, "step": 33895 }, { "epoch": 0.64, "learning_rate": 1.518998894970693e-06, "loss": 0.8372, "step": 33896 }, { "epoch": 0.64, "learning_rate": 1.51885838390675e-06, "loss": 0.8705, "step": 33897 }, { "epoch": 0.64, "learning_rate": 1.5187178765063601e-06, "loss": 0.7399, "step": 33898 }, { "epoch": 0.64, "learning_rate": 1.518577372770048e-06, "loss": 0.9633, "step": 33899 }, { "epoch": 0.64, "learning_rate": 1.5184368726983372e-06, "loss": 1.2994, "step": 33900 }, { "epoch": 0.64, "learning_rate": 1.518296376291754e-06, "loss": 0.9161, "step": 33901 }, { "epoch": 0.64, "learning_rate": 1.518155883550822e-06, "loss": 0.9592, "step": 33902 }, { "epoch": 0.64, "learning_rate": 1.5180153944760648e-06, "loss": 0.9461, "step": 33903 }, { "epoch": 0.64, "learning_rate": 1.517874909068009e-06, "loss": 0.8712, "step": 33904 }, { "epoch": 0.64, "learning_rate": 1.5177344273271776e-06, "loss": 0.8586, "step": 33905 }, { "epoch": 0.64, "learning_rate": 1.5175939492540953e-06, "loss": 1.0488, "step": 33906 }, { "epoch": 0.64, "learning_rate": 1.517453474849288e-06, "loss": 1.0147, "step": 33907 }, { "epoch": 0.64, "learning_rate": 1.5173130041132795e-06, "loss": 0.825, "step": 33908 }, { "epoch": 0.64, "learning_rate": 1.5171725370465928e-06, "loss": 0.8006, "step": 33909 }, { "epoch": 0.64, "learning_rate": 1.5170320736497552e-06, "loss": 0.7756, "step": 33910 }, { "epoch": 0.64, "learning_rate": 1.5168916139232886e-06, "loss": 1.0283, "step": 33911 }, { "epoch": 0.64, "learning_rate": 1.5167511578677192e-06, "loss": 1.0681, "step": 33912 }, { "epoch": 0.64, "learning_rate": 1.5166107054835705e-06, "loss": 0.9283, "step": 33913 }, { "epoch": 0.64, "learning_rate": 1.5164702567713676e-06, "loss": 0.9767, "step": 33914 }, { "epoch": 0.64, "learning_rate": 1.5163298117316338e-06, "loss": 1.0063, "step": 33915 }, { "epoch": 0.64, "learning_rate": 1.5161893703648952e-06, "loss": 0.9045, "step": 33916 }, { "epoch": 0.64, "learning_rate": 1.5160489326716753e-06, "loss": 0.9961, "step": 33917 }, { "epoch": 0.64, "learning_rate": 1.515908498652498e-06, "loss": 1.0217, "step": 33918 }, { "epoch": 0.64, "learning_rate": 1.5157680683078882e-06, "loss": 1.0814, "step": 33919 }, { "epoch": 0.64, "learning_rate": 1.5156276416383708e-06, "loss": 0.9642, "step": 33920 }, { "epoch": 0.64, "learning_rate": 1.5154872186444688e-06, "loss": 0.7471, "step": 33921 }, { "epoch": 0.64, "learning_rate": 1.5153467993267082e-06, "loss": 0.8972, "step": 33922 }, { "epoch": 0.64, "learning_rate": 1.5152063836856127e-06, "loss": 1.0001, "step": 33923 }, { "epoch": 0.64, "learning_rate": 1.5150659717217051e-06, "loss": 1.0022, "step": 33924 }, { "epoch": 0.64, "learning_rate": 1.514925563435512e-06, "loss": 1.0784, "step": 33925 }, { "epoch": 0.64, "learning_rate": 1.514785158827556e-06, "loss": 0.9214, "step": 33926 }, { "epoch": 0.64, "learning_rate": 1.514644757898362e-06, "loss": 0.8831, "step": 33927 }, { "epoch": 0.64, "learning_rate": 1.514504360648455e-06, "loss": 0.9536, "step": 33928 }, { "epoch": 0.64, "learning_rate": 1.5143639670783583e-06, "loss": 0.839, "step": 33929 }, { "epoch": 0.64, "learning_rate": 1.5142235771885954e-06, "loss": 0.9817, "step": 33930 }, { "epoch": 0.64, "learning_rate": 1.5140831909796928e-06, "loss": 1.1252, "step": 33931 }, { "epoch": 0.64, "learning_rate": 1.5139428084521723e-06, "loss": 1.0907, "step": 33932 }, { "epoch": 0.64, "learning_rate": 1.5138024296065595e-06, "loss": 0.855, "step": 33933 }, { "epoch": 0.64, "learning_rate": 1.5136620544433777e-06, "loss": 0.9099, "step": 33934 }, { "epoch": 0.64, "learning_rate": 1.5135216829631528e-06, "loss": 0.6902, "step": 33935 }, { "epoch": 0.64, "learning_rate": 1.5133813151664063e-06, "loss": 0.9525, "step": 33936 }, { "epoch": 0.64, "learning_rate": 1.5132409510536644e-06, "loss": 0.9938, "step": 33937 }, { "epoch": 0.64, "learning_rate": 1.5131005906254508e-06, "loss": 0.7544, "step": 33938 }, { "epoch": 0.64, "learning_rate": 1.5129602338822886e-06, "loss": 0.9507, "step": 33939 }, { "epoch": 0.64, "learning_rate": 1.5128198808247029e-06, "loss": 0.8459, "step": 33940 }, { "epoch": 0.64, "learning_rate": 1.5126795314532178e-06, "loss": 0.8673, "step": 33941 }, { "epoch": 0.64, "learning_rate": 1.5125391857683564e-06, "loss": 0.9312, "step": 33942 }, { "epoch": 0.64, "learning_rate": 1.5123988437706444e-06, "loss": 0.9495, "step": 33943 }, { "epoch": 0.64, "learning_rate": 1.512258505460605e-06, "loss": 0.719, "step": 33944 }, { "epoch": 0.64, "learning_rate": 1.5121181708387606e-06, "loss": 0.6768, "step": 33945 }, { "epoch": 0.64, "learning_rate": 1.5119778399056375e-06, "loss": 0.723, "step": 33946 }, { "epoch": 0.64, "learning_rate": 1.5118375126617587e-06, "loss": 1.0024, "step": 33947 }, { "epoch": 0.64, "learning_rate": 1.5116971891076479e-06, "loss": 0.8419, "step": 33948 }, { "epoch": 0.64, "learning_rate": 1.5115568692438303e-06, "loss": 1.0193, "step": 33949 }, { "epoch": 0.64, "learning_rate": 1.5114165530708292e-06, "loss": 1.1171, "step": 33950 }, { "epoch": 0.64, "learning_rate": 1.5112762405891674e-06, "loss": 0.9523, "step": 33951 }, { "epoch": 0.64, "learning_rate": 1.5111359317993706e-06, "loss": 0.8721, "step": 33952 }, { "epoch": 0.64, "learning_rate": 1.5109956267019614e-06, "loss": 0.8582, "step": 33953 }, { "epoch": 0.64, "learning_rate": 1.5108553252974645e-06, "loss": 0.8412, "step": 33954 }, { "epoch": 0.64, "learning_rate": 1.5107150275864036e-06, "loss": 0.8745, "step": 33955 }, { "epoch": 0.64, "learning_rate": 1.5105747335693024e-06, "loss": 0.9453, "step": 33956 }, { "epoch": 0.64, "learning_rate": 1.5104344432466842e-06, "loss": 0.9835, "step": 33957 }, { "epoch": 0.64, "learning_rate": 1.5102941566190743e-06, "loss": 0.804, "step": 33958 }, { "epoch": 0.64, "learning_rate": 1.5101538736869958e-06, "loss": 0.9097, "step": 33959 }, { "epoch": 0.64, "learning_rate": 1.5100135944509717e-06, "loss": 0.9515, "step": 33960 }, { "epoch": 0.64, "learning_rate": 1.5098733189115262e-06, "loss": 0.9407, "step": 33961 }, { "epoch": 0.64, "learning_rate": 1.509733047069184e-06, "loss": 0.9729, "step": 33962 }, { "epoch": 0.64, "learning_rate": 1.5095927789244685e-06, "loss": 0.9639, "step": 33963 }, { "epoch": 0.64, "learning_rate": 1.5094525144779024e-06, "loss": 1.0635, "step": 33964 }, { "epoch": 0.64, "learning_rate": 1.5093122537300109e-06, "loss": 0.8358, "step": 33965 }, { "epoch": 0.64, "learning_rate": 1.5091719966813168e-06, "loss": 0.803, "step": 33966 }, { "epoch": 0.64, "learning_rate": 1.5090317433323439e-06, "loss": 0.7314, "step": 33967 }, { "epoch": 0.64, "learning_rate": 1.5088914936836164e-06, "loss": 1.0967, "step": 33968 }, { "epoch": 0.64, "learning_rate": 1.5087512477356578e-06, "loss": 1.0399, "step": 33969 }, { "epoch": 0.64, "learning_rate": 1.5086110054889907e-06, "loss": 0.6942, "step": 33970 }, { "epoch": 0.64, "learning_rate": 1.508470766944141e-06, "loss": 0.774, "step": 33971 }, { "epoch": 0.64, "learning_rate": 1.5083305321016306e-06, "loss": 0.9177, "step": 33972 }, { "epoch": 0.64, "learning_rate": 1.5081903009619831e-06, "loss": 0.9174, "step": 33973 }, { "epoch": 0.64, "learning_rate": 1.5080500735257227e-06, "loss": 0.9965, "step": 33974 }, { "epoch": 0.64, "learning_rate": 1.5079098497933737e-06, "loss": 1.1332, "step": 33975 }, { "epoch": 0.64, "learning_rate": 1.5077696297654576e-06, "loss": 0.9791, "step": 33976 }, { "epoch": 0.64, "learning_rate": 1.5076294134425006e-06, "loss": 0.8607, "step": 33977 }, { "epoch": 0.64, "learning_rate": 1.5074892008250247e-06, "loss": 0.8846, "step": 33978 }, { "epoch": 0.64, "learning_rate": 1.5073489919135529e-06, "loss": 0.7281, "step": 33979 }, { "epoch": 0.64, "learning_rate": 1.5072087867086105e-06, "loss": 0.9062, "step": 33980 }, { "epoch": 0.64, "learning_rate": 1.5070685852107191e-06, "loss": 1.0772, "step": 33981 }, { "epoch": 0.64, "learning_rate": 1.5069283874204033e-06, "loss": 0.9208, "step": 33982 }, { "epoch": 0.64, "learning_rate": 1.5067881933381872e-06, "loss": 0.9424, "step": 33983 }, { "epoch": 0.64, "learning_rate": 1.5066480029645937e-06, "loss": 0.8072, "step": 33984 }, { "epoch": 0.64, "learning_rate": 1.5065078163001445e-06, "loss": 0.981, "step": 33985 }, { "epoch": 0.64, "learning_rate": 1.5063676333453664e-06, "loss": 0.8246, "step": 33986 }, { "epoch": 0.64, "learning_rate": 1.50622745410078e-06, "loss": 1.1659, "step": 33987 }, { "epoch": 0.64, "learning_rate": 1.5060872785669101e-06, "loss": 0.9006, "step": 33988 }, { "epoch": 0.64, "learning_rate": 1.5059471067442798e-06, "loss": 0.7353, "step": 33989 }, { "epoch": 0.64, "learning_rate": 1.505806938633413e-06, "loss": 0.9489, "step": 33990 }, { "epoch": 0.64, "learning_rate": 1.5056667742348318e-06, "loss": 0.818, "step": 33991 }, { "epoch": 0.64, "learning_rate": 1.5055266135490608e-06, "loss": 1.072, "step": 33992 }, { "epoch": 0.64, "learning_rate": 1.5053864565766236e-06, "loss": 1.0687, "step": 33993 }, { "epoch": 0.64, "learning_rate": 1.5052463033180418e-06, "loss": 0.9279, "step": 33994 }, { "epoch": 0.64, "learning_rate": 1.5051061537738397e-06, "loss": 0.83, "step": 33995 }, { "epoch": 0.64, "learning_rate": 1.504966007944542e-06, "loss": 0.7949, "step": 33996 }, { "epoch": 0.64, "learning_rate": 1.5048258658306692e-06, "loss": 0.7827, "step": 33997 }, { "epoch": 0.64, "learning_rate": 1.5046857274327476e-06, "loss": 0.9168, "step": 33998 }, { "epoch": 0.64, "learning_rate": 1.5045455927512987e-06, "loss": 0.9397, "step": 33999 }, { "epoch": 0.64, "learning_rate": 1.5044054617868449e-06, "loss": 1.2145, "step": 34000 }, { "epoch": 0.64, "learning_rate": 1.5042653345399117e-06, "loss": 1.0339, "step": 34001 }, { "epoch": 0.64, "learning_rate": 1.5041252110110205e-06, "loss": 0.8885, "step": 34002 }, { "epoch": 0.64, "learning_rate": 1.5039850912006949e-06, "loss": 0.9009, "step": 34003 }, { "epoch": 0.64, "learning_rate": 1.5038449751094592e-06, "loss": 0.7671, "step": 34004 }, { "epoch": 0.64, "learning_rate": 1.5037048627378362e-06, "loss": 0.9173, "step": 34005 }, { "epoch": 0.64, "learning_rate": 1.5035647540863473e-06, "loss": 1.0244, "step": 34006 }, { "epoch": 0.64, "learning_rate": 1.5034246491555185e-06, "loss": 0.8992, "step": 34007 }, { "epoch": 0.64, "learning_rate": 1.5032845479458707e-06, "loss": 0.8264, "step": 34008 }, { "epoch": 0.64, "learning_rate": 1.503144450457928e-06, "loss": 0.6455, "step": 34009 }, { "epoch": 0.64, "learning_rate": 1.5030043566922133e-06, "loss": 0.9332, "step": 34010 }, { "epoch": 0.64, "learning_rate": 1.5028642666492503e-06, "loss": 0.8423, "step": 34011 }, { "epoch": 0.64, "learning_rate": 1.5027241803295605e-06, "loss": 1.0769, "step": 34012 }, { "epoch": 0.64, "learning_rate": 1.5025840977336693e-06, "loss": 0.7945, "step": 34013 }, { "epoch": 0.64, "learning_rate": 1.502444018862098e-06, "loss": 0.9914, "step": 34014 }, { "epoch": 0.64, "learning_rate": 1.5023039437153695e-06, "loss": 0.8024, "step": 34015 }, { "epoch": 0.64, "learning_rate": 1.502163872294008e-06, "loss": 1.1057, "step": 34016 }, { "epoch": 0.64, "learning_rate": 1.5020238045985363e-06, "loss": 0.8434, "step": 34017 }, { "epoch": 0.64, "learning_rate": 1.5018837406294762e-06, "loss": 1.0989, "step": 34018 }, { "epoch": 0.64, "learning_rate": 1.5017436803873526e-06, "loss": 1.1777, "step": 34019 }, { "epoch": 0.64, "learning_rate": 1.5016036238726875e-06, "loss": 0.815, "step": 34020 }, { "epoch": 0.64, "learning_rate": 1.5014635710860029e-06, "loss": 1.031, "step": 34021 }, { "epoch": 0.64, "learning_rate": 1.5013235220278235e-06, "loss": 0.7811, "step": 34022 }, { "epoch": 0.64, "learning_rate": 1.501183476698671e-06, "loss": 0.7235, "step": 34023 }, { "epoch": 0.64, "learning_rate": 1.5010434350990688e-06, "loss": 0.8821, "step": 34024 }, { "epoch": 0.64, "learning_rate": 1.50090339722954e-06, "loss": 1.1395, "step": 34025 }, { "epoch": 0.64, "learning_rate": 1.5007633630906076e-06, "loss": 1.0408, "step": 34026 }, { "epoch": 0.64, "learning_rate": 1.5006233326827935e-06, "loss": 1.0125, "step": 34027 }, { "epoch": 0.64, "learning_rate": 1.500483306006622e-06, "loss": 0.7784, "step": 34028 }, { "epoch": 0.64, "learning_rate": 1.5003432830626146e-06, "loss": 0.7745, "step": 34029 }, { "epoch": 0.64, "learning_rate": 1.5002032638512947e-06, "loss": 0.9007, "step": 34030 }, { "epoch": 0.64, "learning_rate": 1.5000632483731853e-06, "loss": 1.0707, "step": 34031 }, { "epoch": 0.64, "learning_rate": 1.4999232366288098e-06, "loss": 1.0417, "step": 34032 }, { "epoch": 0.64, "learning_rate": 1.4997832286186887e-06, "loss": 0.7487, "step": 34033 }, { "epoch": 0.64, "learning_rate": 1.4996432243433477e-06, "loss": 0.91, "step": 34034 }, { "epoch": 0.64, "learning_rate": 1.499503223803308e-06, "loss": 0.868, "step": 34035 }, { "epoch": 0.64, "learning_rate": 1.4993632269990919e-06, "loss": 1.0386, "step": 34036 }, { "epoch": 0.64, "learning_rate": 1.499223233931223e-06, "loss": 1.124, "step": 34037 }, { "epoch": 0.64, "learning_rate": 1.4990832446002247e-06, "loss": 0.9124, "step": 34038 }, { "epoch": 0.64, "learning_rate": 1.4989432590066177e-06, "loss": 0.9647, "step": 34039 }, { "epoch": 0.64, "learning_rate": 1.498803277150927e-06, "loss": 0.8643, "step": 34040 }, { "epoch": 0.64, "learning_rate": 1.4986632990336741e-06, "loss": 0.8833, "step": 34041 }, { "epoch": 0.64, "learning_rate": 1.4985233246553803e-06, "loss": 1.0214, "step": 34042 }, { "epoch": 0.64, "learning_rate": 1.4983833540165714e-06, "loss": 0.9006, "step": 34043 }, { "epoch": 0.64, "learning_rate": 1.4982433871177677e-06, "loss": 1.0197, "step": 34044 }, { "epoch": 0.64, "learning_rate": 1.4981034239594915e-06, "loss": 0.9436, "step": 34045 }, { "epoch": 0.64, "learning_rate": 1.497963464542268e-06, "loss": 0.9517, "step": 34046 }, { "epoch": 0.64, "learning_rate": 1.4978235088666176e-06, "loss": 0.8695, "step": 34047 }, { "epoch": 0.64, "learning_rate": 1.4976835569330628e-06, "loss": 0.9164, "step": 34048 }, { "epoch": 0.64, "learning_rate": 1.497543608742128e-06, "loss": 1.0397, "step": 34049 }, { "epoch": 0.64, "learning_rate": 1.497403664294334e-06, "loss": 1.1154, "step": 34050 }, { "epoch": 0.64, "learning_rate": 1.4972637235902041e-06, "loss": 0.88, "step": 34051 }, { "epoch": 0.64, "learning_rate": 1.4971237866302606e-06, "loss": 0.8361, "step": 34052 }, { "epoch": 0.64, "learning_rate": 1.4969838534150267e-06, "loss": 0.8779, "step": 34053 }, { "epoch": 0.64, "learning_rate": 1.4968439239450232e-06, "loss": 0.7852, "step": 34054 }, { "epoch": 0.64, "learning_rate": 1.4967039982207748e-06, "loss": 0.9699, "step": 34055 }, { "epoch": 0.64, "learning_rate": 1.496564076242803e-06, "loss": 1.1374, "step": 34056 }, { "epoch": 0.64, "learning_rate": 1.496424158011629e-06, "loss": 1.0559, "step": 34057 }, { "epoch": 0.64, "learning_rate": 1.496284243527777e-06, "loss": 0.8578, "step": 34058 }, { "epoch": 0.64, "learning_rate": 1.4961443327917694e-06, "loss": 0.8928, "step": 34059 }, { "epoch": 0.64, "learning_rate": 1.4960044258041267e-06, "loss": 0.7533, "step": 34060 }, { "epoch": 0.64, "learning_rate": 1.4958645225653742e-06, "loss": 0.8623, "step": 34061 }, { "epoch": 0.64, "learning_rate": 1.4957246230760328e-06, "loss": 0.9743, "step": 34062 }, { "epoch": 0.64, "learning_rate": 1.4955847273366237e-06, "loss": 0.981, "step": 34063 }, { "epoch": 0.64, "learning_rate": 1.4954448353476715e-06, "loss": 0.9918, "step": 34064 }, { "epoch": 0.64, "learning_rate": 1.4953049471096966e-06, "loss": 0.8248, "step": 34065 }, { "epoch": 0.64, "learning_rate": 1.4951650626232223e-06, "loss": 0.9476, "step": 34066 }, { "epoch": 0.64, "learning_rate": 1.4950251818887714e-06, "loss": 0.751, "step": 34067 }, { "epoch": 0.64, "learning_rate": 1.4948853049068656e-06, "loss": 0.9341, "step": 34068 }, { "epoch": 0.64, "learning_rate": 1.4947454316780268e-06, "loss": 1.0439, "step": 34069 }, { "epoch": 0.64, "learning_rate": 1.4946055622027783e-06, "loss": 0.858, "step": 34070 }, { "epoch": 0.64, "learning_rate": 1.4944656964816415e-06, "loss": 0.9235, "step": 34071 }, { "epoch": 0.64, "learning_rate": 1.4943258345151391e-06, "loss": 0.7404, "step": 34072 }, { "epoch": 0.64, "learning_rate": 1.4941859763037928e-06, "loss": 0.8449, "step": 34073 }, { "epoch": 0.64, "learning_rate": 1.494046121848126e-06, "loss": 1.2419, "step": 34074 }, { "epoch": 0.64, "learning_rate": 1.4939062711486591e-06, "loss": 0.9839, "step": 34075 }, { "epoch": 0.64, "learning_rate": 1.493766424205916e-06, "loss": 0.825, "step": 34076 }, { "epoch": 0.64, "learning_rate": 1.4936265810204187e-06, "loss": 0.7989, "step": 34077 }, { "epoch": 0.64, "learning_rate": 1.4934867415926876e-06, "loss": 0.7451, "step": 34078 }, { "epoch": 0.64, "learning_rate": 1.493346905923247e-06, "loss": 0.7587, "step": 34079 }, { "epoch": 0.64, "learning_rate": 1.493207074012618e-06, "loss": 0.8001, "step": 34080 }, { "epoch": 0.64, "learning_rate": 1.4930672458613226e-06, "loss": 1.0167, "step": 34081 }, { "epoch": 0.64, "learning_rate": 1.492927421469884e-06, "loss": 0.9287, "step": 34082 }, { "epoch": 0.64, "learning_rate": 1.4927876008388233e-06, "loss": 0.7957, "step": 34083 }, { "epoch": 0.64, "learning_rate": 1.4926477839686621e-06, "loss": 1.0953, "step": 34084 }, { "epoch": 0.64, "learning_rate": 1.4925079708599242e-06, "loss": 1.0245, "step": 34085 }, { "epoch": 0.64, "learning_rate": 1.49236816151313e-06, "loss": 0.8732, "step": 34086 }, { "epoch": 0.64, "learning_rate": 1.4922283559288016e-06, "loss": 1.0668, "step": 34087 }, { "epoch": 0.64, "learning_rate": 1.4920885541074631e-06, "loss": 0.8494, "step": 34088 }, { "epoch": 0.64, "learning_rate": 1.4919487560496345e-06, "loss": 0.8899, "step": 34089 }, { "epoch": 0.64, "learning_rate": 1.4918089617558376e-06, "loss": 0.9259, "step": 34090 }, { "epoch": 0.64, "learning_rate": 1.4916691712265963e-06, "loss": 0.9766, "step": 34091 }, { "epoch": 0.64, "learning_rate": 1.4915293844624303e-06, "loss": 0.8265, "step": 34092 }, { "epoch": 0.64, "learning_rate": 1.491389601463863e-06, "loss": 1.2689, "step": 34093 }, { "epoch": 0.64, "learning_rate": 1.491249822231416e-06, "loss": 1.0659, "step": 34094 }, { "epoch": 0.64, "learning_rate": 1.491110046765612e-06, "loss": 0.8371, "step": 34095 }, { "epoch": 0.64, "learning_rate": 1.4909702750669707e-06, "loss": 0.9275, "step": 34096 }, { "epoch": 0.64, "learning_rate": 1.4908305071360168e-06, "loss": 0.9918, "step": 34097 }, { "epoch": 0.64, "learning_rate": 1.4906907429732708e-06, "loss": 0.717, "step": 34098 }, { "epoch": 0.64, "learning_rate": 1.4905509825792535e-06, "loss": 1.0785, "step": 34099 }, { "epoch": 0.64, "learning_rate": 1.4904112259544883e-06, "loss": 0.9473, "step": 34100 }, { "epoch": 0.64, "learning_rate": 1.4902714730994975e-06, "loss": 1.0854, "step": 34101 }, { "epoch": 0.64, "learning_rate": 1.4901317240148007e-06, "loss": 0.929, "step": 34102 }, { "epoch": 0.64, "learning_rate": 1.4899919787009221e-06, "loss": 0.9111, "step": 34103 }, { "epoch": 0.64, "learning_rate": 1.4898522371583826e-06, "loss": 0.7413, "step": 34104 }, { "epoch": 0.64, "learning_rate": 1.4897124993877027e-06, "loss": 0.8893, "step": 34105 }, { "epoch": 0.64, "learning_rate": 1.4895727653894066e-06, "loss": 1.0246, "step": 34106 }, { "epoch": 0.64, "learning_rate": 1.4894330351640143e-06, "loss": 0.9384, "step": 34107 }, { "epoch": 0.64, "learning_rate": 1.4892933087120476e-06, "loss": 0.8176, "step": 34108 }, { "epoch": 0.64, "learning_rate": 1.4891535860340294e-06, "loss": 0.9473, "step": 34109 }, { "epoch": 0.64, "learning_rate": 1.489013867130481e-06, "loss": 0.9295, "step": 34110 }, { "epoch": 0.64, "learning_rate": 1.4888741520019226e-06, "loss": 1.1636, "step": 34111 }, { "epoch": 0.64, "learning_rate": 1.4887344406488783e-06, "loss": 0.9343, "step": 34112 }, { "epoch": 0.64, "learning_rate": 1.488594733071868e-06, "loss": 0.9871, "step": 34113 }, { "epoch": 0.64, "learning_rate": 1.488455029271414e-06, "loss": 0.9148, "step": 34114 }, { "epoch": 0.64, "learning_rate": 1.488315329248038e-06, "loss": 0.9044, "step": 34115 }, { "epoch": 0.64, "learning_rate": 1.4881756330022618e-06, "loss": 0.9511, "step": 34116 }, { "epoch": 0.64, "learning_rate": 1.4880359405346056e-06, "loss": 1.0266, "step": 34117 }, { "epoch": 0.64, "learning_rate": 1.4878962518455937e-06, "loss": 0.9332, "step": 34118 }, { "epoch": 0.64, "learning_rate": 1.4877565669357458e-06, "loss": 1.0884, "step": 34119 }, { "epoch": 0.64, "learning_rate": 1.4876168858055829e-06, "loss": 0.8326, "step": 34120 }, { "epoch": 0.64, "learning_rate": 1.4874772084556282e-06, "loss": 0.849, "step": 34121 }, { "epoch": 0.64, "learning_rate": 1.4873375348864028e-06, "loss": 0.964, "step": 34122 }, { "epoch": 0.64, "learning_rate": 1.487197865098427e-06, "loss": 0.8568, "step": 34123 }, { "epoch": 0.64, "learning_rate": 1.4870581990922245e-06, "loss": 1.003, "step": 34124 }, { "epoch": 0.64, "learning_rate": 1.486918536868316e-06, "loss": 0.9444, "step": 34125 }, { "epoch": 0.64, "learning_rate": 1.4867788784272207e-06, "loss": 1.0075, "step": 34126 }, { "epoch": 0.64, "learning_rate": 1.4866392237694638e-06, "loss": 0.9821, "step": 34127 }, { "epoch": 0.64, "learning_rate": 1.486499572895564e-06, "loss": 0.7668, "step": 34128 }, { "epoch": 0.64, "learning_rate": 1.4863599258060434e-06, "loss": 0.7942, "step": 34129 }, { "epoch": 0.64, "learning_rate": 1.4862202825014248e-06, "loss": 0.9169, "step": 34130 }, { "epoch": 0.64, "learning_rate": 1.4860806429822282e-06, "loss": 1.0056, "step": 34131 }, { "epoch": 0.64, "learning_rate": 1.485941007248975e-06, "loss": 1.0788, "step": 34132 }, { "epoch": 0.64, "learning_rate": 1.4858013753021877e-06, "loss": 0.7473, "step": 34133 }, { "epoch": 0.64, "learning_rate": 1.4856617471423865e-06, "loss": 0.9274, "step": 34134 }, { "epoch": 0.64, "learning_rate": 1.4855221227700931e-06, "loss": 0.6339, "step": 34135 }, { "epoch": 0.64, "learning_rate": 1.4853825021858293e-06, "loss": 0.8998, "step": 34136 }, { "epoch": 0.64, "learning_rate": 1.4852428853901163e-06, "loss": 1.0099, "step": 34137 }, { "epoch": 0.64, "learning_rate": 1.4851032723834742e-06, "loss": 0.9797, "step": 34138 }, { "epoch": 0.64, "learning_rate": 1.4849636631664265e-06, "loss": 1.1061, "step": 34139 }, { "epoch": 0.64, "learning_rate": 1.4848240577394935e-06, "loss": 0.9031, "step": 34140 }, { "epoch": 0.64, "learning_rate": 1.4846844561031954e-06, "loss": 0.7635, "step": 34141 }, { "epoch": 0.64, "learning_rate": 1.4845448582580545e-06, "loss": 0.9347, "step": 34142 }, { "epoch": 0.64, "learning_rate": 1.4844052642045927e-06, "loss": 0.9253, "step": 34143 }, { "epoch": 0.64, "learning_rate": 1.4842656739433298e-06, "loss": 1.082, "step": 34144 }, { "epoch": 0.64, "learning_rate": 1.4841260874747882e-06, "loss": 1.058, "step": 34145 }, { "epoch": 0.64, "learning_rate": 1.4839865047994888e-06, "loss": 0.9391, "step": 34146 }, { "epoch": 0.64, "learning_rate": 1.483846925917952e-06, "loss": 0.8804, "step": 34147 }, { "epoch": 0.64, "learning_rate": 1.4837073508307003e-06, "loss": 0.8846, "step": 34148 }, { "epoch": 0.64, "learning_rate": 1.4835677795382536e-06, "loss": 1.0227, "step": 34149 }, { "epoch": 0.64, "learning_rate": 1.4834282120411333e-06, "loss": 1.0084, "step": 34150 }, { "epoch": 0.64, "learning_rate": 1.483288648339862e-06, "loss": 0.9174, "step": 34151 }, { "epoch": 0.64, "learning_rate": 1.4831490884349597e-06, "loss": 0.8589, "step": 34152 }, { "epoch": 0.64, "learning_rate": 1.4830095323269461e-06, "loss": 0.8764, "step": 34153 }, { "epoch": 0.64, "learning_rate": 1.4828699800163454e-06, "loss": 0.7237, "step": 34154 }, { "epoch": 0.64, "learning_rate": 1.482730431503676e-06, "loss": 0.8083, "step": 34155 }, { "epoch": 0.64, "learning_rate": 1.48259088678946e-06, "loss": 0.9675, "step": 34156 }, { "epoch": 0.64, "learning_rate": 1.4824513458742185e-06, "loss": 0.6773, "step": 34157 }, { "epoch": 0.64, "learning_rate": 1.4823118087584731e-06, "loss": 0.7657, "step": 34158 }, { "epoch": 0.64, "learning_rate": 1.4821722754427432e-06, "loss": 0.7723, "step": 34159 }, { "epoch": 0.64, "learning_rate": 1.482032745927552e-06, "loss": 0.8474, "step": 34160 }, { "epoch": 0.64, "learning_rate": 1.481893220213419e-06, "loss": 0.8307, "step": 34161 }, { "epoch": 0.64, "learning_rate": 1.4817536983008645e-06, "loss": 1.0248, "step": 34162 }, { "epoch": 0.64, "learning_rate": 1.481614180190411e-06, "loss": 0.8718, "step": 34163 }, { "epoch": 0.64, "learning_rate": 1.4814746658825796e-06, "loss": 0.952, "step": 34164 }, { "epoch": 0.64, "learning_rate": 1.4813351553778894e-06, "loss": 1.0341, "step": 34165 }, { "epoch": 0.64, "learning_rate": 1.4811956486768636e-06, "loss": 0.8755, "step": 34166 }, { "epoch": 0.64, "learning_rate": 1.4810561457800218e-06, "loss": 0.899, "step": 34167 }, { "epoch": 0.64, "learning_rate": 1.4809166466878845e-06, "loss": 1.1837, "step": 34168 }, { "epoch": 0.64, "learning_rate": 1.4807771514009738e-06, "loss": 0.9386, "step": 34169 }, { "epoch": 0.64, "learning_rate": 1.4806376599198096e-06, "loss": 0.8453, "step": 34170 }, { "epoch": 0.64, "learning_rate": 1.4804981722449124e-06, "loss": 0.8125, "step": 34171 }, { "epoch": 0.64, "learning_rate": 1.480358688376805e-06, "loss": 0.8098, "step": 34172 }, { "epoch": 0.64, "learning_rate": 1.4802192083160073e-06, "loss": 0.8621, "step": 34173 }, { "epoch": 0.64, "learning_rate": 1.4800797320630383e-06, "loss": 1.1319, "step": 34174 }, { "epoch": 0.64, "learning_rate": 1.4799402596184215e-06, "loss": 1.1447, "step": 34175 }, { "epoch": 0.64, "learning_rate": 1.479800790982676e-06, "loss": 0.8449, "step": 34176 }, { "epoch": 0.64, "learning_rate": 1.479661326156323e-06, "loss": 0.7876, "step": 34177 }, { "epoch": 0.64, "learning_rate": 1.4795218651398835e-06, "loss": 0.9702, "step": 34178 }, { "epoch": 0.64, "learning_rate": 1.4793824079338786e-06, "loss": 0.6908, "step": 34179 }, { "epoch": 0.64, "learning_rate": 1.4792429545388272e-06, "loss": 1.0158, "step": 34180 }, { "epoch": 0.64, "learning_rate": 1.4791035049552526e-06, "loss": 1.1049, "step": 34181 }, { "epoch": 0.64, "learning_rate": 1.4789640591836741e-06, "loss": 0.9583, "step": 34182 }, { "epoch": 0.64, "learning_rate": 1.4788246172246115e-06, "loss": 0.755, "step": 34183 }, { "epoch": 0.64, "learning_rate": 1.478685179078587e-06, "loss": 0.8737, "step": 34184 }, { "epoch": 0.64, "learning_rate": 1.478545744746121e-06, "loss": 0.8115, "step": 34185 }, { "epoch": 0.64, "learning_rate": 1.4784063142277332e-06, "loss": 0.9028, "step": 34186 }, { "epoch": 0.65, "learning_rate": 1.478266887523946e-06, "loss": 1.0603, "step": 34187 }, { "epoch": 0.65, "learning_rate": 1.4781274646352783e-06, "loss": 0.8233, "step": 34188 }, { "epoch": 0.65, "learning_rate": 1.4779880455622507e-06, "loss": 0.8694, "step": 34189 }, { "epoch": 0.65, "learning_rate": 1.4778486303053857e-06, "loss": 1.0147, "step": 34190 }, { "epoch": 0.65, "learning_rate": 1.4777092188652014e-06, "loss": 0.9198, "step": 34191 }, { "epoch": 0.65, "learning_rate": 1.4775698112422204e-06, "loss": 0.8232, "step": 34192 }, { "epoch": 0.65, "learning_rate": 1.4774304074369615e-06, "loss": 0.7947, "step": 34193 }, { "epoch": 0.65, "learning_rate": 1.477291007449947e-06, "loss": 1.0324, "step": 34194 }, { "epoch": 0.65, "learning_rate": 1.4771516112816964e-06, "loss": 0.9506, "step": 34195 }, { "epoch": 0.65, "learning_rate": 1.4770122189327297e-06, "loss": 0.9852, "step": 34196 }, { "epoch": 0.65, "learning_rate": 1.4768728304035681e-06, "loss": 0.741, "step": 34197 }, { "epoch": 0.65, "learning_rate": 1.4767334456947327e-06, "loss": 0.7868, "step": 34198 }, { "epoch": 0.65, "learning_rate": 1.4765940648067424e-06, "loss": 1.0264, "step": 34199 }, { "epoch": 0.65, "learning_rate": 1.476454687740119e-06, "loss": 1.1116, "step": 34200 }, { "epoch": 0.65, "learning_rate": 1.4763153144953826e-06, "loss": 0.9142, "step": 34201 }, { "epoch": 0.65, "learning_rate": 1.4761759450730522e-06, "loss": 0.9106, "step": 34202 }, { "epoch": 0.65, "learning_rate": 1.4760365794736508e-06, "loss": 0.9539, "step": 34203 }, { "epoch": 0.65, "learning_rate": 1.4758972176976971e-06, "loss": 0.8805, "step": 34204 }, { "epoch": 0.65, "learning_rate": 1.475757859745711e-06, "loss": 0.8736, "step": 34205 }, { "epoch": 0.65, "learning_rate": 1.4756185056182146e-06, "loss": 1.0083, "step": 34206 }, { "epoch": 0.65, "learning_rate": 1.475479155315727e-06, "loss": 1.0149, "step": 34207 }, { "epoch": 0.65, "learning_rate": 1.4753398088387685e-06, "loss": 0.9659, "step": 34208 }, { "epoch": 0.65, "learning_rate": 1.4752004661878605e-06, "loss": 0.9086, "step": 34209 }, { "epoch": 0.65, "learning_rate": 1.4750611273635218e-06, "loss": 0.8808, "step": 34210 }, { "epoch": 0.65, "learning_rate": 1.4749217923662737e-06, "loss": 0.8426, "step": 34211 }, { "epoch": 0.65, "learning_rate": 1.474782461196636e-06, "loss": 0.8727, "step": 34212 }, { "epoch": 0.65, "learning_rate": 1.4746431338551299e-06, "loss": 0.8989, "step": 34213 }, { "epoch": 0.65, "learning_rate": 1.4745038103422738e-06, "loss": 0.9008, "step": 34214 }, { "epoch": 0.65, "learning_rate": 1.4743644906585897e-06, "loss": 0.9194, "step": 34215 }, { "epoch": 0.65, "learning_rate": 1.4742251748045975e-06, "loss": 0.8212, "step": 34216 }, { "epoch": 0.65, "learning_rate": 1.4740858627808157e-06, "loss": 0.7968, "step": 34217 }, { "epoch": 0.65, "learning_rate": 1.4739465545877668e-06, "loss": 1.1747, "step": 34218 }, { "epoch": 0.65, "learning_rate": 1.4738072502259704e-06, "loss": 0.8907, "step": 34219 }, { "epoch": 0.65, "learning_rate": 1.473667949695945e-06, "loss": 0.8205, "step": 34220 }, { "epoch": 0.65, "learning_rate": 1.4735286529982132e-06, "loss": 0.7193, "step": 34221 }, { "epoch": 0.65, "learning_rate": 1.4733893601332939e-06, "loss": 1.035, "step": 34222 }, { "epoch": 0.65, "learning_rate": 1.4732500711017062e-06, "loss": 0.8804, "step": 34223 }, { "epoch": 0.65, "learning_rate": 1.4731107859039722e-06, "loss": 1.0874, "step": 34224 }, { "epoch": 0.65, "learning_rate": 1.4729715045406106e-06, "loss": 0.896, "step": 34225 }, { "epoch": 0.65, "learning_rate": 1.4728322270121414e-06, "loss": 0.9032, "step": 34226 }, { "epoch": 0.65, "learning_rate": 1.4726929533190865e-06, "loss": 1.0037, "step": 34227 }, { "epoch": 0.65, "learning_rate": 1.472553683461964e-06, "loss": 0.8404, "step": 34228 }, { "epoch": 0.65, "learning_rate": 1.4724144174412942e-06, "loss": 0.7798, "step": 34229 }, { "epoch": 0.65, "learning_rate": 1.472275155257598e-06, "loss": 0.8989, "step": 34230 }, { "epoch": 0.65, "learning_rate": 1.4721358969113948e-06, "loss": 1.1094, "step": 34231 }, { "epoch": 0.65, "learning_rate": 1.4719966424032041e-06, "loss": 1.0818, "step": 34232 }, { "epoch": 0.65, "learning_rate": 1.4718573917335468e-06, "loss": 0.8576, "step": 34233 }, { "epoch": 0.65, "learning_rate": 1.4717181449029428e-06, "loss": 0.9036, "step": 34234 }, { "epoch": 0.65, "learning_rate": 1.4715789019119108e-06, "loss": 0.8638, "step": 34235 }, { "epoch": 0.65, "learning_rate": 1.4714396627609728e-06, "loss": 0.8197, "step": 34236 }, { "epoch": 0.65, "learning_rate": 1.4713004274506471e-06, "loss": 1.1212, "step": 34237 }, { "epoch": 0.65, "learning_rate": 1.4711611959814534e-06, "loss": 0.9963, "step": 34238 }, { "epoch": 0.65, "learning_rate": 1.4710219683539129e-06, "loss": 0.9698, "step": 34239 }, { "epoch": 0.65, "learning_rate": 1.4708827445685447e-06, "loss": 0.9569, "step": 34240 }, { "epoch": 0.65, "learning_rate": 1.4707435246258683e-06, "loss": 0.967, "step": 34241 }, { "epoch": 0.65, "learning_rate": 1.4706043085264048e-06, "loss": 0.9086, "step": 34242 }, { "epoch": 0.65, "learning_rate": 1.4704650962706736e-06, "loss": 0.9571, "step": 34243 }, { "epoch": 0.65, "learning_rate": 1.470325887859193e-06, "loss": 0.858, "step": 34244 }, { "epoch": 0.65, "learning_rate": 1.470186683292485e-06, "loss": 0.9407, "step": 34245 }, { "epoch": 0.65, "learning_rate": 1.4700474825710675e-06, "loss": 0.8302, "step": 34246 }, { "epoch": 0.65, "learning_rate": 1.469908285695461e-06, "loss": 0.6838, "step": 34247 }, { "epoch": 0.65, "learning_rate": 1.4697690926661861e-06, "loss": 0.8618, "step": 34248 }, { "epoch": 0.65, "learning_rate": 1.469629903483762e-06, "loss": 1.1409, "step": 34249 }, { "epoch": 0.65, "learning_rate": 1.4694907181487073e-06, "loss": 1.0823, "step": 34250 }, { "epoch": 0.65, "learning_rate": 1.4693515366615436e-06, "loss": 0.8914, "step": 34251 }, { "epoch": 0.65, "learning_rate": 1.469212359022789e-06, "loss": 0.9377, "step": 34252 }, { "epoch": 0.65, "learning_rate": 1.469073185232964e-06, "loss": 0.9805, "step": 34253 }, { "epoch": 0.65, "learning_rate": 1.468934015292588e-06, "loss": 0.8912, "step": 34254 }, { "epoch": 0.65, "learning_rate": 1.4687948492021813e-06, "loss": 0.8603, "step": 34255 }, { "epoch": 0.65, "learning_rate": 1.4686556869622622e-06, "loss": 1.1343, "step": 34256 }, { "epoch": 0.65, "learning_rate": 1.4685165285733522e-06, "loss": 0.8676, "step": 34257 }, { "epoch": 0.65, "learning_rate": 1.4683773740359698e-06, "loss": 0.9302, "step": 34258 }, { "epoch": 0.65, "learning_rate": 1.4682382233506331e-06, "loss": 0.918, "step": 34259 }, { "epoch": 0.65, "learning_rate": 1.4680990765178643e-06, "loss": 0.8512, "step": 34260 }, { "epoch": 0.65, "learning_rate": 1.4679599335381823e-06, "loss": 0.861, "step": 34261 }, { "epoch": 0.65, "learning_rate": 1.4678207944121052e-06, "loss": 1.0165, "step": 34262 }, { "epoch": 0.65, "learning_rate": 1.467681659140155e-06, "loss": 1.029, "step": 34263 }, { "epoch": 0.65, "learning_rate": 1.4675425277228494e-06, "loss": 1.0018, "step": 34264 }, { "epoch": 0.65, "learning_rate": 1.4674034001607073e-06, "loss": 0.8116, "step": 34265 }, { "epoch": 0.65, "learning_rate": 1.4672642764542506e-06, "loss": 1.0945, "step": 34266 }, { "epoch": 0.65, "learning_rate": 1.4671251566039964e-06, "loss": 0.8336, "step": 34267 }, { "epoch": 0.65, "learning_rate": 1.4669860406104652e-06, "loss": 0.919, "step": 34268 }, { "epoch": 0.65, "learning_rate": 1.4668469284741772e-06, "loss": 0.8668, "step": 34269 }, { "epoch": 0.65, "learning_rate": 1.4667078201956511e-06, "loss": 0.7758, "step": 34270 }, { "epoch": 0.65, "learning_rate": 1.4665687157754055e-06, "loss": 0.7059, "step": 34271 }, { "epoch": 0.65, "learning_rate": 1.4664296152139612e-06, "loss": 0.7588, "step": 34272 }, { "epoch": 0.65, "learning_rate": 1.466290518511837e-06, "loss": 0.7185, "step": 34273 }, { "epoch": 0.65, "learning_rate": 1.466151425669552e-06, "loss": 0.9316, "step": 34274 }, { "epoch": 0.65, "learning_rate": 1.466012336687626e-06, "loss": 0.8554, "step": 34275 }, { "epoch": 0.65, "learning_rate": 1.465873251566579e-06, "loss": 1.0331, "step": 34276 }, { "epoch": 0.65, "learning_rate": 1.4657341703069284e-06, "loss": 0.7126, "step": 34277 }, { "epoch": 0.65, "learning_rate": 1.4655950929091956e-06, "loss": 0.8361, "step": 34278 }, { "epoch": 0.65, "learning_rate": 1.4654560193738988e-06, "loss": 0.7358, "step": 34279 }, { "epoch": 0.65, "learning_rate": 1.4653169497015569e-06, "loss": 0.7753, "step": 34280 }, { "epoch": 0.65, "learning_rate": 1.46517788389269e-06, "loss": 1.1509, "step": 34281 }, { "epoch": 0.65, "learning_rate": 1.4650388219478179e-06, "loss": 0.8044, "step": 34282 }, { "epoch": 0.65, "learning_rate": 1.4648997638674577e-06, "loss": 0.9976, "step": 34283 }, { "epoch": 0.65, "learning_rate": 1.4647607096521315e-06, "loss": 0.944, "step": 34284 }, { "epoch": 0.65, "learning_rate": 1.464621659302357e-06, "loss": 0.7072, "step": 34285 }, { "epoch": 0.65, "learning_rate": 1.4644826128186524e-06, "loss": 0.8274, "step": 34286 }, { "epoch": 0.65, "learning_rate": 1.4643435702015385e-06, "loss": 1.0245, "step": 34287 }, { "epoch": 0.65, "learning_rate": 1.4642045314515341e-06, "loss": 1.0894, "step": 34288 }, { "epoch": 0.65, "learning_rate": 1.4640654965691575e-06, "loss": 0.9933, "step": 34289 }, { "epoch": 0.65, "learning_rate": 1.4639264655549297e-06, "loss": 1.0056, "step": 34290 }, { "epoch": 0.65, "learning_rate": 1.4637874384093687e-06, "loss": 0.905, "step": 34291 }, { "epoch": 0.65, "learning_rate": 1.4636484151329922e-06, "loss": 0.8561, "step": 34292 }, { "epoch": 0.65, "learning_rate": 1.4635093957263222e-06, "loss": 1.2664, "step": 34293 }, { "epoch": 0.65, "learning_rate": 1.4633703801898757e-06, "loss": 0.9088, "step": 34294 }, { "epoch": 0.65, "learning_rate": 1.4632313685241723e-06, "loss": 1.0301, "step": 34295 }, { "epoch": 0.65, "learning_rate": 1.4630923607297314e-06, "loss": 0.8193, "step": 34296 }, { "epoch": 0.65, "learning_rate": 1.4629533568070723e-06, "loss": 0.9003, "step": 34297 }, { "epoch": 0.65, "learning_rate": 1.4628143567567123e-06, "loss": 0.7501, "step": 34298 }, { "epoch": 0.65, "learning_rate": 1.4626753605791734e-06, "loss": 0.8779, "step": 34299 }, { "epoch": 0.65, "learning_rate": 1.462536368274972e-06, "loss": 1.0715, "step": 34300 }, { "epoch": 0.65, "learning_rate": 1.4623973798446273e-06, "loss": 1.1544, "step": 34301 }, { "epoch": 0.65, "learning_rate": 1.4622583952886598e-06, "loss": 0.8618, "step": 34302 }, { "epoch": 0.65, "learning_rate": 1.4621194146075878e-06, "loss": 0.8125, "step": 34303 }, { "epoch": 0.65, "learning_rate": 1.4619804378019293e-06, "loss": 0.8833, "step": 34304 }, { "epoch": 0.65, "learning_rate": 1.4618414648722046e-06, "loss": 0.7937, "step": 34305 }, { "epoch": 0.65, "learning_rate": 1.4617024958189324e-06, "loss": 1.0804, "step": 34306 }, { "epoch": 0.65, "learning_rate": 1.46156353064263e-06, "loss": 0.7548, "step": 34307 }, { "epoch": 0.65, "learning_rate": 1.461424569343819e-06, "loss": 0.9603, "step": 34308 }, { "epoch": 0.65, "learning_rate": 1.4612856119230161e-06, "loss": 0.8777, "step": 34309 }, { "epoch": 0.65, "learning_rate": 1.4611466583807404e-06, "loss": 0.8929, "step": 34310 }, { "epoch": 0.65, "learning_rate": 1.461007708717512e-06, "loss": 1.0898, "step": 34311 }, { "epoch": 0.65, "learning_rate": 1.4608687629338492e-06, "loss": 1.031, "step": 34312 }, { "epoch": 0.65, "learning_rate": 1.4607298210302695e-06, "loss": 0.9628, "step": 34313 }, { "epoch": 0.65, "learning_rate": 1.4605908830072935e-06, "loss": 0.9085, "step": 34314 }, { "epoch": 0.65, "learning_rate": 1.4604519488654392e-06, "loss": 0.8602, "step": 34315 }, { "epoch": 0.65, "learning_rate": 1.4603130186052254e-06, "loss": 0.8224, "step": 34316 }, { "epoch": 0.65, "learning_rate": 1.4601740922271707e-06, "loss": 0.6874, "step": 34317 }, { "epoch": 0.65, "learning_rate": 1.4600351697317947e-06, "loss": 0.9913, "step": 34318 }, { "epoch": 0.65, "learning_rate": 1.4598962511196144e-06, "loss": 0.8132, "step": 34319 }, { "epoch": 0.65, "learning_rate": 1.4597573363911505e-06, "loss": 0.9653, "step": 34320 }, { "epoch": 0.65, "learning_rate": 1.4596184255469203e-06, "loss": 0.8122, "step": 34321 }, { "epoch": 0.65, "learning_rate": 1.4594795185874434e-06, "loss": 0.9078, "step": 34322 }, { "epoch": 0.65, "learning_rate": 1.4593406155132378e-06, "loss": 0.8072, "step": 34323 }, { "epoch": 0.65, "learning_rate": 1.4592017163248234e-06, "loss": 1.1596, "step": 34324 }, { "epoch": 0.65, "learning_rate": 1.459062821022716e-06, "loss": 1.0978, "step": 34325 }, { "epoch": 0.65, "learning_rate": 1.458923929607437e-06, "loss": 0.8451, "step": 34326 }, { "epoch": 0.65, "learning_rate": 1.4587850420795051e-06, "loss": 0.8856, "step": 34327 }, { "epoch": 0.65, "learning_rate": 1.4586461584394363e-06, "loss": 1.0355, "step": 34328 }, { "epoch": 0.65, "learning_rate": 1.4585072786877525e-06, "loss": 0.7368, "step": 34329 }, { "epoch": 0.65, "learning_rate": 1.4583684028249695e-06, "loss": 0.9506, "step": 34330 }, { "epoch": 0.65, "learning_rate": 1.458229530851607e-06, "loss": 1.0712, "step": 34331 }, { "epoch": 0.65, "learning_rate": 1.4580906627681838e-06, "loss": 0.8956, "step": 34332 }, { "epoch": 0.65, "learning_rate": 1.4579517985752179e-06, "loss": 0.7434, "step": 34333 }, { "epoch": 0.65, "learning_rate": 1.4578129382732278e-06, "loss": 0.8221, "step": 34334 }, { "epoch": 0.65, "learning_rate": 1.4576740818627326e-06, "loss": 0.7525, "step": 34335 }, { "epoch": 0.65, "learning_rate": 1.4575352293442514e-06, "loss": 1.0511, "step": 34336 }, { "epoch": 0.65, "learning_rate": 1.4573963807182994e-06, "loss": 1.2012, "step": 34337 }, { "epoch": 0.65, "learning_rate": 1.4572575359853996e-06, "loss": 0.9862, "step": 34338 }, { "epoch": 0.65, "learning_rate": 1.457118695146067e-06, "loss": 1.0963, "step": 34339 }, { "epoch": 0.65, "learning_rate": 1.4569798582008213e-06, "loss": 0.8559, "step": 34340 }, { "epoch": 0.65, "learning_rate": 1.4568410251501809e-06, "loss": 0.8264, "step": 34341 }, { "epoch": 0.65, "learning_rate": 1.456702195994664e-06, "loss": 0.8261, "step": 34342 }, { "epoch": 0.65, "learning_rate": 1.4565633707347893e-06, "loss": 1.1913, "step": 34343 }, { "epoch": 0.65, "learning_rate": 1.456424549371075e-06, "loss": 1.1675, "step": 34344 }, { "epoch": 0.65, "learning_rate": 1.4562857319040401e-06, "loss": 0.952, "step": 34345 }, { "epoch": 0.65, "learning_rate": 1.4561469183342003e-06, "loss": 0.9489, "step": 34346 }, { "epoch": 0.65, "learning_rate": 1.456008108662077e-06, "loss": 0.8386, "step": 34347 }, { "epoch": 0.65, "learning_rate": 1.4558693028881887e-06, "loss": 0.7786, "step": 34348 }, { "epoch": 0.65, "learning_rate": 1.4557305010130501e-06, "loss": 0.9454, "step": 34349 }, { "epoch": 0.65, "learning_rate": 1.455591703037184e-06, "loss": 1.1271, "step": 34350 }, { "epoch": 0.65, "learning_rate": 1.4554529089611053e-06, "loss": 0.7762, "step": 34351 }, { "epoch": 0.65, "learning_rate": 1.4553141187853334e-06, "loss": 0.9085, "step": 34352 }, { "epoch": 0.65, "learning_rate": 1.4551753325103868e-06, "loss": 0.7724, "step": 34353 }, { "epoch": 0.65, "learning_rate": 1.455036550136783e-06, "loss": 1.0394, "step": 34354 }, { "epoch": 0.65, "learning_rate": 1.4548977716650412e-06, "loss": 0.8931, "step": 34355 }, { "epoch": 0.65, "learning_rate": 1.4547589970956788e-06, "loss": 1.1613, "step": 34356 }, { "epoch": 0.65, "learning_rate": 1.4546202264292152e-06, "loss": 0.932, "step": 34357 }, { "epoch": 0.65, "learning_rate": 1.4544814596661658e-06, "loss": 0.8859, "step": 34358 }, { "epoch": 0.65, "learning_rate": 1.4543426968070522e-06, "loss": 0.9344, "step": 34359 }, { "epoch": 0.65, "learning_rate": 1.4542039378523904e-06, "loss": 0.8741, "step": 34360 }, { "epoch": 0.65, "learning_rate": 1.454065182802699e-06, "loss": 1.0029, "step": 34361 }, { "epoch": 0.65, "learning_rate": 1.453926431658496e-06, "loss": 1.0587, "step": 34362 }, { "epoch": 0.65, "learning_rate": 1.4537876844202994e-06, "loss": 0.976, "step": 34363 }, { "epoch": 0.65, "learning_rate": 1.453648941088628e-06, "loss": 0.8624, "step": 34364 }, { "epoch": 0.65, "learning_rate": 1.453510201663999e-06, "loss": 0.7721, "step": 34365 }, { "epoch": 0.65, "learning_rate": 1.4533714661469316e-06, "loss": 0.8093, "step": 34366 }, { "epoch": 0.65, "learning_rate": 1.4532327345379416e-06, "loss": 0.8004, "step": 34367 }, { "epoch": 0.65, "learning_rate": 1.4530940068375493e-06, "loss": 1.0344, "step": 34368 }, { "epoch": 0.65, "learning_rate": 1.4529552830462728e-06, "loss": 1.0558, "step": 34369 }, { "epoch": 0.65, "learning_rate": 1.4528165631646271e-06, "loss": 0.5864, "step": 34370 }, { "epoch": 0.65, "learning_rate": 1.4526778471931344e-06, "loss": 1.0153, "step": 34371 }, { "epoch": 0.65, "learning_rate": 1.4525391351323093e-06, "loss": 1.0404, "step": 34372 }, { "epoch": 0.65, "learning_rate": 1.4524004269826714e-06, "loss": 1.0369, "step": 34373 }, { "epoch": 0.65, "learning_rate": 1.4522617227447377e-06, "loss": 0.8672, "step": 34374 }, { "epoch": 0.65, "learning_rate": 1.452123022419027e-06, "loss": 0.9533, "step": 34375 }, { "epoch": 0.65, "learning_rate": 1.4519843260060562e-06, "loss": 0.9353, "step": 34376 }, { "epoch": 0.65, "learning_rate": 1.451845633506344e-06, "loss": 0.7275, "step": 34377 }, { "epoch": 0.65, "learning_rate": 1.4517069449204097e-06, "loss": 0.9557, "step": 34378 }, { "epoch": 0.65, "learning_rate": 1.4515682602487669e-06, "loss": 0.8232, "step": 34379 }, { "epoch": 0.65, "learning_rate": 1.4514295794919381e-06, "loss": 0.7282, "step": 34380 }, { "epoch": 0.65, "learning_rate": 1.4512909026504385e-06, "loss": 1.024, "step": 34381 }, { "epoch": 0.65, "learning_rate": 1.451152229724786e-06, "loss": 0.7988, "step": 34382 }, { "epoch": 0.65, "learning_rate": 1.4510135607154993e-06, "loss": 0.8986, "step": 34383 }, { "epoch": 0.65, "learning_rate": 1.4508748956230955e-06, "loss": 0.8254, "step": 34384 }, { "epoch": 0.65, "learning_rate": 1.450736234448093e-06, "loss": 0.7911, "step": 34385 }, { "epoch": 0.65, "learning_rate": 1.450597577191009e-06, "loss": 0.9097, "step": 34386 }, { "epoch": 0.65, "learning_rate": 1.4504589238523626e-06, "loss": 0.9265, "step": 34387 }, { "epoch": 0.65, "learning_rate": 1.4503202744326684e-06, "loss": 0.9628, "step": 34388 }, { "epoch": 0.65, "learning_rate": 1.4501816289324473e-06, "loss": 1.0347, "step": 34389 }, { "epoch": 0.65, "learning_rate": 1.4500429873522165e-06, "loss": 0.7606, "step": 34390 }, { "epoch": 0.65, "learning_rate": 1.4499043496924908e-06, "loss": 0.812, "step": 34391 }, { "epoch": 0.65, "learning_rate": 1.4497657159537925e-06, "loss": 0.9308, "step": 34392 }, { "epoch": 0.65, "learning_rate": 1.4496270861366358e-06, "loss": 1.0146, "step": 34393 }, { "epoch": 0.65, "learning_rate": 1.449488460241539e-06, "loss": 0.7659, "step": 34394 }, { "epoch": 0.65, "learning_rate": 1.4493498382690202e-06, "loss": 0.8426, "step": 34395 }, { "epoch": 0.65, "learning_rate": 1.4492112202195972e-06, "loss": 0.949, "step": 34396 }, { "epoch": 0.65, "learning_rate": 1.449072606093787e-06, "loss": 0.9853, "step": 34397 }, { "epoch": 0.65, "learning_rate": 1.4489339958921074e-06, "loss": 0.7409, "step": 34398 }, { "epoch": 0.65, "learning_rate": 1.4487953896150771e-06, "loss": 0.9056, "step": 34399 }, { "epoch": 0.65, "learning_rate": 1.4486567872632107e-06, "loss": 1.1266, "step": 34400 }, { "epoch": 0.65, "learning_rate": 1.4485181888370298e-06, "loss": 0.9937, "step": 34401 }, { "epoch": 0.65, "learning_rate": 1.4483795943370482e-06, "loss": 0.9893, "step": 34402 }, { "epoch": 0.65, "learning_rate": 1.4482410037637854e-06, "loss": 0.8379, "step": 34403 }, { "epoch": 0.65, "learning_rate": 1.4481024171177583e-06, "loss": 0.8969, "step": 34404 }, { "epoch": 0.65, "learning_rate": 1.4479638343994845e-06, "loss": 0.7671, "step": 34405 }, { "epoch": 0.65, "learning_rate": 1.4478252556094812e-06, "loss": 1.0228, "step": 34406 }, { "epoch": 0.65, "learning_rate": 1.4476866807482667e-06, "loss": 0.648, "step": 34407 }, { "epoch": 0.65, "learning_rate": 1.4475481098163585e-06, "loss": 0.7387, "step": 34408 }, { "epoch": 0.65, "learning_rate": 1.4474095428142714e-06, "loss": 0.9117, "step": 34409 }, { "epoch": 0.65, "learning_rate": 1.447270979742526e-06, "loss": 0.753, "step": 34410 }, { "epoch": 0.65, "learning_rate": 1.4471324206016396e-06, "loss": 0.6434, "step": 34411 }, { "epoch": 0.65, "learning_rate": 1.4469938653921262e-06, "loss": 1.1497, "step": 34412 }, { "epoch": 0.65, "learning_rate": 1.4468553141145076e-06, "loss": 1.0681, "step": 34413 }, { "epoch": 0.65, "learning_rate": 1.4467167667692977e-06, "loss": 0.857, "step": 34414 }, { "epoch": 0.65, "learning_rate": 1.4465782233570152e-06, "loss": 0.567, "step": 34415 }, { "epoch": 0.65, "learning_rate": 1.4464396838781774e-06, "loss": 0.8098, "step": 34416 }, { "epoch": 0.65, "learning_rate": 1.446301148333301e-06, "loss": 0.7863, "step": 34417 }, { "epoch": 0.65, "learning_rate": 1.4461626167229044e-06, "loss": 0.8607, "step": 34418 }, { "epoch": 0.65, "learning_rate": 1.4460240890475042e-06, "loss": 0.9064, "step": 34419 }, { "epoch": 0.65, "learning_rate": 1.4458855653076187e-06, "loss": 0.7815, "step": 34420 }, { "epoch": 0.65, "learning_rate": 1.4457470455037623e-06, "loss": 0.7731, "step": 34421 }, { "epoch": 0.65, "learning_rate": 1.4456085296364558e-06, "loss": 0.9431, "step": 34422 }, { "epoch": 0.65, "learning_rate": 1.4454700177062143e-06, "loss": 0.8866, "step": 34423 }, { "epoch": 0.65, "learning_rate": 1.4453315097135545e-06, "loss": 0.9493, "step": 34424 }, { "epoch": 0.65, "learning_rate": 1.4451930056589953e-06, "loss": 0.8548, "step": 34425 }, { "epoch": 0.65, "learning_rate": 1.4450545055430527e-06, "loss": 1.0434, "step": 34426 }, { "epoch": 0.65, "learning_rate": 1.4449160093662455e-06, "loss": 0.9235, "step": 34427 }, { "epoch": 0.65, "learning_rate": 1.4447775171290874e-06, "loss": 0.8377, "step": 34428 }, { "epoch": 0.65, "learning_rate": 1.4446390288320994e-06, "loss": 0.9178, "step": 34429 }, { "epoch": 0.65, "learning_rate": 1.4445005444757964e-06, "loss": 1.1288, "step": 34430 }, { "epoch": 0.65, "learning_rate": 1.4443620640606947e-06, "loss": 1.1868, "step": 34431 }, { "epoch": 0.65, "learning_rate": 1.4442235875873148e-06, "loss": 0.9045, "step": 34432 }, { "epoch": 0.65, "learning_rate": 1.4440851150561707e-06, "loss": 0.7384, "step": 34433 }, { "epoch": 0.65, "learning_rate": 1.4439466464677804e-06, "loss": 0.8353, "step": 34434 }, { "epoch": 0.65, "learning_rate": 1.4438081818226606e-06, "loss": 0.9688, "step": 34435 }, { "epoch": 0.65, "learning_rate": 1.443669721121329e-06, "loss": 0.9637, "step": 34436 }, { "epoch": 0.65, "learning_rate": 1.4435312643643025e-06, "loss": 0.9789, "step": 34437 }, { "epoch": 0.65, "learning_rate": 1.4433928115520972e-06, "loss": 0.8855, "step": 34438 }, { "epoch": 0.65, "learning_rate": 1.4432543626852323e-06, "loss": 1.0208, "step": 34439 }, { "epoch": 0.65, "learning_rate": 1.4431159177642213e-06, "loss": 0.7722, "step": 34440 }, { "epoch": 0.65, "learning_rate": 1.4429774767895847e-06, "loss": 1.0162, "step": 34441 }, { "epoch": 0.65, "learning_rate": 1.442839039761837e-06, "loss": 0.9569, "step": 34442 }, { "epoch": 0.65, "learning_rate": 1.4427006066814959e-06, "loss": 1.134, "step": 34443 }, { "epoch": 0.65, "learning_rate": 1.4425621775490778e-06, "loss": 0.7154, "step": 34444 }, { "epoch": 0.65, "learning_rate": 1.4424237523651008e-06, "loss": 0.8548, "step": 34445 }, { "epoch": 0.65, "learning_rate": 1.4422853311300807e-06, "loss": 0.8868, "step": 34446 }, { "epoch": 0.65, "learning_rate": 1.4421469138445348e-06, "loss": 0.863, "step": 34447 }, { "epoch": 0.65, "learning_rate": 1.4420085005089813e-06, "loss": 0.9482, "step": 34448 }, { "epoch": 0.65, "learning_rate": 1.4418700911239331e-06, "loss": 0.9938, "step": 34449 }, { "epoch": 0.65, "learning_rate": 1.4417316856899117e-06, "loss": 1.1695, "step": 34450 }, { "epoch": 0.65, "learning_rate": 1.4415932842074306e-06, "loss": 0.9952, "step": 34451 }, { "epoch": 0.65, "learning_rate": 1.441454886677007e-06, "loss": 1.0409, "step": 34452 }, { "epoch": 0.65, "learning_rate": 1.4413164930991603e-06, "loss": 0.9128, "step": 34453 }, { "epoch": 0.65, "learning_rate": 1.4411781034744042e-06, "loss": 0.9047, "step": 34454 }, { "epoch": 0.65, "learning_rate": 1.4410397178032568e-06, "loss": 0.838, "step": 34455 }, { "epoch": 0.65, "learning_rate": 1.4409013360862345e-06, "loss": 1.0447, "step": 34456 }, { "epoch": 0.65, "learning_rate": 1.440762958323854e-06, "loss": 0.92, "step": 34457 }, { "epoch": 0.65, "learning_rate": 1.4406245845166325e-06, "loss": 0.922, "step": 34458 }, { "epoch": 0.65, "learning_rate": 1.440486214665086e-06, "loss": 0.939, "step": 34459 }, { "epoch": 0.65, "learning_rate": 1.4403478487697329e-06, "loss": 0.8373, "step": 34460 }, { "epoch": 0.65, "learning_rate": 1.4402094868310862e-06, "loss": 0.9561, "step": 34461 }, { "epoch": 0.65, "learning_rate": 1.4400711288496667e-06, "loss": 0.8886, "step": 34462 }, { "epoch": 0.65, "learning_rate": 1.439932774825988e-06, "loss": 1.1341, "step": 34463 }, { "epoch": 0.65, "learning_rate": 1.439794424760568e-06, "loss": 0.8646, "step": 34464 }, { "epoch": 0.65, "learning_rate": 1.4396560786539233e-06, "loss": 0.7284, "step": 34465 }, { "epoch": 0.65, "learning_rate": 1.4395177365065699e-06, "loss": 0.836, "step": 34466 }, { "epoch": 0.65, "learning_rate": 1.4393793983190252e-06, "loss": 0.7614, "step": 34467 }, { "epoch": 0.65, "learning_rate": 1.4392410640918048e-06, "loss": 0.8659, "step": 34468 }, { "epoch": 0.65, "learning_rate": 1.439102733825427e-06, "loss": 1.067, "step": 34469 }, { "epoch": 0.65, "learning_rate": 1.438964407520405e-06, "loss": 0.6218, "step": 34470 }, { "epoch": 0.65, "learning_rate": 1.4388260851772596e-06, "loss": 0.7946, "step": 34471 }, { "epoch": 0.65, "learning_rate": 1.4386877667965038e-06, "loss": 0.8697, "step": 34472 }, { "epoch": 0.65, "learning_rate": 1.4385494523786545e-06, "loss": 0.9231, "step": 34473 }, { "epoch": 0.65, "learning_rate": 1.4384111419242308e-06, "loss": 0.8916, "step": 34474 }, { "epoch": 0.65, "learning_rate": 1.4382728354337466e-06, "loss": 1.2313, "step": 34475 }, { "epoch": 0.65, "learning_rate": 1.438134532907719e-06, "loss": 0.594, "step": 34476 }, { "epoch": 0.65, "learning_rate": 1.437996234346664e-06, "loss": 0.8725, "step": 34477 }, { "epoch": 0.65, "learning_rate": 1.4378579397510995e-06, "loss": 0.9345, "step": 34478 }, { "epoch": 0.65, "learning_rate": 1.43771964912154e-06, "loss": 0.8341, "step": 34479 }, { "epoch": 0.65, "learning_rate": 1.4375813624585033e-06, "loss": 1.0502, "step": 34480 }, { "epoch": 0.65, "learning_rate": 1.4374430797625061e-06, "loss": 0.9034, "step": 34481 }, { "epoch": 0.65, "learning_rate": 1.4373048010340619e-06, "loss": 0.9619, "step": 34482 }, { "epoch": 0.65, "learning_rate": 1.4371665262736906e-06, "loss": 1.0191, "step": 34483 }, { "epoch": 0.65, "learning_rate": 1.437028255481906e-06, "loss": 1.0411, "step": 34484 }, { "epoch": 0.65, "learning_rate": 1.4368899886592255e-06, "loss": 0.8649, "step": 34485 }, { "epoch": 0.65, "learning_rate": 1.4367517258061654e-06, "loss": 0.8932, "step": 34486 }, { "epoch": 0.65, "learning_rate": 1.4366134669232412e-06, "loss": 0.955, "step": 34487 }, { "epoch": 0.65, "learning_rate": 1.4364752120109701e-06, "loss": 0.8865, "step": 34488 }, { "epoch": 0.65, "learning_rate": 1.436336961069868e-06, "loss": 1.0557, "step": 34489 }, { "epoch": 0.65, "learning_rate": 1.4361987141004519e-06, "loss": 0.8824, "step": 34490 }, { "epoch": 0.65, "learning_rate": 1.4360604711032353e-06, "loss": 0.9446, "step": 34491 }, { "epoch": 0.65, "learning_rate": 1.4359222320787381e-06, "loss": 1.0815, "step": 34492 }, { "epoch": 0.65, "learning_rate": 1.4357839970274739e-06, "loss": 1.0317, "step": 34493 }, { "epoch": 0.65, "learning_rate": 1.4356457659499584e-06, "loss": 1.0598, "step": 34494 }, { "epoch": 0.65, "learning_rate": 1.435507538846711e-06, "loss": 0.7074, "step": 34495 }, { "epoch": 0.65, "learning_rate": 1.435369315718245e-06, "loss": 0.7122, "step": 34496 }, { "epoch": 0.65, "learning_rate": 1.4352310965650773e-06, "loss": 0.9071, "step": 34497 }, { "epoch": 0.65, "learning_rate": 1.4350928813877238e-06, "loss": 0.9083, "step": 34498 }, { "epoch": 0.65, "learning_rate": 1.4349546701867012e-06, "loss": 1.1063, "step": 34499 }, { "epoch": 0.65, "learning_rate": 1.434816462962525e-06, "loss": 0.9626, "step": 34500 }, { "epoch": 0.65, "learning_rate": 1.4346782597157113e-06, "loss": 0.9141, "step": 34501 }, { "epoch": 0.65, "learning_rate": 1.4345400604467773e-06, "loss": 0.8471, "step": 34502 }, { "epoch": 0.65, "learning_rate": 1.4344018651562364e-06, "loss": 0.8311, "step": 34503 }, { "epoch": 0.65, "learning_rate": 1.4342636738446081e-06, "loss": 0.7362, "step": 34504 }, { "epoch": 0.65, "learning_rate": 1.4341254865124055e-06, "loss": 0.7814, "step": 34505 }, { "epoch": 0.65, "learning_rate": 1.433987303160146e-06, "loss": 1.1141, "step": 34506 }, { "epoch": 0.65, "learning_rate": 1.4338491237883445e-06, "loss": 1.227, "step": 34507 }, { "epoch": 0.65, "learning_rate": 1.4337109483975181e-06, "loss": 0.7679, "step": 34508 }, { "epoch": 0.65, "learning_rate": 1.4335727769881824e-06, "loss": 0.8622, "step": 34509 }, { "epoch": 0.65, "learning_rate": 1.4334346095608531e-06, "loss": 0.949, "step": 34510 }, { "epoch": 0.65, "learning_rate": 1.4332964461160477e-06, "loss": 0.9072, "step": 34511 }, { "epoch": 0.65, "learning_rate": 1.433158286654278e-06, "loss": 0.9255, "step": 34512 }, { "epoch": 0.65, "learning_rate": 1.433020131176065e-06, "loss": 0.8183, "step": 34513 }, { "epoch": 0.65, "learning_rate": 1.432881979681921e-06, "loss": 0.7558, "step": 34514 }, { "epoch": 0.65, "learning_rate": 1.432743832172362e-06, "loss": 0.9214, "step": 34515 }, { "epoch": 0.65, "learning_rate": 1.4326056886479067e-06, "loss": 0.9346, "step": 34516 }, { "epoch": 0.65, "learning_rate": 1.4324675491090684e-06, "loss": 0.8376, "step": 34517 }, { "epoch": 0.65, "learning_rate": 1.4323294135563631e-06, "loss": 1.0776, "step": 34518 }, { "epoch": 0.65, "learning_rate": 1.4321912819903071e-06, "loss": 1.0883, "step": 34519 }, { "epoch": 0.65, "learning_rate": 1.4320531544114163e-06, "loss": 0.9233, "step": 34520 }, { "epoch": 0.65, "learning_rate": 1.4319150308202062e-06, "loss": 1.0054, "step": 34521 }, { "epoch": 0.65, "learning_rate": 1.4317769112171926e-06, "loss": 0.8958, "step": 34522 }, { "epoch": 0.65, "learning_rate": 1.431638795602892e-06, "loss": 0.8818, "step": 34523 }, { "epoch": 0.65, "learning_rate": 1.4315006839778178e-06, "loss": 0.9351, "step": 34524 }, { "epoch": 0.65, "learning_rate": 1.431362576342489e-06, "loss": 1.0945, "step": 34525 }, { "epoch": 0.65, "learning_rate": 1.4312244726974185e-06, "loss": 0.9734, "step": 34526 }, { "epoch": 0.65, "learning_rate": 1.4310863730431235e-06, "loss": 0.6747, "step": 34527 }, { "epoch": 0.65, "learning_rate": 1.430948277380119e-06, "loss": 0.7609, "step": 34528 }, { "epoch": 0.65, "learning_rate": 1.4308101857089208e-06, "loss": 0.8075, "step": 34529 }, { "epoch": 0.65, "learning_rate": 1.4306720980300446e-06, "loss": 0.954, "step": 34530 }, { "epoch": 0.65, "learning_rate": 1.4305340143440057e-06, "loss": 1.0655, "step": 34531 }, { "epoch": 0.65, "learning_rate": 1.4303959346513213e-06, "loss": 0.9666, "step": 34532 }, { "epoch": 0.65, "learning_rate": 1.4302578589525041e-06, "loss": 0.8336, "step": 34533 }, { "epoch": 0.65, "learning_rate": 1.4301197872480726e-06, "loss": 0.7635, "step": 34534 }, { "epoch": 0.65, "learning_rate": 1.42998171953854e-06, "loss": 0.9981, "step": 34535 }, { "epoch": 0.65, "learning_rate": 1.4298436558244222e-06, "loss": 0.8871, "step": 34536 }, { "epoch": 0.65, "learning_rate": 1.4297055961062372e-06, "loss": 1.0564, "step": 34537 }, { "epoch": 0.65, "learning_rate": 1.4295675403844977e-06, "loss": 1.0684, "step": 34538 }, { "epoch": 0.65, "learning_rate": 1.4294294886597204e-06, "loss": 0.8769, "step": 34539 }, { "epoch": 0.65, "learning_rate": 1.4292914409324205e-06, "loss": 0.7931, "step": 34540 }, { "epoch": 0.65, "learning_rate": 1.4291533972031135e-06, "loss": 0.8385, "step": 34541 }, { "epoch": 0.65, "learning_rate": 1.4290153574723148e-06, "loss": 1.0232, "step": 34542 }, { "epoch": 0.65, "learning_rate": 1.42887732174054e-06, "loss": 0.9283, "step": 34543 }, { "epoch": 0.65, "learning_rate": 1.4287392900083051e-06, "loss": 1.0736, "step": 34544 }, { "epoch": 0.65, "learning_rate": 1.428601262276123e-06, "loss": 1.0558, "step": 34545 }, { "epoch": 0.65, "learning_rate": 1.4284632385445132e-06, "loss": 0.6741, "step": 34546 }, { "epoch": 0.65, "learning_rate": 1.4283252188139878e-06, "loss": 0.9106, "step": 34547 }, { "epoch": 0.65, "learning_rate": 1.428187203085063e-06, "loss": 0.882, "step": 34548 }, { "epoch": 0.65, "learning_rate": 1.4280491913582544e-06, "loss": 0.9155, "step": 34549 }, { "epoch": 0.65, "learning_rate": 1.427911183634077e-06, "loss": 0.9993, "step": 34550 }, { "epoch": 0.65, "learning_rate": 1.4277731799130468e-06, "loss": 0.9948, "step": 34551 }, { "epoch": 0.65, "learning_rate": 1.4276351801956784e-06, "loss": 0.741, "step": 34552 }, { "epoch": 0.65, "learning_rate": 1.4274971844824886e-06, "loss": 0.8516, "step": 34553 }, { "epoch": 0.65, "learning_rate": 1.4273591927739891e-06, "loss": 0.7505, "step": 34554 }, { "epoch": 0.65, "learning_rate": 1.4272212050706995e-06, "loss": 0.9064, "step": 34555 }, { "epoch": 0.65, "learning_rate": 1.4270832213731323e-06, "loss": 0.9778, "step": 34556 }, { "epoch": 0.65, "learning_rate": 1.4269452416818024e-06, "loss": 0.9705, "step": 34557 }, { "epoch": 0.65, "learning_rate": 1.4268072659972278e-06, "loss": 0.7975, "step": 34558 }, { "epoch": 0.65, "learning_rate": 1.4266692943199212e-06, "loss": 0.8195, "step": 34559 }, { "epoch": 0.65, "learning_rate": 1.4265313266503986e-06, "loss": 0.9434, "step": 34560 }, { "epoch": 0.65, "learning_rate": 1.4263933629891749e-06, "loss": 0.7863, "step": 34561 }, { "epoch": 0.65, "learning_rate": 1.4262554033367656e-06, "loss": 0.8786, "step": 34562 }, { "epoch": 0.65, "learning_rate": 1.4261174476936857e-06, "loss": 0.9237, "step": 34563 }, { "epoch": 0.65, "learning_rate": 1.4259794960604503e-06, "loss": 1.1039, "step": 34564 }, { "epoch": 0.65, "learning_rate": 1.4258415484375754e-06, "loss": 0.9523, "step": 34565 }, { "epoch": 0.65, "learning_rate": 1.4257036048255735e-06, "loss": 0.859, "step": 34566 }, { "epoch": 0.65, "learning_rate": 1.4255656652249633e-06, "loss": 0.8845, "step": 34567 }, { "epoch": 0.65, "learning_rate": 1.4254277296362567e-06, "loss": 0.9487, "step": 34568 }, { "epoch": 0.65, "learning_rate": 1.4252897980599705e-06, "loss": 0.907, "step": 34569 }, { "epoch": 0.65, "learning_rate": 1.4251518704966188e-06, "loss": 0.7353, "step": 34570 }, { "epoch": 0.65, "learning_rate": 1.4250139469467172e-06, "loss": 0.8055, "step": 34571 }, { "epoch": 0.65, "learning_rate": 1.4248760274107806e-06, "loss": 1.0006, "step": 34572 }, { "epoch": 0.65, "learning_rate": 1.4247381118893238e-06, "loss": 0.7339, "step": 34573 }, { "epoch": 0.65, "learning_rate": 1.4246002003828635e-06, "loss": 1.1625, "step": 34574 }, { "epoch": 0.65, "learning_rate": 1.4244622928919105e-06, "loss": 1.1293, "step": 34575 }, { "epoch": 0.65, "learning_rate": 1.4243243894169845e-06, "loss": 0.8, "step": 34576 }, { "epoch": 0.65, "learning_rate": 1.4241864899585972e-06, "loss": 0.8138, "step": 34577 }, { "epoch": 0.65, "learning_rate": 1.4240485945172633e-06, "loss": 0.9625, "step": 34578 }, { "epoch": 0.65, "learning_rate": 1.4239107030935014e-06, "loss": 0.7152, "step": 34579 }, { "epoch": 0.65, "learning_rate": 1.4237728156878227e-06, "loss": 0.8261, "step": 34580 }, { "epoch": 0.65, "learning_rate": 1.4236349323007436e-06, "loss": 0.9761, "step": 34581 }, { "epoch": 0.65, "learning_rate": 1.4234970529327784e-06, "loss": 1.0721, "step": 34582 }, { "epoch": 0.65, "learning_rate": 1.4233591775844422e-06, "loss": 0.7797, "step": 34583 }, { "epoch": 0.65, "learning_rate": 1.4232213062562499e-06, "loss": 0.884, "step": 34584 }, { "epoch": 0.65, "learning_rate": 1.4230834389487161e-06, "loss": 0.8007, "step": 34585 }, { "epoch": 0.65, "learning_rate": 1.4229455756623567e-06, "loss": 0.8316, "step": 34586 }, { "epoch": 0.65, "learning_rate": 1.4228077163976839e-06, "loss": 1.0917, "step": 34587 }, { "epoch": 0.65, "learning_rate": 1.4226698611552156e-06, "loss": 1.0048, "step": 34588 }, { "epoch": 0.65, "learning_rate": 1.4225320099354641e-06, "loss": 0.7794, "step": 34589 }, { "epoch": 0.65, "learning_rate": 1.4223941627389453e-06, "loss": 0.92, "step": 34590 }, { "epoch": 0.65, "learning_rate": 1.4222563195661735e-06, "loss": 0.8954, "step": 34591 }, { "epoch": 0.65, "learning_rate": 1.4221184804176635e-06, "loss": 0.8125, "step": 34592 }, { "epoch": 0.65, "learning_rate": 1.42198064529393e-06, "loss": 1.0463, "step": 34593 }, { "epoch": 0.65, "learning_rate": 1.4218428141954876e-06, "loss": 1.134, "step": 34594 }, { "epoch": 0.65, "learning_rate": 1.4217049871228525e-06, "loss": 0.6634, "step": 34595 }, { "epoch": 0.65, "learning_rate": 1.4215671640765355e-06, "loss": 0.8624, "step": 34596 }, { "epoch": 0.65, "learning_rate": 1.421429345057056e-06, "loss": 0.7569, "step": 34597 }, { "epoch": 0.65, "learning_rate": 1.421291530064925e-06, "loss": 0.9235, "step": 34598 }, { "epoch": 0.65, "learning_rate": 1.4211537191006576e-06, "loss": 0.8577, "step": 34599 }, { "epoch": 0.65, "learning_rate": 1.421015912164771e-06, "loss": 0.9424, "step": 34600 }, { "epoch": 0.65, "learning_rate": 1.4208781092577766e-06, "loss": 0.9394, "step": 34601 }, { "epoch": 0.65, "learning_rate": 1.4207403103801906e-06, "loss": 0.6082, "step": 34602 }, { "epoch": 0.65, "learning_rate": 1.420602515532527e-06, "loss": 0.8421, "step": 34603 }, { "epoch": 0.65, "learning_rate": 1.4204647247153008e-06, "loss": 0.8186, "step": 34604 }, { "epoch": 0.65, "learning_rate": 1.4203269379290261e-06, "loss": 0.7941, "step": 34605 }, { "epoch": 0.65, "learning_rate": 1.4201891551742174e-06, "loss": 1.2015, "step": 34606 }, { "epoch": 0.65, "learning_rate": 1.4200513764513904e-06, "loss": 1.2867, "step": 34607 }, { "epoch": 0.65, "learning_rate": 1.4199136017610566e-06, "loss": 0.8174, "step": 34608 }, { "epoch": 0.65, "learning_rate": 1.4197758311037338e-06, "loss": 0.9055, "step": 34609 }, { "epoch": 0.65, "learning_rate": 1.4196380644799343e-06, "loss": 0.9407, "step": 34610 }, { "epoch": 0.65, "learning_rate": 1.4195003018901732e-06, "loss": 0.6696, "step": 34611 }, { "epoch": 0.65, "learning_rate": 1.4193625433349646e-06, "loss": 0.9715, "step": 34612 }, { "epoch": 0.65, "learning_rate": 1.419224788814823e-06, "loss": 0.7529, "step": 34613 }, { "epoch": 0.65, "learning_rate": 1.4190870383302633e-06, "loss": 0.8768, "step": 34614 }, { "epoch": 0.65, "learning_rate": 1.4189492918817993e-06, "loss": 0.7633, "step": 34615 }, { "epoch": 0.65, "learning_rate": 1.4188115494699465e-06, "loss": 0.9447, "step": 34616 }, { "epoch": 0.65, "learning_rate": 1.418673811095216e-06, "loss": 0.8545, "step": 34617 }, { "epoch": 0.65, "learning_rate": 1.418536076758127e-06, "loss": 0.9947, "step": 34618 }, { "epoch": 0.65, "learning_rate": 1.4183983464591895e-06, "loss": 1.2328, "step": 34619 }, { "epoch": 0.65, "learning_rate": 1.4182606201989186e-06, "loss": 0.9026, "step": 34620 }, { "epoch": 0.65, "learning_rate": 1.4181228979778311e-06, "loss": 0.7845, "step": 34621 }, { "epoch": 0.65, "learning_rate": 1.417985179796439e-06, "loss": 0.7217, "step": 34622 }, { "epoch": 0.65, "learning_rate": 1.4178474656552568e-06, "loss": 0.9374, "step": 34623 }, { "epoch": 0.65, "learning_rate": 1.417709755554799e-06, "loss": 0.9108, "step": 34624 }, { "epoch": 0.65, "learning_rate": 1.4175720494955796e-06, "loss": 1.0489, "step": 34625 }, { "epoch": 0.65, "learning_rate": 1.4174343474781132e-06, "loss": 0.981, "step": 34626 }, { "epoch": 0.65, "learning_rate": 1.417296649502914e-06, "loss": 0.7135, "step": 34627 }, { "epoch": 0.65, "learning_rate": 1.4171589555704968e-06, "loss": 0.7725, "step": 34628 }, { "epoch": 0.65, "learning_rate": 1.4170212656813725e-06, "loss": 0.6365, "step": 34629 }, { "epoch": 0.65, "learning_rate": 1.41688357983606e-06, "loss": 0.9626, "step": 34630 }, { "epoch": 0.65, "learning_rate": 1.4167458980350699e-06, "loss": 1.0931, "step": 34631 }, { "epoch": 0.65, "learning_rate": 1.4166082202789172e-06, "loss": 0.6538, "step": 34632 }, { "epoch": 0.65, "learning_rate": 1.4164705465681164e-06, "loss": 1.1287, "step": 34633 }, { "epoch": 0.65, "learning_rate": 1.4163328769031812e-06, "loss": 0.8179, "step": 34634 }, { "epoch": 0.65, "learning_rate": 1.4161952112846261e-06, "loss": 0.844, "step": 34635 }, { "epoch": 0.65, "learning_rate": 1.4160575497129645e-06, "loss": 0.961, "step": 34636 }, { "epoch": 0.65, "learning_rate": 1.4159198921887118e-06, "loss": 1.1506, "step": 34637 }, { "epoch": 0.65, "learning_rate": 1.4157822387123793e-06, "loss": 0.9535, "step": 34638 }, { "epoch": 0.65, "learning_rate": 1.4156445892844844e-06, "loss": 0.9727, "step": 34639 }, { "epoch": 0.65, "learning_rate": 1.4155069439055385e-06, "loss": 0.8671, "step": 34640 }, { "epoch": 0.65, "learning_rate": 1.415369302576055e-06, "loss": 0.9279, "step": 34641 }, { "epoch": 0.65, "learning_rate": 1.415231665296552e-06, "loss": 0.7857, "step": 34642 }, { "epoch": 0.65, "learning_rate": 1.4150940320675394e-06, "loss": 0.923, "step": 34643 }, { "epoch": 0.65, "learning_rate": 1.4149564028895322e-06, "loss": 1.0472, "step": 34644 }, { "epoch": 0.65, "learning_rate": 1.4148187777630446e-06, "loss": 1.0157, "step": 34645 }, { "epoch": 0.65, "learning_rate": 1.4146811566885904e-06, "loss": 0.889, "step": 34646 }, { "epoch": 0.65, "learning_rate": 1.4145435396666834e-06, "loss": 0.7836, "step": 34647 }, { "epoch": 0.65, "learning_rate": 1.414405926697838e-06, "loss": 0.787, "step": 34648 }, { "epoch": 0.65, "learning_rate": 1.4142683177825683e-06, "loss": 0.8636, "step": 34649 }, { "epoch": 0.65, "learning_rate": 1.4141307129213855e-06, "loss": 1.2298, "step": 34650 }, { "epoch": 0.65, "learning_rate": 1.413993112114807e-06, "loss": 0.8528, "step": 34651 }, { "epoch": 0.65, "learning_rate": 1.4138555153633443e-06, "loss": 0.87, "step": 34652 }, { "epoch": 0.65, "learning_rate": 1.4137179226675116e-06, "loss": 0.8799, "step": 34653 }, { "epoch": 0.65, "learning_rate": 1.4135803340278228e-06, "loss": 0.834, "step": 34654 }, { "epoch": 0.65, "learning_rate": 1.4134427494447919e-06, "loss": 1.0259, "step": 34655 }, { "epoch": 0.65, "learning_rate": 1.4133051689189325e-06, "loss": 1.1447, "step": 34656 }, { "epoch": 0.65, "learning_rate": 1.4131675924507582e-06, "loss": 0.9205, "step": 34657 }, { "epoch": 0.65, "learning_rate": 1.4130300200407837e-06, "loss": 0.8507, "step": 34658 }, { "epoch": 0.65, "learning_rate": 1.412892451689521e-06, "loss": 0.806, "step": 34659 }, { "epoch": 0.65, "learning_rate": 1.4127548873974833e-06, "loss": 0.8992, "step": 34660 }, { "epoch": 0.65, "learning_rate": 1.4126173271651878e-06, "loss": 0.9668, "step": 34661 }, { "epoch": 0.65, "learning_rate": 1.4124797709931446e-06, "loss": 1.0381, "step": 34662 }, { "epoch": 0.65, "learning_rate": 1.4123422188818687e-06, "loss": 1.1454, "step": 34663 }, { "epoch": 0.65, "learning_rate": 1.4122046708318734e-06, "loss": 0.6431, "step": 34664 }, { "epoch": 0.65, "learning_rate": 1.4120671268436725e-06, "loss": 0.879, "step": 34665 }, { "epoch": 0.65, "learning_rate": 1.41192958691778e-06, "loss": 0.9778, "step": 34666 }, { "epoch": 0.65, "learning_rate": 1.411792051054709e-06, "loss": 1.0183, "step": 34667 }, { "epoch": 0.65, "learning_rate": 1.411654519254974e-06, "loss": 0.8459, "step": 34668 }, { "epoch": 0.65, "learning_rate": 1.4115169915190854e-06, "loss": 1.037, "step": 34669 }, { "epoch": 0.65, "learning_rate": 1.4113794678475612e-06, "loss": 0.8281, "step": 34670 }, { "epoch": 0.65, "learning_rate": 1.4112419482409117e-06, "loss": 0.7634, "step": 34671 }, { "epoch": 0.65, "learning_rate": 1.4111044326996515e-06, "loss": 0.8029, "step": 34672 }, { "epoch": 0.65, "learning_rate": 1.4109669212242938e-06, "loss": 0.8049, "step": 34673 }, { "epoch": 0.65, "learning_rate": 1.4108294138153522e-06, "loss": 1.1742, "step": 34674 }, { "epoch": 0.65, "learning_rate": 1.4106919104733402e-06, "loss": 1.101, "step": 34675 }, { "epoch": 0.65, "learning_rate": 1.4105544111987713e-06, "loss": 0.799, "step": 34676 }, { "epoch": 0.65, "learning_rate": 1.4104169159921597e-06, "loss": 0.8174, "step": 34677 }, { "epoch": 0.65, "learning_rate": 1.4102794248540159e-06, "loss": 0.9577, "step": 34678 }, { "epoch": 0.65, "learning_rate": 1.4101419377848574e-06, "loss": 0.7511, "step": 34679 }, { "epoch": 0.65, "learning_rate": 1.4100044547851944e-06, "loss": 1.0351, "step": 34680 }, { "epoch": 0.65, "learning_rate": 1.4098669758555405e-06, "loss": 0.9133, "step": 34681 }, { "epoch": 0.65, "learning_rate": 1.4097295009964118e-06, "loss": 0.881, "step": 34682 }, { "epoch": 0.65, "learning_rate": 1.4095920302083188e-06, "loss": 0.7559, "step": 34683 }, { "epoch": 0.65, "learning_rate": 1.4094545634917755e-06, "loss": 0.9432, "step": 34684 }, { "epoch": 0.65, "learning_rate": 1.4093171008472955e-06, "loss": 0.8269, "step": 34685 }, { "epoch": 0.65, "learning_rate": 1.4091796422753923e-06, "loss": 0.8172, "step": 34686 }, { "epoch": 0.65, "learning_rate": 1.4090421877765787e-06, "loss": 0.9669, "step": 34687 }, { "epoch": 0.65, "learning_rate": 1.4089047373513682e-06, "loss": 1.2228, "step": 34688 }, { "epoch": 0.65, "learning_rate": 1.4087672910002749e-06, "loss": 0.9329, "step": 34689 }, { "epoch": 0.65, "learning_rate": 1.4086298487238087e-06, "loss": 0.8103, "step": 34690 }, { "epoch": 0.65, "learning_rate": 1.4084924105224878e-06, "loss": 0.667, "step": 34691 }, { "epoch": 0.65, "learning_rate": 1.4083549763968213e-06, "loss": 0.8763, "step": 34692 }, { "epoch": 0.65, "learning_rate": 1.4082175463473242e-06, "loss": 0.9602, "step": 34693 }, { "epoch": 0.65, "learning_rate": 1.408080120374509e-06, "loss": 0.9661, "step": 34694 }, { "epoch": 0.65, "learning_rate": 1.4079426984788891e-06, "loss": 0.7223, "step": 34695 }, { "epoch": 0.65, "learning_rate": 1.4078052806609781e-06, "loss": 0.7676, "step": 34696 }, { "epoch": 0.65, "learning_rate": 1.4076678669212885e-06, "loss": 0.7256, "step": 34697 }, { "epoch": 0.65, "learning_rate": 1.4075304572603342e-06, "loss": 0.889, "step": 34698 }, { "epoch": 0.65, "learning_rate": 1.407393051678626e-06, "loss": 0.9456, "step": 34699 }, { "epoch": 0.65, "learning_rate": 1.407255650176681e-06, "loss": 0.9142, "step": 34700 }, { "epoch": 0.65, "learning_rate": 1.4071182527550087e-06, "loss": 0.9178, "step": 34701 }, { "epoch": 0.65, "learning_rate": 1.4069808594141222e-06, "loss": 0.6552, "step": 34702 }, { "epoch": 0.65, "learning_rate": 1.4068434701545375e-06, "loss": 1.0681, "step": 34703 }, { "epoch": 0.65, "learning_rate": 1.406706084976765e-06, "loss": 0.9193, "step": 34704 }, { "epoch": 0.65, "learning_rate": 1.4065687038813184e-06, "loss": 0.7806, "step": 34705 }, { "epoch": 0.65, "learning_rate": 1.4064313268687108e-06, "loss": 1.0454, "step": 34706 }, { "epoch": 0.65, "learning_rate": 1.4062939539394548e-06, "loss": 0.9679, "step": 34707 }, { "epoch": 0.65, "learning_rate": 1.406156585094064e-06, "loss": 0.7694, "step": 34708 }, { "epoch": 0.65, "learning_rate": 1.4060192203330508e-06, "loss": 0.9382, "step": 34709 }, { "epoch": 0.65, "learning_rate": 1.405881859656929e-06, "loss": 0.7355, "step": 34710 }, { "epoch": 0.65, "learning_rate": 1.4057445030662093e-06, "loss": 0.8646, "step": 34711 }, { "epoch": 0.65, "learning_rate": 1.4056071505614078e-06, "loss": 1.0981, "step": 34712 }, { "epoch": 0.65, "learning_rate": 1.405469802143035e-06, "loss": 0.9626, "step": 34713 }, { "epoch": 0.65, "learning_rate": 1.405332457811604e-06, "loss": 0.8705, "step": 34714 }, { "epoch": 0.65, "learning_rate": 1.4051951175676282e-06, "loss": 0.7193, "step": 34715 }, { "epoch": 0.65, "learning_rate": 1.40505778141162e-06, "loss": 1.163, "step": 34716 }, { "epoch": 0.66, "learning_rate": 1.404920449344093e-06, "loss": 0.6745, "step": 34717 }, { "epoch": 0.66, "learning_rate": 1.404783121365559e-06, "loss": 1.0477, "step": 34718 }, { "epoch": 0.66, "learning_rate": 1.4046457974765326e-06, "loss": 0.9752, "step": 34719 }, { "epoch": 0.66, "learning_rate": 1.404508477677523e-06, "loss": 0.8206, "step": 34720 }, { "epoch": 0.66, "learning_rate": 1.404371161969047e-06, "loss": 0.8254, "step": 34721 }, { "epoch": 0.66, "learning_rate": 1.4042338503516148e-06, "loss": 0.953, "step": 34722 }, { "epoch": 0.66, "learning_rate": 1.4040965428257385e-06, "loss": 0.9798, "step": 34723 }, { "epoch": 0.66, "learning_rate": 1.4039592393919343e-06, "loss": 0.8803, "step": 34724 }, { "epoch": 0.66, "learning_rate": 1.4038219400507118e-06, "loss": 1.1572, "step": 34725 }, { "epoch": 0.66, "learning_rate": 1.4036846448025842e-06, "loss": 1.1558, "step": 34726 }, { "epoch": 0.66, "learning_rate": 1.4035473536480648e-06, "loss": 0.8816, "step": 34727 }, { "epoch": 0.66, "learning_rate": 1.403410066587666e-06, "loss": 1.0148, "step": 34728 }, { "epoch": 0.66, "learning_rate": 1.4032727836219003e-06, "loss": 0.8597, "step": 34729 }, { "epoch": 0.66, "learning_rate": 1.4031355047512807e-06, "loss": 0.9062, "step": 34730 }, { "epoch": 0.66, "learning_rate": 1.40299822997632e-06, "loss": 1.1458, "step": 34731 }, { "epoch": 0.66, "learning_rate": 1.4028609592975285e-06, "loss": 0.929, "step": 34732 }, { "epoch": 0.66, "learning_rate": 1.4027236927154226e-06, "loss": 0.9308, "step": 34733 }, { "epoch": 0.66, "learning_rate": 1.4025864302305118e-06, "loss": 0.744, "step": 34734 }, { "epoch": 0.66, "learning_rate": 1.4024491718433095e-06, "loss": 0.8271, "step": 34735 }, { "epoch": 0.66, "learning_rate": 1.4023119175543283e-06, "loss": 0.9598, "step": 34736 }, { "epoch": 0.66, "learning_rate": 1.4021746673640806e-06, "loss": 1.1179, "step": 34737 }, { "epoch": 0.66, "learning_rate": 1.4020374212730794e-06, "loss": 0.9742, "step": 34738 }, { "epoch": 0.66, "learning_rate": 1.4019001792818369e-06, "loss": 0.89, "step": 34739 }, { "epoch": 0.66, "learning_rate": 1.4017629413908663e-06, "loss": 0.8145, "step": 34740 }, { "epoch": 0.66, "learning_rate": 1.4016257076006768e-06, "loss": 1.0622, "step": 34741 }, { "epoch": 0.66, "learning_rate": 1.4014884779117857e-06, "loss": 0.8187, "step": 34742 }, { "epoch": 0.66, "learning_rate": 1.4013512523247018e-06, "loss": 0.8089, "step": 34743 }, { "epoch": 0.66, "learning_rate": 1.4012140308399375e-06, "loss": 1.0059, "step": 34744 }, { "epoch": 0.66, "learning_rate": 1.4010768134580086e-06, "loss": 0.8395, "step": 34745 }, { "epoch": 0.66, "learning_rate": 1.4009396001794239e-06, "loss": 0.6299, "step": 34746 }, { "epoch": 0.66, "learning_rate": 1.4008023910046973e-06, "loss": 0.9692, "step": 34747 }, { "epoch": 0.66, "learning_rate": 1.4006651859343407e-06, "loss": 0.9119, "step": 34748 }, { "epoch": 0.66, "learning_rate": 1.4005279849688666e-06, "loss": 0.9473, "step": 34749 }, { "epoch": 0.66, "learning_rate": 1.4003907881087874e-06, "loss": 1.2209, "step": 34750 }, { "epoch": 0.66, "learning_rate": 1.4002535953546153e-06, "loss": 0.7675, "step": 34751 }, { "epoch": 0.66, "learning_rate": 1.4001164067068633e-06, "loss": 0.9777, "step": 34752 }, { "epoch": 0.66, "learning_rate": 1.3999792221660413e-06, "loss": 0.8896, "step": 34753 }, { "epoch": 0.66, "learning_rate": 1.3998420417326647e-06, "loss": 0.8888, "step": 34754 }, { "epoch": 0.66, "learning_rate": 1.3997048654072438e-06, "loss": 0.8881, "step": 34755 }, { "epoch": 0.66, "learning_rate": 1.3995676931902907e-06, "loss": 1.0765, "step": 34756 }, { "epoch": 0.66, "learning_rate": 1.3994305250823182e-06, "loss": 0.9916, "step": 34757 }, { "epoch": 0.66, "learning_rate": 1.3992933610838383e-06, "loss": 0.9331, "step": 34758 }, { "epoch": 0.66, "learning_rate": 1.3991562011953632e-06, "loss": 0.8884, "step": 34759 }, { "epoch": 0.66, "learning_rate": 1.3990190454174052e-06, "loss": 0.8868, "step": 34760 }, { "epoch": 0.66, "learning_rate": 1.3988818937504773e-06, "loss": 0.9193, "step": 34761 }, { "epoch": 0.66, "learning_rate": 1.3987447461950888e-06, "loss": 1.2491, "step": 34762 }, { "epoch": 0.66, "learning_rate": 1.3986076027517556e-06, "loss": 0.8889, "step": 34763 }, { "epoch": 0.66, "learning_rate": 1.3984704634209867e-06, "loss": 0.9214, "step": 34764 }, { "epoch": 0.66, "learning_rate": 1.3983333282032947e-06, "loss": 0.9345, "step": 34765 }, { "epoch": 0.66, "learning_rate": 1.3981961970991936e-06, "loss": 0.9585, "step": 34766 }, { "epoch": 0.66, "learning_rate": 1.3980590701091937e-06, "loss": 0.8863, "step": 34767 }, { "epoch": 0.66, "learning_rate": 1.3979219472338074e-06, "loss": 0.9622, "step": 34768 }, { "epoch": 0.66, "learning_rate": 1.3977848284735463e-06, "loss": 1.1171, "step": 34769 }, { "epoch": 0.66, "learning_rate": 1.3976477138289233e-06, "loss": 1.0093, "step": 34770 }, { "epoch": 0.66, "learning_rate": 1.3975106033004498e-06, "loss": 0.6411, "step": 34771 }, { "epoch": 0.66, "learning_rate": 1.3973734968886379e-06, "loss": 0.7977, "step": 34772 }, { "epoch": 0.66, "learning_rate": 1.3972363945940003e-06, "loss": 0.8254, "step": 34773 }, { "epoch": 0.66, "learning_rate": 1.3970992964170465e-06, "loss": 0.8338, "step": 34774 }, { "epoch": 0.66, "learning_rate": 1.3969622023582924e-06, "loss": 0.9856, "step": 34775 }, { "epoch": 0.66, "learning_rate": 1.3968251124182462e-06, "loss": 0.8451, "step": 34776 }, { "epoch": 0.66, "learning_rate": 1.3966880265974211e-06, "loss": 1.0216, "step": 34777 }, { "epoch": 0.66, "learning_rate": 1.3965509448963294e-06, "loss": 0.9628, "step": 34778 }, { "epoch": 0.66, "learning_rate": 1.3964138673154826e-06, "loss": 1.0765, "step": 34779 }, { "epoch": 0.66, "learning_rate": 1.3962767938553922e-06, "loss": 0.9396, "step": 34780 }, { "epoch": 0.66, "learning_rate": 1.3961397245165708e-06, "loss": 1.2195, "step": 34781 }, { "epoch": 0.66, "learning_rate": 1.3960026592995306e-06, "loss": 1.0139, "step": 34782 }, { "epoch": 0.66, "learning_rate": 1.3958655982047808e-06, "loss": 0.7509, "step": 34783 }, { "epoch": 0.66, "learning_rate": 1.395728541232837e-06, "loss": 1.0053, "step": 34784 }, { "epoch": 0.66, "learning_rate": 1.395591488384208e-06, "loss": 0.7533, "step": 34785 }, { "epoch": 0.66, "learning_rate": 1.3954544396594054e-06, "loss": 0.8107, "step": 34786 }, { "epoch": 0.66, "learning_rate": 1.395317395058944e-06, "loss": 1.0851, "step": 34787 }, { "epoch": 0.66, "learning_rate": 1.3951803545833326e-06, "loss": 0.9645, "step": 34788 }, { "epoch": 0.66, "learning_rate": 1.3950433182330842e-06, "loss": 0.8034, "step": 34789 }, { "epoch": 0.66, "learning_rate": 1.3949062860087097e-06, "loss": 0.8777, "step": 34790 }, { "epoch": 0.66, "learning_rate": 1.3947692579107217e-06, "loss": 0.7766, "step": 34791 }, { "epoch": 0.66, "learning_rate": 1.3946322339396311e-06, "loss": 0.7186, "step": 34792 }, { "epoch": 0.66, "learning_rate": 1.39449521409595e-06, "loss": 0.826, "step": 34793 }, { "epoch": 0.66, "learning_rate": 1.3943581983801907e-06, "loss": 1.0877, "step": 34794 }, { "epoch": 0.66, "learning_rate": 1.3942211867928621e-06, "loss": 1.0163, "step": 34795 }, { "epoch": 0.66, "learning_rate": 1.3940841793344796e-06, "loss": 0.8525, "step": 34796 }, { "epoch": 0.66, "learning_rate": 1.3939471760055518e-06, "loss": 0.8483, "step": 34797 }, { "epoch": 0.66, "learning_rate": 1.3938101768065915e-06, "loss": 0.8203, "step": 34798 }, { "epoch": 0.66, "learning_rate": 1.39367318173811e-06, "loss": 0.9743, "step": 34799 }, { "epoch": 0.66, "learning_rate": 1.393536190800619e-06, "loss": 1.0018, "step": 34800 }, { "epoch": 0.66, "learning_rate": 1.3933992039946298e-06, "loss": 0.8568, "step": 34801 }, { "epoch": 0.66, "learning_rate": 1.3932622213206542e-06, "loss": 0.9136, "step": 34802 }, { "epoch": 0.66, "learning_rate": 1.3931252427792046e-06, "loss": 0.7869, "step": 34803 }, { "epoch": 0.66, "learning_rate": 1.3929882683707894e-06, "loss": 0.6706, "step": 34804 }, { "epoch": 0.66, "learning_rate": 1.392851298095924e-06, "loss": 1.0151, "step": 34805 }, { "epoch": 0.66, "learning_rate": 1.3927143319551167e-06, "loss": 1.0604, "step": 34806 }, { "epoch": 0.66, "learning_rate": 1.3925773699488793e-06, "loss": 1.0544, "step": 34807 }, { "epoch": 0.66, "learning_rate": 1.392440412077726e-06, "loss": 0.7791, "step": 34808 }, { "epoch": 0.66, "learning_rate": 1.3923034583421651e-06, "loss": 0.9827, "step": 34809 }, { "epoch": 0.66, "learning_rate": 1.3921665087427094e-06, "loss": 0.911, "step": 34810 }, { "epoch": 0.66, "learning_rate": 1.39202956327987e-06, "loss": 0.9565, "step": 34811 }, { "epoch": 0.66, "learning_rate": 1.3918926219541582e-06, "loss": 1.0219, "step": 34812 }, { "epoch": 0.66, "learning_rate": 1.3917556847660851e-06, "loss": 0.9586, "step": 34813 }, { "epoch": 0.66, "learning_rate": 1.3916187517161628e-06, "loss": 0.9371, "step": 34814 }, { "epoch": 0.66, "learning_rate": 1.3914818228049026e-06, "loss": 0.9101, "step": 34815 }, { "epoch": 0.66, "learning_rate": 1.3913448980328138e-06, "loss": 0.7341, "step": 34816 }, { "epoch": 0.66, "learning_rate": 1.3912079774004106e-06, "loss": 0.8321, "step": 34817 }, { "epoch": 0.66, "learning_rate": 1.391071060908202e-06, "loss": 1.1233, "step": 34818 }, { "epoch": 0.66, "learning_rate": 1.3909341485567002e-06, "loss": 1.024, "step": 34819 }, { "epoch": 0.66, "learning_rate": 1.390797240346416e-06, "loss": 0.9093, "step": 34820 }, { "epoch": 0.66, "learning_rate": 1.390660336277861e-06, "loss": 0.8632, "step": 34821 }, { "epoch": 0.66, "learning_rate": 1.3905234363515466e-06, "loss": 0.8888, "step": 34822 }, { "epoch": 0.66, "learning_rate": 1.3903865405679834e-06, "loss": 0.8418, "step": 34823 }, { "epoch": 0.66, "learning_rate": 1.390249648927684e-06, "loss": 1.1299, "step": 34824 }, { "epoch": 0.66, "learning_rate": 1.3901127614311561e-06, "loss": 1.1649, "step": 34825 }, { "epoch": 0.66, "learning_rate": 1.3899758780789155e-06, "loss": 0.8405, "step": 34826 }, { "epoch": 0.66, "learning_rate": 1.3898389988714697e-06, "loss": 0.9003, "step": 34827 }, { "epoch": 0.66, "learning_rate": 1.38970212380933e-06, "loss": 0.913, "step": 34828 }, { "epoch": 0.66, "learning_rate": 1.3895652528930107e-06, "loss": 0.7299, "step": 34829 }, { "epoch": 0.66, "learning_rate": 1.3894283861230195e-06, "loss": 0.8849, "step": 34830 }, { "epoch": 0.66, "learning_rate": 1.389291523499869e-06, "loss": 0.9659, "step": 34831 }, { "epoch": 0.66, "learning_rate": 1.3891546650240695e-06, "loss": 0.7242, "step": 34832 }, { "epoch": 0.66, "learning_rate": 1.3890178106961327e-06, "loss": 0.7252, "step": 34833 }, { "epoch": 0.66, "learning_rate": 1.388880960516569e-06, "loss": 0.8195, "step": 34834 }, { "epoch": 0.66, "learning_rate": 1.38874411448589e-06, "loss": 0.7644, "step": 34835 }, { "epoch": 0.66, "learning_rate": 1.3886072726046073e-06, "loss": 0.8284, "step": 34836 }, { "epoch": 0.66, "learning_rate": 1.3884704348732292e-06, "loss": 1.1181, "step": 34837 }, { "epoch": 0.66, "learning_rate": 1.38833360129227e-06, "loss": 0.9567, "step": 34838 }, { "epoch": 0.66, "learning_rate": 1.3881967718622382e-06, "loss": 0.8519, "step": 34839 }, { "epoch": 0.66, "learning_rate": 1.3880599465836458e-06, "loss": 0.9474, "step": 34840 }, { "epoch": 0.66, "learning_rate": 1.387923125457003e-06, "loss": 0.6772, "step": 34841 }, { "epoch": 0.66, "learning_rate": 1.3877863084828217e-06, "loss": 0.9904, "step": 34842 }, { "epoch": 0.66, "learning_rate": 1.387649495661612e-06, "loss": 0.8737, "step": 34843 }, { "epoch": 0.66, "learning_rate": 1.3875126869938849e-06, "loss": 1.0644, "step": 34844 }, { "epoch": 0.66, "learning_rate": 1.3873758824801525e-06, "loss": 1.0383, "step": 34845 }, { "epoch": 0.66, "learning_rate": 1.3872390821209221e-06, "loss": 1.0092, "step": 34846 }, { "epoch": 0.66, "learning_rate": 1.3871022859167092e-06, "loss": 0.853, "step": 34847 }, { "epoch": 0.66, "learning_rate": 1.386965493868021e-06, "loss": 1.0567, "step": 34848 }, { "epoch": 0.66, "learning_rate": 1.3868287059753689e-06, "loss": 1.0206, "step": 34849 }, { "epoch": 0.66, "learning_rate": 1.3866919222392658e-06, "loss": 0.9297, "step": 34850 }, { "epoch": 0.66, "learning_rate": 1.3865551426602204e-06, "loss": 0.7108, "step": 34851 }, { "epoch": 0.66, "learning_rate": 1.3864183672387432e-06, "loss": 0.8391, "step": 34852 }, { "epoch": 0.66, "learning_rate": 1.3862815959753462e-06, "loss": 0.8878, "step": 34853 }, { "epoch": 0.66, "learning_rate": 1.3861448288705397e-06, "loss": 0.8796, "step": 34854 }, { "epoch": 0.66, "learning_rate": 1.3860080659248343e-06, "loss": 0.9131, "step": 34855 }, { "epoch": 0.66, "learning_rate": 1.3858713071387403e-06, "loss": 1.1842, "step": 34856 }, { "epoch": 0.66, "learning_rate": 1.3857345525127697e-06, "loss": 0.9088, "step": 34857 }, { "epoch": 0.66, "learning_rate": 1.3855978020474302e-06, "loss": 0.89, "step": 34858 }, { "epoch": 0.66, "learning_rate": 1.3854610557432362e-06, "loss": 0.9604, "step": 34859 }, { "epoch": 0.66, "learning_rate": 1.3853243136006957e-06, "loss": 0.7497, "step": 34860 }, { "epoch": 0.66, "learning_rate": 1.3851875756203202e-06, "loss": 0.7649, "step": 34861 }, { "epoch": 0.66, "learning_rate": 1.3850508418026198e-06, "loss": 1.1467, "step": 34862 }, { "epoch": 0.66, "learning_rate": 1.3849141121481052e-06, "loss": 0.9637, "step": 34863 }, { "epoch": 0.66, "learning_rate": 1.3847773866572872e-06, "loss": 0.8065, "step": 34864 }, { "epoch": 0.66, "learning_rate": 1.3846406653306764e-06, "loss": 0.9122, "step": 34865 }, { "epoch": 0.66, "learning_rate": 1.3845039481687844e-06, "loss": 0.7769, "step": 34866 }, { "epoch": 0.66, "learning_rate": 1.3843672351721182e-06, "loss": 0.7192, "step": 34867 }, { "epoch": 0.66, "learning_rate": 1.3842305263411925e-06, "loss": 1.0787, "step": 34868 }, { "epoch": 0.66, "learning_rate": 1.3840938216765148e-06, "loss": 1.082, "step": 34869 }, { "epoch": 0.66, "learning_rate": 1.3839571211785956e-06, "loss": 1.1307, "step": 34870 }, { "epoch": 0.66, "learning_rate": 1.3838204248479481e-06, "loss": 0.7404, "step": 34871 }, { "epoch": 0.66, "learning_rate": 1.3836837326850803e-06, "loss": 0.9656, "step": 34872 }, { "epoch": 0.66, "learning_rate": 1.3835470446905031e-06, "loss": 0.8677, "step": 34873 }, { "epoch": 0.66, "learning_rate": 1.3834103608647267e-06, "loss": 0.8793, "step": 34874 }, { "epoch": 0.66, "learning_rate": 1.383273681208262e-06, "loss": 0.9893, "step": 34875 }, { "epoch": 0.66, "learning_rate": 1.3831370057216192e-06, "loss": 0.711, "step": 34876 }, { "epoch": 0.66, "learning_rate": 1.3830003344053083e-06, "loss": 0.9143, "step": 34877 }, { "epoch": 0.66, "learning_rate": 1.382863667259841e-06, "loss": 0.9338, "step": 34878 }, { "epoch": 0.66, "learning_rate": 1.382727004285725e-06, "loss": 0.9341, "step": 34879 }, { "epoch": 0.66, "learning_rate": 1.3825903454834738e-06, "loss": 0.909, "step": 34880 }, { "epoch": 0.66, "learning_rate": 1.3824536908535945e-06, "loss": 1.0695, "step": 34881 }, { "epoch": 0.66, "learning_rate": 1.3823170403965997e-06, "loss": 0.7917, "step": 34882 }, { "epoch": 0.66, "learning_rate": 1.3821803941129983e-06, "loss": 0.8214, "step": 34883 }, { "epoch": 0.66, "learning_rate": 1.3820437520033008e-06, "loss": 0.8938, "step": 34884 }, { "epoch": 0.66, "learning_rate": 1.3819071140680183e-06, "loss": 0.754, "step": 34885 }, { "epoch": 0.66, "learning_rate": 1.3817704803076598e-06, "loss": 1.222, "step": 34886 }, { "epoch": 0.66, "learning_rate": 1.3816338507227372e-06, "loss": 0.8724, "step": 34887 }, { "epoch": 0.66, "learning_rate": 1.3814972253137575e-06, "loss": 1.0527, "step": 34888 }, { "epoch": 0.66, "learning_rate": 1.3813606040812352e-06, "loss": 0.8243, "step": 34889 }, { "epoch": 0.66, "learning_rate": 1.3812239870256768e-06, "loss": 0.9405, "step": 34890 }, { "epoch": 0.66, "learning_rate": 1.3810873741475927e-06, "loss": 0.7467, "step": 34891 }, { "epoch": 0.66, "learning_rate": 1.3809507654474962e-06, "loss": 1.0701, "step": 34892 }, { "epoch": 0.66, "learning_rate": 1.3808141609258941e-06, "loss": 1.2369, "step": 34893 }, { "epoch": 0.66, "learning_rate": 1.3806775605832987e-06, "loss": 1.1282, "step": 34894 }, { "epoch": 0.66, "learning_rate": 1.380540964420217e-06, "loss": 0.9034, "step": 34895 }, { "epoch": 0.66, "learning_rate": 1.3804043724371619e-06, "loss": 0.8405, "step": 34896 }, { "epoch": 0.66, "learning_rate": 1.3802677846346434e-06, "loss": 0.7353, "step": 34897 }, { "epoch": 0.66, "learning_rate": 1.380131201013169e-06, "loss": 0.8411, "step": 34898 }, { "epoch": 0.66, "learning_rate": 1.3799946215732524e-06, "loss": 0.8853, "step": 34899 }, { "epoch": 0.66, "learning_rate": 1.3798580463154e-06, "loss": 1.1066, "step": 34900 }, { "epoch": 0.66, "learning_rate": 1.3797214752401239e-06, "loss": 0.943, "step": 34901 }, { "epoch": 0.66, "learning_rate": 1.379584908347933e-06, "loss": 0.9472, "step": 34902 }, { "epoch": 0.66, "learning_rate": 1.3794483456393382e-06, "loss": 0.7267, "step": 34903 }, { "epoch": 0.66, "learning_rate": 1.3793117871148485e-06, "loss": 0.8154, "step": 34904 }, { "epoch": 0.66, "learning_rate": 1.3791752327749742e-06, "loss": 0.8254, "step": 34905 }, { "epoch": 0.66, "learning_rate": 1.3790386826202265e-06, "loss": 1.1052, "step": 34906 }, { "epoch": 0.66, "learning_rate": 1.3789021366511119e-06, "loss": 1.02, "step": 34907 }, { "epoch": 0.66, "learning_rate": 1.3787655948681444e-06, "loss": 0.8712, "step": 34908 }, { "epoch": 0.66, "learning_rate": 1.3786290572718305e-06, "loss": 0.9155, "step": 34909 }, { "epoch": 0.66, "learning_rate": 1.3784925238626818e-06, "loss": 0.7833, "step": 34910 }, { "epoch": 0.66, "learning_rate": 1.3783559946412074e-06, "loss": 0.6992, "step": 34911 }, { "epoch": 0.66, "learning_rate": 1.378219469607917e-06, "loss": 0.9119, "step": 34912 }, { "epoch": 0.66, "learning_rate": 1.378082948763321e-06, "loss": 0.9752, "step": 34913 }, { "epoch": 0.66, "learning_rate": 1.377946432107929e-06, "loss": 0.9103, "step": 34914 }, { "epoch": 0.66, "learning_rate": 1.3778099196422511e-06, "loss": 0.9468, "step": 34915 }, { "epoch": 0.66, "learning_rate": 1.377673411366795e-06, "loss": 0.824, "step": 34916 }, { "epoch": 0.66, "learning_rate": 1.3775369072820733e-06, "loss": 0.9355, "step": 34917 }, { "epoch": 0.66, "learning_rate": 1.377400407388595e-06, "loss": 1.1691, "step": 34918 }, { "epoch": 0.66, "learning_rate": 1.3772639116868668e-06, "loss": 1.0572, "step": 34919 }, { "epoch": 0.66, "learning_rate": 1.3771274201774033e-06, "loss": 0.7336, "step": 34920 }, { "epoch": 0.66, "learning_rate": 1.37699093286071e-06, "loss": 0.8896, "step": 34921 }, { "epoch": 0.66, "learning_rate": 1.3768544497372987e-06, "loss": 1.0538, "step": 34922 }, { "epoch": 0.66, "learning_rate": 1.3767179708076784e-06, "loss": 0.7987, "step": 34923 }, { "epoch": 0.66, "learning_rate": 1.3765814960723583e-06, "loss": 1.0789, "step": 34924 }, { "epoch": 0.66, "learning_rate": 1.376445025531849e-06, "loss": 1.0723, "step": 34925 }, { "epoch": 0.66, "learning_rate": 1.376308559186659e-06, "loss": 0.9432, "step": 34926 }, { "epoch": 0.66, "learning_rate": 1.3761720970372997e-06, "loss": 0.8038, "step": 34927 }, { "epoch": 0.66, "learning_rate": 1.3760356390842773e-06, "loss": 1.0903, "step": 34928 }, { "epoch": 0.66, "learning_rate": 1.3758991853281053e-06, "loss": 0.8126, "step": 34929 }, { "epoch": 0.66, "learning_rate": 1.3757627357692904e-06, "loss": 1.0684, "step": 34930 }, { "epoch": 0.66, "learning_rate": 1.3756262904083428e-06, "loss": 0.9673, "step": 34931 }, { "epoch": 0.66, "learning_rate": 1.3754898492457725e-06, "loss": 0.8208, "step": 34932 }, { "epoch": 0.66, "learning_rate": 1.3753534122820882e-06, "loss": 0.8829, "step": 34933 }, { "epoch": 0.66, "learning_rate": 1.3752169795178e-06, "loss": 0.9548, "step": 34934 }, { "epoch": 0.66, "learning_rate": 1.375080550953417e-06, "loss": 0.7503, "step": 34935 }, { "epoch": 0.66, "learning_rate": 1.3749441265894497e-06, "loss": 0.9625, "step": 34936 }, { "epoch": 0.66, "learning_rate": 1.3748077064264048e-06, "loss": 1.1149, "step": 34937 }, { "epoch": 0.66, "learning_rate": 1.374671290464794e-06, "loss": 1.1364, "step": 34938 }, { "epoch": 0.66, "learning_rate": 1.3745348787051274e-06, "loss": 0.9165, "step": 34939 }, { "epoch": 0.66, "learning_rate": 1.3743984711479108e-06, "loss": 0.9638, "step": 34940 }, { "epoch": 0.66, "learning_rate": 1.374262067793658e-06, "loss": 0.7376, "step": 34941 }, { "epoch": 0.66, "learning_rate": 1.3741256686428752e-06, "loss": 0.875, "step": 34942 }, { "epoch": 0.66, "learning_rate": 1.3739892736960725e-06, "loss": 1.107, "step": 34943 }, { "epoch": 0.66, "learning_rate": 1.3738528829537596e-06, "loss": 1.1037, "step": 34944 }, { "epoch": 0.66, "learning_rate": 1.373716496416445e-06, "loss": 0.9531, "step": 34945 }, { "epoch": 0.66, "learning_rate": 1.3735801140846389e-06, "loss": 0.7981, "step": 34946 }, { "epoch": 0.66, "learning_rate": 1.3734437359588502e-06, "loss": 1.1761, "step": 34947 }, { "epoch": 0.66, "learning_rate": 1.3733073620395887e-06, "loss": 0.7262, "step": 34948 }, { "epoch": 0.66, "learning_rate": 1.3731709923273611e-06, "loss": 0.9074, "step": 34949 }, { "epoch": 0.66, "learning_rate": 1.3730346268226804e-06, "loss": 1.1686, "step": 34950 }, { "epoch": 0.66, "learning_rate": 1.3728982655260532e-06, "loss": 0.8177, "step": 34951 }, { "epoch": 0.66, "learning_rate": 1.372761908437989e-06, "loss": 0.8563, "step": 34952 }, { "epoch": 0.66, "learning_rate": 1.3726255555589971e-06, "loss": 0.9006, "step": 34953 }, { "epoch": 0.66, "learning_rate": 1.372489206889587e-06, "loss": 0.7484, "step": 34954 }, { "epoch": 0.66, "learning_rate": 1.3723528624302676e-06, "loss": 0.9405, "step": 34955 }, { "epoch": 0.66, "learning_rate": 1.3722165221815481e-06, "loss": 0.9619, "step": 34956 }, { "epoch": 0.66, "learning_rate": 1.3720801861439387e-06, "loss": 0.9598, "step": 34957 }, { "epoch": 0.66, "learning_rate": 1.3719438543179448e-06, "loss": 0.9728, "step": 34958 }, { "epoch": 0.66, "learning_rate": 1.3718075267040793e-06, "loss": 0.8788, "step": 34959 }, { "epoch": 0.66, "learning_rate": 1.3716712033028509e-06, "loss": 1.0167, "step": 34960 }, { "epoch": 0.66, "learning_rate": 1.3715348841147658e-06, "loss": 0.9266, "step": 34961 }, { "epoch": 0.66, "learning_rate": 1.3713985691403363e-06, "loss": 1.1754, "step": 34962 }, { "epoch": 0.66, "learning_rate": 1.3712622583800694e-06, "loss": 1.1389, "step": 34963 }, { "epoch": 0.66, "learning_rate": 1.3711259518344743e-06, "loss": 1.0985, "step": 34964 }, { "epoch": 0.66, "learning_rate": 1.370989649504061e-06, "loss": 0.8842, "step": 34965 }, { "epoch": 0.66, "learning_rate": 1.3708533513893367e-06, "loss": 0.7825, "step": 34966 }, { "epoch": 0.66, "learning_rate": 1.3707170574908122e-06, "loss": 0.7812, "step": 34967 }, { "epoch": 0.66, "learning_rate": 1.3705807678089953e-06, "loss": 0.8903, "step": 34968 }, { "epoch": 0.66, "learning_rate": 1.370444482344396e-06, "loss": 1.2274, "step": 34969 }, { "epoch": 0.66, "learning_rate": 1.3703082010975204e-06, "loss": 0.9718, "step": 34970 }, { "epoch": 0.66, "learning_rate": 1.3701719240688816e-06, "loss": 0.6807, "step": 34971 }, { "epoch": 0.66, "learning_rate": 1.3700356512589853e-06, "loss": 0.866, "step": 34972 }, { "epoch": 0.66, "learning_rate": 1.369899382668341e-06, "loss": 0.758, "step": 34973 }, { "epoch": 0.66, "learning_rate": 1.3697631182974575e-06, "loss": 0.9462, "step": 34974 }, { "epoch": 0.66, "learning_rate": 1.3696268581468442e-06, "loss": 1.1671, "step": 34975 }, { "epoch": 0.66, "learning_rate": 1.3694906022170096e-06, "loss": 0.9334, "step": 34976 }, { "epoch": 0.66, "learning_rate": 1.3693543505084622e-06, "loss": 0.8085, "step": 34977 }, { "epoch": 0.66, "learning_rate": 1.3692181030217119e-06, "loss": 0.8669, "step": 34978 }, { "epoch": 0.66, "learning_rate": 1.3690818597572647e-06, "loss": 0.5705, "step": 34979 }, { "epoch": 0.66, "learning_rate": 1.3689456207156321e-06, "loss": 0.9354, "step": 34980 }, { "epoch": 0.66, "learning_rate": 1.3688093858973232e-06, "loss": 0.9762, "step": 34981 }, { "epoch": 0.66, "learning_rate": 1.3686731553028431e-06, "loss": 1.0499, "step": 34982 }, { "epoch": 0.66, "learning_rate": 1.3685369289327046e-06, "loss": 0.7506, "step": 34983 }, { "epoch": 0.66, "learning_rate": 1.3684007067874138e-06, "loss": 0.9501, "step": 34984 }, { "epoch": 0.66, "learning_rate": 1.3682644888674801e-06, "loss": 0.8928, "step": 34985 }, { "epoch": 0.66, "learning_rate": 1.3681282751734118e-06, "loss": 0.8085, "step": 34986 }, { "epoch": 0.66, "learning_rate": 1.3679920657057178e-06, "loss": 0.9709, "step": 34987 }, { "epoch": 0.66, "learning_rate": 1.367855860464907e-06, "loss": 0.8998, "step": 34988 }, { "epoch": 0.66, "learning_rate": 1.3677196594514875e-06, "loss": 0.9719, "step": 34989 }, { "epoch": 0.66, "learning_rate": 1.3675834626659693e-06, "loss": 1.0037, "step": 34990 }, { "epoch": 0.66, "learning_rate": 1.3674472701088577e-06, "loss": 0.9051, "step": 34991 }, { "epoch": 0.66, "learning_rate": 1.367311081780665e-06, "loss": 1.0342, "step": 34992 }, { "epoch": 0.66, "learning_rate": 1.3671748976818972e-06, "loss": 0.9725, "step": 34993 }, { "epoch": 0.66, "learning_rate": 1.3670387178130635e-06, "loss": 0.97, "step": 34994 }, { "epoch": 0.66, "learning_rate": 1.3669025421746723e-06, "loss": 0.7603, "step": 34995 }, { "epoch": 0.66, "learning_rate": 1.3667663707672327e-06, "loss": 0.6982, "step": 34996 }, { "epoch": 0.66, "learning_rate": 1.3666302035912527e-06, "loss": 0.8817, "step": 34997 }, { "epoch": 0.66, "learning_rate": 1.3664940406472405e-06, "loss": 0.9445, "step": 34998 }, { "epoch": 0.66, "learning_rate": 1.366357881935706e-06, "loss": 1.1329, "step": 34999 }, { "epoch": 0.66, "learning_rate": 1.3662217274571544e-06, "loss": 1.1256, "step": 35000 }, { "epoch": 0.66, "learning_rate": 1.3660855772120969e-06, "loss": 0.9621, "step": 35001 }, { "epoch": 0.66, "learning_rate": 1.3659494312010422e-06, "loss": 0.8278, "step": 35002 }, { "epoch": 0.66, "learning_rate": 1.3658132894244956e-06, "loss": 0.8963, "step": 35003 }, { "epoch": 0.66, "learning_rate": 1.3656771518829693e-06, "loss": 0.8103, "step": 35004 }, { "epoch": 0.66, "learning_rate": 1.3655410185769686e-06, "loss": 0.8588, "step": 35005 }, { "epoch": 0.66, "learning_rate": 1.3654048895070031e-06, "loss": 0.9363, "step": 35006 }, { "epoch": 0.66, "learning_rate": 1.3652687646735812e-06, "loss": 0.9328, "step": 35007 }, { "epoch": 0.66, "learning_rate": 1.3651326440772106e-06, "loss": 0.6934, "step": 35008 }, { "epoch": 0.66, "learning_rate": 1.3649965277184003e-06, "loss": 0.7989, "step": 35009 }, { "epoch": 0.66, "learning_rate": 1.3648604155976577e-06, "loss": 0.8414, "step": 35010 }, { "epoch": 0.66, "learning_rate": 1.3647243077154928e-06, "loss": 1.0103, "step": 35011 }, { "epoch": 0.66, "learning_rate": 1.3645882040724107e-06, "loss": 1.0405, "step": 35012 }, { "epoch": 0.66, "learning_rate": 1.364452104668923e-06, "loss": 1.0535, "step": 35013 }, { "epoch": 0.66, "learning_rate": 1.3643160095055355e-06, "loss": 0.869, "step": 35014 }, { "epoch": 0.66, "learning_rate": 1.364179918582757e-06, "loss": 0.8336, "step": 35015 }, { "epoch": 0.66, "learning_rate": 1.3640438319010962e-06, "loss": 0.9028, "step": 35016 }, { "epoch": 0.66, "learning_rate": 1.3639077494610608e-06, "loss": 0.9061, "step": 35017 }, { "epoch": 0.66, "learning_rate": 1.363771671263159e-06, "loss": 1.2268, "step": 35018 }, { "epoch": 0.66, "learning_rate": 1.363635597307899e-06, "loss": 1.0444, "step": 35019 }, { "epoch": 0.66, "learning_rate": 1.3634995275957897e-06, "loss": 1.1046, "step": 35020 }, { "epoch": 0.66, "learning_rate": 1.3633634621273365e-06, "loss": 0.9335, "step": 35021 }, { "epoch": 0.66, "learning_rate": 1.3632274009030502e-06, "loss": 0.8828, "step": 35022 }, { "epoch": 0.66, "learning_rate": 1.3630913439234389e-06, "loss": 0.842, "step": 35023 }, { "epoch": 0.66, "learning_rate": 1.3629552911890076e-06, "loss": 0.8474, "step": 35024 }, { "epoch": 0.66, "learning_rate": 1.3628192427002684e-06, "loss": 0.9274, "step": 35025 }, { "epoch": 0.66, "learning_rate": 1.3626831984577266e-06, "loss": 0.8673, "step": 35026 }, { "epoch": 0.66, "learning_rate": 1.3625471584618905e-06, "loss": 0.786, "step": 35027 }, { "epoch": 0.66, "learning_rate": 1.3624111227132686e-06, "loss": 0.94, "step": 35028 }, { "epoch": 0.66, "learning_rate": 1.3622750912123683e-06, "loss": 0.8868, "step": 35029 }, { "epoch": 0.66, "learning_rate": 1.3621390639596985e-06, "loss": 0.6962, "step": 35030 }, { "epoch": 0.66, "learning_rate": 1.3620030409557664e-06, "loss": 1.0909, "step": 35031 }, { "epoch": 0.66, "learning_rate": 1.361867022201081e-06, "loss": 1.1372, "step": 35032 }, { "epoch": 0.66, "learning_rate": 1.3617310076961471e-06, "loss": 0.7766, "step": 35033 }, { "epoch": 0.66, "learning_rate": 1.3615949974414765e-06, "loss": 0.889, "step": 35034 }, { "epoch": 0.66, "learning_rate": 1.3614589914375747e-06, "loss": 0.796, "step": 35035 }, { "epoch": 0.66, "learning_rate": 1.36132298968495e-06, "loss": 0.9256, "step": 35036 }, { "epoch": 0.66, "learning_rate": 1.3611869921841103e-06, "loss": 1.0497, "step": 35037 }, { "epoch": 0.66, "learning_rate": 1.3610509989355637e-06, "loss": 1.0346, "step": 35038 }, { "epoch": 0.66, "learning_rate": 1.3609150099398177e-06, "loss": 0.8075, "step": 35039 }, { "epoch": 0.66, "learning_rate": 1.3607790251973798e-06, "loss": 0.8588, "step": 35040 }, { "epoch": 0.66, "learning_rate": 1.3606430447087593e-06, "loss": 0.9652, "step": 35041 }, { "epoch": 0.66, "learning_rate": 1.3605070684744608e-06, "loss": 0.9661, "step": 35042 }, { "epoch": 0.66, "learning_rate": 1.3603710964949947e-06, "loss": 0.998, "step": 35043 }, { "epoch": 0.66, "learning_rate": 1.3602351287708693e-06, "loss": 0.9379, "step": 35044 }, { "epoch": 0.66, "learning_rate": 1.360099165302589e-06, "loss": 0.9387, "step": 35045 }, { "epoch": 0.66, "learning_rate": 1.3599632060906654e-06, "loss": 0.8147, "step": 35046 }, { "epoch": 0.66, "learning_rate": 1.3598272511356031e-06, "loss": 1.0789, "step": 35047 }, { "epoch": 0.66, "learning_rate": 1.3596913004379108e-06, "loss": 1.0374, "step": 35048 }, { "epoch": 0.66, "learning_rate": 1.3595553539980962e-06, "loss": 0.9506, "step": 35049 }, { "epoch": 0.66, "learning_rate": 1.359419411816667e-06, "loss": 1.1395, "step": 35050 }, { "epoch": 0.66, "learning_rate": 1.359283473894131e-06, "loss": 0.6393, "step": 35051 }, { "epoch": 0.66, "learning_rate": 1.3591475402309955e-06, "loss": 1.0372, "step": 35052 }, { "epoch": 0.66, "learning_rate": 1.359011610827769e-06, "loss": 0.7953, "step": 35053 }, { "epoch": 0.66, "learning_rate": 1.3588756856849562e-06, "loss": 0.8951, "step": 35054 }, { "epoch": 0.66, "learning_rate": 1.3587397648030684e-06, "loss": 1.0246, "step": 35055 }, { "epoch": 0.66, "learning_rate": 1.3586038481826105e-06, "loss": 1.1847, "step": 35056 }, { "epoch": 0.66, "learning_rate": 1.3584679358240909e-06, "loss": 0.7946, "step": 35057 }, { "epoch": 0.66, "learning_rate": 1.3583320277280168e-06, "loss": 0.7047, "step": 35058 }, { "epoch": 0.66, "learning_rate": 1.358196123894896e-06, "loss": 0.7988, "step": 35059 }, { "epoch": 0.66, "learning_rate": 1.3580602243252362e-06, "loss": 0.8736, "step": 35060 }, { "epoch": 0.66, "learning_rate": 1.357924329019544e-06, "loss": 0.8826, "step": 35061 }, { "epoch": 0.66, "learning_rate": 1.3577884379783286e-06, "loss": 0.9094, "step": 35062 }, { "epoch": 0.66, "learning_rate": 1.357652551202094e-06, "loss": 0.7978, "step": 35063 }, { "epoch": 0.66, "learning_rate": 1.357516668691351e-06, "loss": 0.9977, "step": 35064 }, { "epoch": 0.66, "learning_rate": 1.3573807904466063e-06, "loss": 0.9316, "step": 35065 }, { "epoch": 0.66, "learning_rate": 1.3572449164683652e-06, "loss": 0.9551, "step": 35066 }, { "epoch": 0.66, "learning_rate": 1.3571090467571383e-06, "loss": 0.9654, "step": 35067 }, { "epoch": 0.66, "learning_rate": 1.35697318131343e-06, "loss": 1.025, "step": 35068 }, { "epoch": 0.66, "learning_rate": 1.356837320137749e-06, "loss": 1.1993, "step": 35069 }, { "epoch": 0.66, "learning_rate": 1.3567014632306026e-06, "loss": 0.9271, "step": 35070 }, { "epoch": 0.66, "learning_rate": 1.3565656105924977e-06, "loss": 0.6727, "step": 35071 }, { "epoch": 0.66, "learning_rate": 1.3564297622239418e-06, "loss": 0.8903, "step": 35072 }, { "epoch": 0.66, "learning_rate": 1.356293918125442e-06, "loss": 0.8987, "step": 35073 }, { "epoch": 0.66, "learning_rate": 1.3561580782975064e-06, "loss": 0.9776, "step": 35074 }, { "epoch": 0.66, "learning_rate": 1.35602224274064e-06, "loss": 0.9261, "step": 35075 }, { "epoch": 0.66, "learning_rate": 1.3558864114553532e-06, "loss": 0.8929, "step": 35076 }, { "epoch": 0.66, "learning_rate": 1.3557505844421502e-06, "loss": 0.9917, "step": 35077 }, { "epoch": 0.66, "learning_rate": 1.3556147617015396e-06, "loss": 0.9796, "step": 35078 }, { "epoch": 0.66, "learning_rate": 1.3554789432340288e-06, "loss": 0.7656, "step": 35079 }, { "epoch": 0.66, "learning_rate": 1.3553431290401242e-06, "loss": 0.8832, "step": 35080 }, { "epoch": 0.66, "learning_rate": 1.3552073191203332e-06, "loss": 1.1275, "step": 35081 }, { "epoch": 0.66, "learning_rate": 1.3550715134751629e-06, "loss": 1.0173, "step": 35082 }, { "epoch": 0.66, "learning_rate": 1.3549357121051218e-06, "loss": 0.7979, "step": 35083 }, { "epoch": 0.66, "learning_rate": 1.3547999150107136e-06, "loss": 0.7667, "step": 35084 }, { "epoch": 0.66, "learning_rate": 1.3546641221924484e-06, "loss": 0.7946, "step": 35085 }, { "epoch": 0.66, "learning_rate": 1.354528333650833e-06, "loss": 1.0031, "step": 35086 }, { "epoch": 0.66, "learning_rate": 1.3543925493863718e-06, "loss": 0.9443, "step": 35087 }, { "epoch": 0.66, "learning_rate": 1.3542567693995756e-06, "loss": 0.9154, "step": 35088 }, { "epoch": 0.66, "learning_rate": 1.3541209936909486e-06, "loss": 1.1031, "step": 35089 }, { "epoch": 0.66, "learning_rate": 1.3539852222609986e-06, "loss": 0.7844, "step": 35090 }, { "epoch": 0.66, "learning_rate": 1.3538494551102327e-06, "loss": 0.9354, "step": 35091 }, { "epoch": 0.66, "learning_rate": 1.353713692239158e-06, "loss": 0.7834, "step": 35092 }, { "epoch": 0.66, "learning_rate": 1.353577933648281e-06, "loss": 1.1683, "step": 35093 }, { "epoch": 0.66, "learning_rate": 1.353442179338109e-06, "loss": 0.9228, "step": 35094 }, { "epoch": 0.66, "learning_rate": 1.3533064293091494e-06, "loss": 0.9642, "step": 35095 }, { "epoch": 0.66, "learning_rate": 1.353170683561907e-06, "loss": 1.0038, "step": 35096 }, { "epoch": 0.66, "learning_rate": 1.3530349420968914e-06, "loss": 0.931, "step": 35097 }, { "epoch": 0.66, "learning_rate": 1.3528992049146078e-06, "loss": 0.681, "step": 35098 }, { "epoch": 0.66, "learning_rate": 1.352763472015563e-06, "loss": 1.0908, "step": 35099 }, { "epoch": 0.66, "learning_rate": 1.3526277434002643e-06, "loss": 1.1791, "step": 35100 }, { "epoch": 0.66, "learning_rate": 1.3524920190692184e-06, "loss": 0.8882, "step": 35101 }, { "epoch": 0.66, "learning_rate": 1.3523562990229323e-06, "loss": 0.8887, "step": 35102 }, { "epoch": 0.66, "learning_rate": 1.3522205832619123e-06, "loss": 0.9275, "step": 35103 }, { "epoch": 0.66, "learning_rate": 1.3520848717866668e-06, "loss": 0.8603, "step": 35104 }, { "epoch": 0.66, "learning_rate": 1.351949164597699e-06, "loss": 0.8593, "step": 35105 }, { "epoch": 0.66, "learning_rate": 1.3518134616955186e-06, "loss": 1.0157, "step": 35106 }, { "epoch": 0.66, "learning_rate": 1.351677763080633e-06, "loss": 1.0153, "step": 35107 }, { "epoch": 0.66, "learning_rate": 1.3515420687535453e-06, "loss": 0.8768, "step": 35108 }, { "epoch": 0.66, "learning_rate": 1.351406378714766e-06, "loss": 0.816, "step": 35109 }, { "epoch": 0.66, "learning_rate": 1.3512706929647996e-06, "loss": 0.8222, "step": 35110 }, { "epoch": 0.66, "learning_rate": 1.3511350115041527e-06, "loss": 1.1346, "step": 35111 }, { "epoch": 0.66, "learning_rate": 1.3509993343333324e-06, "loss": 1.0715, "step": 35112 }, { "epoch": 0.66, "learning_rate": 1.350863661452846e-06, "loss": 0.9941, "step": 35113 }, { "epoch": 0.66, "learning_rate": 1.350727992863199e-06, "loss": 0.944, "step": 35114 }, { "epoch": 0.66, "learning_rate": 1.350592328564898e-06, "loss": 0.8997, "step": 35115 }, { "epoch": 0.66, "learning_rate": 1.3504566685584515e-06, "loss": 0.808, "step": 35116 }, { "epoch": 0.66, "learning_rate": 1.3503210128443629e-06, "loss": 0.8832, "step": 35117 }, { "epoch": 0.66, "learning_rate": 1.350185361423142e-06, "loss": 1.1532, "step": 35118 }, { "epoch": 0.66, "learning_rate": 1.3500497142952923e-06, "loss": 0.9541, "step": 35119 }, { "epoch": 0.66, "learning_rate": 1.3499140714613224e-06, "loss": 0.7853, "step": 35120 }, { "epoch": 0.66, "learning_rate": 1.3497784329217377e-06, "loss": 0.8005, "step": 35121 }, { "epoch": 0.66, "learning_rate": 1.3496427986770453e-06, "loss": 0.8666, "step": 35122 }, { "epoch": 0.66, "learning_rate": 1.3495071687277511e-06, "loss": 0.7596, "step": 35123 }, { "epoch": 0.66, "learning_rate": 1.349371543074362e-06, "loss": 1.1035, "step": 35124 }, { "epoch": 0.66, "learning_rate": 1.3492359217173856e-06, "loss": 1.0734, "step": 35125 }, { "epoch": 0.66, "learning_rate": 1.3491003046573257e-06, "loss": 0.7323, "step": 35126 }, { "epoch": 0.66, "learning_rate": 1.3489646918946892e-06, "loss": 0.8009, "step": 35127 }, { "epoch": 0.66, "learning_rate": 1.3488290834299849e-06, "loss": 0.8597, "step": 35128 }, { "epoch": 0.66, "learning_rate": 1.3486934792637166e-06, "loss": 0.7967, "step": 35129 }, { "epoch": 0.66, "learning_rate": 1.3485578793963916e-06, "loss": 0.8509, "step": 35130 }, { "epoch": 0.66, "learning_rate": 1.348422283828516e-06, "loss": 1.1049, "step": 35131 }, { "epoch": 0.66, "learning_rate": 1.3482866925605968e-06, "loss": 0.9717, "step": 35132 }, { "epoch": 0.66, "learning_rate": 1.3481511055931393e-06, "loss": 0.5181, "step": 35133 }, { "epoch": 0.66, "learning_rate": 1.3480155229266503e-06, "loss": 0.8987, "step": 35134 }, { "epoch": 0.66, "learning_rate": 1.3478799445616372e-06, "loss": 1.0688, "step": 35135 }, { "epoch": 0.66, "learning_rate": 1.3477443704986032e-06, "loss": 0.9237, "step": 35136 }, { "epoch": 0.66, "learning_rate": 1.3476088007380577e-06, "loss": 1.0468, "step": 35137 }, { "epoch": 0.66, "learning_rate": 1.3474732352805054e-06, "loss": 0.9839, "step": 35138 }, { "epoch": 0.66, "learning_rate": 1.3473376741264521e-06, "loss": 0.8845, "step": 35139 }, { "epoch": 0.66, "learning_rate": 1.347202117276405e-06, "loss": 0.827, "step": 35140 }, { "epoch": 0.66, "learning_rate": 1.3470665647308698e-06, "loss": 1.0576, "step": 35141 }, { "epoch": 0.66, "learning_rate": 1.3469310164903527e-06, "loss": 0.9204, "step": 35142 }, { "epoch": 0.66, "learning_rate": 1.3467954725553595e-06, "loss": 0.9473, "step": 35143 }, { "epoch": 0.66, "learning_rate": 1.346659932926398e-06, "loss": 0.9568, "step": 35144 }, { "epoch": 0.66, "learning_rate": 1.346524397603971e-06, "loss": 0.964, "step": 35145 }, { "epoch": 0.66, "learning_rate": 1.3463888665885882e-06, "loss": 0.9165, "step": 35146 }, { "epoch": 0.66, "learning_rate": 1.346253339880753e-06, "loss": 0.7734, "step": 35147 }, { "epoch": 0.66, "learning_rate": 1.3461178174809718e-06, "loss": 0.917, "step": 35148 }, { "epoch": 0.66, "learning_rate": 1.345982299389753e-06, "loss": 0.9492, "step": 35149 }, { "epoch": 0.66, "learning_rate": 1.3458467856076001e-06, "loss": 0.8925, "step": 35150 }, { "epoch": 0.66, "learning_rate": 1.34571127613502e-06, "loss": 0.8124, "step": 35151 }, { "epoch": 0.66, "learning_rate": 1.3455757709725182e-06, "loss": 0.8848, "step": 35152 }, { "epoch": 0.66, "learning_rate": 1.3454402701206014e-06, "loss": 0.8654, "step": 35153 }, { "epoch": 0.66, "learning_rate": 1.3453047735797753e-06, "loss": 0.8837, "step": 35154 }, { "epoch": 0.66, "learning_rate": 1.3451692813505453e-06, "loss": 0.7537, "step": 35155 }, { "epoch": 0.66, "learning_rate": 1.3450337934334193e-06, "loss": 0.9858, "step": 35156 }, { "epoch": 0.66, "learning_rate": 1.3448983098288996e-06, "loss": 0.7659, "step": 35157 }, { "epoch": 0.66, "learning_rate": 1.344762830537496e-06, "loss": 0.803, "step": 35158 }, { "epoch": 0.66, "learning_rate": 1.3446273555597118e-06, "loss": 0.9049, "step": 35159 }, { "epoch": 0.66, "learning_rate": 1.3444918848960533e-06, "loss": 0.9482, "step": 35160 }, { "epoch": 0.66, "learning_rate": 1.344356418547027e-06, "loss": 1.0038, "step": 35161 }, { "epoch": 0.66, "learning_rate": 1.344220956513138e-06, "loss": 1.0705, "step": 35162 }, { "epoch": 0.66, "learning_rate": 1.344085498794893e-06, "loss": 0.9599, "step": 35163 }, { "epoch": 0.66, "learning_rate": 1.3439500453927973e-06, "loss": 0.906, "step": 35164 }, { "epoch": 0.66, "learning_rate": 1.3438145963073573e-06, "loss": 0.9189, "step": 35165 }, { "epoch": 0.66, "learning_rate": 1.3436791515390763e-06, "loss": 0.9296, "step": 35166 }, { "epoch": 0.66, "learning_rate": 1.3435437110884641e-06, "loss": 0.887, "step": 35167 }, { "epoch": 0.66, "learning_rate": 1.3434082749560229e-06, "loss": 0.9668, "step": 35168 }, { "epoch": 0.66, "learning_rate": 1.343272843142259e-06, "loss": 0.919, "step": 35169 }, { "epoch": 0.66, "learning_rate": 1.3431374156476806e-06, "loss": 0.8929, "step": 35170 }, { "epoch": 0.66, "learning_rate": 1.343001992472791e-06, "loss": 0.812, "step": 35171 }, { "epoch": 0.66, "learning_rate": 1.3428665736180963e-06, "loss": 0.7646, "step": 35172 }, { "epoch": 0.66, "learning_rate": 1.3427311590841022e-06, "loss": 0.8141, "step": 35173 }, { "epoch": 0.66, "learning_rate": 1.3425957488713143e-06, "loss": 1.148, "step": 35174 }, { "epoch": 0.66, "learning_rate": 1.3424603429802388e-06, "loss": 1.2141, "step": 35175 }, { "epoch": 0.66, "learning_rate": 1.3423249414113808e-06, "loss": 0.7621, "step": 35176 }, { "epoch": 0.66, "learning_rate": 1.3421895441652468e-06, "loss": 0.7331, "step": 35177 }, { "epoch": 0.66, "learning_rate": 1.3420541512423396e-06, "loss": 0.8035, "step": 35178 }, { "epoch": 0.66, "learning_rate": 1.3419187626431687e-06, "loss": 0.7815, "step": 35179 }, { "epoch": 0.66, "learning_rate": 1.3417833783682366e-06, "loss": 0.985, "step": 35180 }, { "epoch": 0.66, "learning_rate": 1.3416479984180502e-06, "loss": 0.8971, "step": 35181 }, { "epoch": 0.66, "learning_rate": 1.341512622793114e-06, "loss": 0.8653, "step": 35182 }, { "epoch": 0.66, "learning_rate": 1.341377251493935e-06, "loss": 1.0228, "step": 35183 }, { "epoch": 0.66, "learning_rate": 1.3412418845210172e-06, "loss": 0.7354, "step": 35184 }, { "epoch": 0.66, "learning_rate": 1.3411065218748667e-06, "loss": 0.9177, "step": 35185 }, { "epoch": 0.66, "learning_rate": 1.3409711635559902e-06, "loss": 0.8141, "step": 35186 }, { "epoch": 0.66, "learning_rate": 1.3408358095648896e-06, "loss": 1.0672, "step": 35187 }, { "epoch": 0.66, "learning_rate": 1.3407004599020746e-06, "loss": 0.8579, "step": 35188 }, { "epoch": 0.66, "learning_rate": 1.3405651145680476e-06, "loss": 0.7026, "step": 35189 }, { "epoch": 0.66, "learning_rate": 1.3404297735633138e-06, "loss": 0.9804, "step": 35190 }, { "epoch": 0.66, "learning_rate": 1.340294436888382e-06, "loss": 0.8581, "step": 35191 }, { "epoch": 0.66, "learning_rate": 1.3401591045437536e-06, "loss": 0.8843, "step": 35192 }, { "epoch": 0.66, "learning_rate": 1.3400237765299361e-06, "loss": 0.9314, "step": 35193 }, { "epoch": 0.66, "learning_rate": 1.339888452847434e-06, "loss": 0.834, "step": 35194 }, { "epoch": 0.66, "learning_rate": 1.3397531334967528e-06, "loss": 0.8611, "step": 35195 }, { "epoch": 0.66, "learning_rate": 1.3396178184783982e-06, "loss": 1.0085, "step": 35196 }, { "epoch": 0.66, "learning_rate": 1.3394825077928747e-06, "loss": 0.9476, "step": 35197 }, { "epoch": 0.66, "learning_rate": 1.3393472014406888e-06, "loss": 0.862, "step": 35198 }, { "epoch": 0.66, "learning_rate": 1.3392118994223432e-06, "loss": 0.8477, "step": 35199 }, { "epoch": 0.66, "learning_rate": 1.3390766017383467e-06, "loss": 1.0634, "step": 35200 }, { "epoch": 0.66, "learning_rate": 1.3389413083892016e-06, "loss": 1.0742, "step": 35201 }, { "epoch": 0.66, "learning_rate": 1.338806019375414e-06, "loss": 0.773, "step": 35202 }, { "epoch": 0.66, "learning_rate": 1.3386707346974892e-06, "loss": 0.7844, "step": 35203 }, { "epoch": 0.66, "learning_rate": 1.338535454355932e-06, "loss": 0.7764, "step": 35204 }, { "epoch": 0.66, "learning_rate": 1.3384001783512482e-06, "loss": 1.0016, "step": 35205 }, { "epoch": 0.66, "learning_rate": 1.3382649066839424e-06, "loss": 1.1243, "step": 35206 }, { "epoch": 0.66, "learning_rate": 1.3381296393545208e-06, "loss": 0.8189, "step": 35207 }, { "epoch": 0.66, "learning_rate": 1.3379943763634854e-06, "loss": 0.9438, "step": 35208 }, { "epoch": 0.66, "learning_rate": 1.3378591177113454e-06, "loss": 1.1467, "step": 35209 }, { "epoch": 0.66, "learning_rate": 1.3377238633986029e-06, "loss": 0.9317, "step": 35210 }, { "epoch": 0.66, "learning_rate": 1.3375886134257626e-06, "loss": 1.1962, "step": 35211 }, { "epoch": 0.66, "learning_rate": 1.337453367793333e-06, "loss": 0.887, "step": 35212 }, { "epoch": 0.66, "learning_rate": 1.337318126501816e-06, "loss": 0.8296, "step": 35213 }, { "epoch": 0.66, "learning_rate": 1.3371828895517172e-06, "loss": 1.0502, "step": 35214 }, { "epoch": 0.66, "learning_rate": 1.337047656943542e-06, "loss": 0.7899, "step": 35215 }, { "epoch": 0.66, "learning_rate": 1.3369124286777952e-06, "loss": 0.7788, "step": 35216 }, { "epoch": 0.66, "learning_rate": 1.3367772047549816e-06, "loss": 0.7766, "step": 35217 }, { "epoch": 0.66, "learning_rate": 1.3366419851756062e-06, "loss": 1.2025, "step": 35218 }, { "epoch": 0.66, "learning_rate": 1.3365067699401752e-06, "loss": 1.1152, "step": 35219 }, { "epoch": 0.66, "learning_rate": 1.3363715590491903e-06, "loss": 1.1417, "step": 35220 }, { "epoch": 0.66, "learning_rate": 1.3362363525031602e-06, "loss": 0.9202, "step": 35221 }, { "epoch": 0.66, "learning_rate": 1.3361011503025868e-06, "loss": 0.8961, "step": 35222 }, { "epoch": 0.66, "learning_rate": 1.335965952447976e-06, "loss": 0.9979, "step": 35223 }, { "epoch": 0.66, "learning_rate": 1.3358307589398328e-06, "loss": 0.6764, "step": 35224 }, { "epoch": 0.66, "learning_rate": 1.3356955697786616e-06, "loss": 1.2466, "step": 35225 }, { "epoch": 0.66, "learning_rate": 1.3355603849649675e-06, "loss": 1.0627, "step": 35226 }, { "epoch": 0.66, "learning_rate": 1.3354252044992555e-06, "loss": 0.8385, "step": 35227 }, { "epoch": 0.66, "learning_rate": 1.335290028382031e-06, "loss": 0.8331, "step": 35228 }, { "epoch": 0.66, "learning_rate": 1.3351548566137957e-06, "loss": 0.794, "step": 35229 }, { "epoch": 0.66, "learning_rate": 1.3350196891950584e-06, "loss": 0.8941, "step": 35230 }, { "epoch": 0.66, "learning_rate": 1.334884526126321e-06, "loss": 1.0143, "step": 35231 }, { "epoch": 0.66, "learning_rate": 1.3347493674080881e-06, "loss": 0.86, "step": 35232 }, { "epoch": 0.66, "learning_rate": 1.334614213040867e-06, "loss": 0.7348, "step": 35233 }, { "epoch": 0.66, "learning_rate": 1.3344790630251597e-06, "loss": 0.9016, "step": 35234 }, { "epoch": 0.66, "learning_rate": 1.3343439173614722e-06, "loss": 0.9097, "step": 35235 }, { "epoch": 0.66, "learning_rate": 1.3342087760503086e-06, "loss": 0.965, "step": 35236 }, { "epoch": 0.66, "learning_rate": 1.3340736390921738e-06, "loss": 0.885, "step": 35237 }, { "epoch": 0.66, "learning_rate": 1.333938506487572e-06, "loss": 0.9479, "step": 35238 }, { "epoch": 0.66, "learning_rate": 1.3338033782370085e-06, "loss": 1.024, "step": 35239 }, { "epoch": 0.66, "learning_rate": 1.3336682543409882e-06, "loss": 0.7469, "step": 35240 }, { "epoch": 0.66, "learning_rate": 1.333533134800013e-06, "loss": 0.6452, "step": 35241 }, { "epoch": 0.66, "learning_rate": 1.3333980196145914e-06, "loss": 0.8469, "step": 35242 }, { "epoch": 0.66, "learning_rate": 1.3332629087852245e-06, "loss": 1.1213, "step": 35243 }, { "epoch": 0.66, "learning_rate": 1.333127802312418e-06, "loss": 0.8293, "step": 35244 }, { "epoch": 0.66, "learning_rate": 1.332992700196677e-06, "loss": 0.7895, "step": 35245 }, { "epoch": 0.66, "learning_rate": 1.332857602438505e-06, "loss": 0.8915, "step": 35246 }, { "epoch": 0.67, "learning_rate": 1.3327225090384072e-06, "loss": 0.7232, "step": 35247 }, { "epoch": 0.67, "learning_rate": 1.3325874199968876e-06, "loss": 0.7913, "step": 35248 }, { "epoch": 0.67, "learning_rate": 1.332452335314452e-06, "loss": 0.905, "step": 35249 }, { "epoch": 0.67, "learning_rate": 1.3323172549916014e-06, "loss": 0.8058, "step": 35250 }, { "epoch": 0.67, "learning_rate": 1.3321821790288446e-06, "loss": 0.7588, "step": 35251 }, { "epoch": 0.67, "learning_rate": 1.3320471074266825e-06, "loss": 0.8754, "step": 35252 }, { "epoch": 0.67, "learning_rate": 1.3319120401856198e-06, "loss": 0.8287, "step": 35253 }, { "epoch": 0.67, "learning_rate": 1.3317769773061636e-06, "loss": 0.8931, "step": 35254 }, { "epoch": 0.67, "learning_rate": 1.3316419187888154e-06, "loss": 0.795, "step": 35255 }, { "epoch": 0.67, "learning_rate": 1.3315068646340806e-06, "loss": 1.1512, "step": 35256 }, { "epoch": 0.67, "learning_rate": 1.331371814842463e-06, "loss": 0.5836, "step": 35257 }, { "epoch": 0.67, "learning_rate": 1.331236769414468e-06, "loss": 0.8935, "step": 35258 }, { "epoch": 0.67, "learning_rate": 1.3311017283505983e-06, "loss": 0.9781, "step": 35259 }, { "epoch": 0.67, "learning_rate": 1.3309666916513593e-06, "loss": 0.8088, "step": 35260 }, { "epoch": 0.67, "learning_rate": 1.3308316593172553e-06, "loss": 0.8151, "step": 35261 }, { "epoch": 0.67, "learning_rate": 1.3306966313487885e-06, "loss": 1.0319, "step": 35262 }, { "epoch": 0.67, "learning_rate": 1.3305616077464666e-06, "loss": 0.9459, "step": 35263 }, { "epoch": 0.67, "learning_rate": 1.3304265885107908e-06, "loss": 0.8727, "step": 35264 }, { "epoch": 0.67, "learning_rate": 1.3302915736422661e-06, "loss": 0.9722, "step": 35265 }, { "epoch": 0.67, "learning_rate": 1.330156563141397e-06, "loss": 0.9267, "step": 35266 }, { "epoch": 0.67, "learning_rate": 1.330021557008687e-06, "loss": 0.8358, "step": 35267 }, { "epoch": 0.67, "learning_rate": 1.3298865552446411e-06, "loss": 1.0681, "step": 35268 }, { "epoch": 0.67, "learning_rate": 1.3297515578497628e-06, "loss": 0.9329, "step": 35269 }, { "epoch": 0.67, "learning_rate": 1.3296165648245575e-06, "loss": 0.526, "step": 35270 }, { "epoch": 0.67, "learning_rate": 1.3294815761695256e-06, "loss": 1.0157, "step": 35271 }, { "epoch": 0.67, "learning_rate": 1.329346591885175e-06, "loss": 0.8472, "step": 35272 }, { "epoch": 0.67, "learning_rate": 1.3292116119720088e-06, "loss": 1.0273, "step": 35273 }, { "epoch": 0.67, "learning_rate": 1.3290766364305291e-06, "loss": 1.0354, "step": 35274 }, { "epoch": 0.67, "learning_rate": 1.3289416652612431e-06, "loss": 1.0511, "step": 35275 }, { "epoch": 0.67, "learning_rate": 1.3288066984646522e-06, "loss": 0.7631, "step": 35276 }, { "epoch": 0.67, "learning_rate": 1.328671736041261e-06, "loss": 0.7753, "step": 35277 }, { "epoch": 0.67, "learning_rate": 1.3285367779915736e-06, "loss": 0.7978, "step": 35278 }, { "epoch": 0.67, "learning_rate": 1.328401824316094e-06, "loss": 0.8546, "step": 35279 }, { "epoch": 0.67, "learning_rate": 1.328266875015326e-06, "loss": 0.8173, "step": 35280 }, { "epoch": 0.67, "learning_rate": 1.3281319300897739e-06, "loss": 0.9286, "step": 35281 }, { "epoch": 0.67, "learning_rate": 1.327996989539942e-06, "loss": 1.0312, "step": 35282 }, { "epoch": 0.67, "learning_rate": 1.3278620533663315e-06, "loss": 0.8844, "step": 35283 }, { "epoch": 0.67, "learning_rate": 1.32772712156945e-06, "loss": 0.8776, "step": 35284 }, { "epoch": 0.67, "learning_rate": 1.3275921941497985e-06, "loss": 0.9163, "step": 35285 }, { "epoch": 0.67, "learning_rate": 1.3274572711078818e-06, "loss": 0.8018, "step": 35286 }, { "epoch": 0.67, "learning_rate": 1.3273223524442035e-06, "loss": 1.0916, "step": 35287 }, { "epoch": 0.67, "learning_rate": 1.3271874381592682e-06, "loss": 1.0309, "step": 35288 }, { "epoch": 0.67, "learning_rate": 1.3270525282535785e-06, "loss": 0.9198, "step": 35289 }, { "epoch": 0.67, "learning_rate": 1.326917622727639e-06, "loss": 0.7037, "step": 35290 }, { "epoch": 0.67, "learning_rate": 1.326782721581954e-06, "loss": 0.972, "step": 35291 }, { "epoch": 0.67, "learning_rate": 1.3266478248170245e-06, "loss": 0.7443, "step": 35292 }, { "epoch": 0.67, "learning_rate": 1.3265129324333567e-06, "loss": 1.0765, "step": 35293 }, { "epoch": 0.67, "learning_rate": 1.3263780444314548e-06, "loss": 1.2753, "step": 35294 }, { "epoch": 0.67, "learning_rate": 1.3262431608118192e-06, "loss": 0.9247, "step": 35295 }, { "epoch": 0.67, "learning_rate": 1.3261082815749579e-06, "loss": 0.8617, "step": 35296 }, { "epoch": 0.67, "learning_rate": 1.3259734067213711e-06, "loss": 1.015, "step": 35297 }, { "epoch": 0.67, "learning_rate": 1.3258385362515636e-06, "loss": 0.7485, "step": 35298 }, { "epoch": 0.67, "learning_rate": 1.3257036701660393e-06, "loss": 0.8232, "step": 35299 }, { "epoch": 0.67, "learning_rate": 1.3255688084653012e-06, "loss": 1.1299, "step": 35300 }, { "epoch": 0.67, "learning_rate": 1.3254339511498531e-06, "loss": 1.019, "step": 35301 }, { "epoch": 0.67, "learning_rate": 1.3252990982201984e-06, "loss": 0.7834, "step": 35302 }, { "epoch": 0.67, "learning_rate": 1.3251642496768425e-06, "loss": 0.9405, "step": 35303 }, { "epoch": 0.67, "learning_rate": 1.325029405520285e-06, "loss": 0.9922, "step": 35304 }, { "epoch": 0.67, "learning_rate": 1.3248945657510337e-06, "loss": 0.8361, "step": 35305 }, { "epoch": 0.67, "learning_rate": 1.3247597303695889e-06, "loss": 0.9767, "step": 35306 }, { "epoch": 0.67, "learning_rate": 1.3246248993764551e-06, "loss": 0.9726, "step": 35307 }, { "epoch": 0.67, "learning_rate": 1.324490072772136e-06, "loss": 0.7046, "step": 35308 }, { "epoch": 0.67, "learning_rate": 1.3243552505571353e-06, "loss": 0.9984, "step": 35309 }, { "epoch": 0.67, "learning_rate": 1.3242204327319559e-06, "loss": 0.8722, "step": 35310 }, { "epoch": 0.67, "learning_rate": 1.324085619297101e-06, "loss": 0.873, "step": 35311 }, { "epoch": 0.67, "learning_rate": 1.3239508102530757e-06, "loss": 0.981, "step": 35312 }, { "epoch": 0.67, "learning_rate": 1.3238160056003798e-06, "loss": 1.0425, "step": 35313 }, { "epoch": 0.67, "learning_rate": 1.3236812053395199e-06, "loss": 0.8379, "step": 35314 }, { "epoch": 0.67, "learning_rate": 1.3235464094709992e-06, "loss": 0.6763, "step": 35315 }, { "epoch": 0.67, "learning_rate": 1.3234116179953186e-06, "loss": 1.0768, "step": 35316 }, { "epoch": 0.67, "learning_rate": 1.3232768309129845e-06, "loss": 1.0443, "step": 35317 }, { "epoch": 0.67, "learning_rate": 1.3231420482244978e-06, "loss": 0.9879, "step": 35318 }, { "epoch": 0.67, "learning_rate": 1.3230072699303627e-06, "loss": 0.9311, "step": 35319 }, { "epoch": 0.67, "learning_rate": 1.3228724960310823e-06, "loss": 0.7204, "step": 35320 }, { "epoch": 0.67, "learning_rate": 1.32273772652716e-06, "loss": 0.9073, "step": 35321 }, { "epoch": 0.67, "learning_rate": 1.3226029614190989e-06, "loss": 0.8625, "step": 35322 }, { "epoch": 0.67, "learning_rate": 1.322468200707402e-06, "loss": 0.6729, "step": 35323 }, { "epoch": 0.67, "learning_rate": 1.322333444392574e-06, "loss": 0.9836, "step": 35324 }, { "epoch": 0.67, "learning_rate": 1.3221986924751145e-06, "loss": 1.0878, "step": 35325 }, { "epoch": 0.67, "learning_rate": 1.3220639449555312e-06, "loss": 0.8793, "step": 35326 }, { "epoch": 0.67, "learning_rate": 1.3219292018343238e-06, "loss": 0.8724, "step": 35327 }, { "epoch": 0.67, "learning_rate": 1.321794463111997e-06, "loss": 0.8795, "step": 35328 }, { "epoch": 0.67, "learning_rate": 1.3216597287890531e-06, "loss": 0.9412, "step": 35329 }, { "epoch": 0.67, "learning_rate": 1.3215249988659961e-06, "loss": 0.8269, "step": 35330 }, { "epoch": 0.67, "learning_rate": 1.3213902733433284e-06, "loss": 1.1768, "step": 35331 }, { "epoch": 0.67, "learning_rate": 1.3212555522215534e-06, "loss": 0.9015, "step": 35332 }, { "epoch": 0.67, "learning_rate": 1.321120835501175e-06, "loss": 0.8818, "step": 35333 }, { "epoch": 0.67, "learning_rate": 1.3209861231826932e-06, "loss": 0.8521, "step": 35334 }, { "epoch": 0.67, "learning_rate": 1.3208514152666142e-06, "loss": 0.8384, "step": 35335 }, { "epoch": 0.67, "learning_rate": 1.3207167117534403e-06, "loss": 0.8478, "step": 35336 }, { "epoch": 0.67, "learning_rate": 1.3205820126436725e-06, "loss": 1.1686, "step": 35337 }, { "epoch": 0.67, "learning_rate": 1.3204473179378174e-06, "loss": 1.0579, "step": 35338 }, { "epoch": 0.67, "learning_rate": 1.3203126276363748e-06, "loss": 0.9483, "step": 35339 }, { "epoch": 0.67, "learning_rate": 1.3201779417398486e-06, "loss": 0.8544, "step": 35340 }, { "epoch": 0.67, "learning_rate": 1.3200432602487417e-06, "loss": 0.8683, "step": 35341 }, { "epoch": 0.67, "learning_rate": 1.3199085831635572e-06, "loss": 0.8074, "step": 35342 }, { "epoch": 0.67, "learning_rate": 1.3197739104847979e-06, "loss": 0.9204, "step": 35343 }, { "epoch": 0.67, "learning_rate": 1.3196392422129666e-06, "loss": 1.0708, "step": 35344 }, { "epoch": 0.67, "learning_rate": 1.319504578348567e-06, "loss": 0.8694, "step": 35345 }, { "epoch": 0.67, "learning_rate": 1.3193699188920995e-06, "loss": 1.1355, "step": 35346 }, { "epoch": 0.67, "learning_rate": 1.3192352638440704e-06, "loss": 0.9252, "step": 35347 }, { "epoch": 0.67, "learning_rate": 1.3191006132049794e-06, "loss": 1.0121, "step": 35348 }, { "epoch": 0.67, "learning_rate": 1.3189659669753305e-06, "loss": 1.1627, "step": 35349 }, { "epoch": 0.67, "learning_rate": 1.3188313251556266e-06, "loss": 1.1643, "step": 35350 }, { "epoch": 0.67, "learning_rate": 1.3186966877463702e-06, "loss": 1.0599, "step": 35351 }, { "epoch": 0.67, "learning_rate": 1.3185620547480643e-06, "loss": 0.8892, "step": 35352 }, { "epoch": 0.67, "learning_rate": 1.3184274261612112e-06, "loss": 0.9517, "step": 35353 }, { "epoch": 0.67, "learning_rate": 1.318292801986315e-06, "loss": 0.9888, "step": 35354 }, { "epoch": 0.67, "learning_rate": 1.3181581822238757e-06, "loss": 0.856, "step": 35355 }, { "epoch": 0.67, "learning_rate": 1.3180235668743979e-06, "loss": 1.1896, "step": 35356 }, { "epoch": 0.67, "learning_rate": 1.317888955938385e-06, "loss": 1.0372, "step": 35357 }, { "epoch": 0.67, "learning_rate": 1.317754349416337e-06, "loss": 0.9386, "step": 35358 }, { "epoch": 0.67, "learning_rate": 1.3176197473087592e-06, "loss": 1.0737, "step": 35359 }, { "epoch": 0.67, "learning_rate": 1.3174851496161526e-06, "loss": 0.9511, "step": 35360 }, { "epoch": 0.67, "learning_rate": 1.31735055633902e-06, "loss": 0.91, "step": 35361 }, { "epoch": 0.67, "learning_rate": 1.3172159674778639e-06, "loss": 1.1259, "step": 35362 }, { "epoch": 0.67, "learning_rate": 1.3170813830331874e-06, "loss": 0.9091, "step": 35363 }, { "epoch": 0.67, "learning_rate": 1.3169468030054937e-06, "loss": 1.0161, "step": 35364 }, { "epoch": 0.67, "learning_rate": 1.3168122273952828e-06, "loss": 0.9194, "step": 35365 }, { "epoch": 0.67, "learning_rate": 1.3166776562030603e-06, "loss": 0.7735, "step": 35366 }, { "epoch": 0.67, "learning_rate": 1.316543089429326e-06, "loss": 0.7581, "step": 35367 }, { "epoch": 0.67, "learning_rate": 1.316408527074584e-06, "loss": 0.9481, "step": 35368 }, { "epoch": 0.67, "learning_rate": 1.3162739691393356e-06, "loss": 1.1635, "step": 35369 }, { "epoch": 0.67, "learning_rate": 1.3161394156240845e-06, "loss": 0.7145, "step": 35370 }, { "epoch": 0.67, "learning_rate": 1.3160048665293323e-06, "loss": 0.5924, "step": 35371 }, { "epoch": 0.67, "learning_rate": 1.3158703218555818e-06, "loss": 0.8964, "step": 35372 }, { "epoch": 0.67, "learning_rate": 1.315735781603336e-06, "loss": 0.8779, "step": 35373 }, { "epoch": 0.67, "learning_rate": 1.3156012457730943e-06, "loss": 1.0048, "step": 35374 }, { "epoch": 0.67, "learning_rate": 1.3154667143653637e-06, "loss": 1.0632, "step": 35375 }, { "epoch": 0.67, "learning_rate": 1.315332187380643e-06, "loss": 0.8141, "step": 35376 }, { "epoch": 0.67, "learning_rate": 1.3151976648194342e-06, "loss": 0.637, "step": 35377 }, { "epoch": 0.67, "learning_rate": 1.3150631466822434e-06, "loss": 0.9606, "step": 35378 }, { "epoch": 0.67, "learning_rate": 1.3149286329695694e-06, "loss": 0.8034, "step": 35379 }, { "epoch": 0.67, "learning_rate": 1.3147941236819152e-06, "loss": 1.104, "step": 35380 }, { "epoch": 0.67, "learning_rate": 1.3146596188197836e-06, "loss": 1.0682, "step": 35381 }, { "epoch": 0.67, "learning_rate": 1.3145251183836766e-06, "loss": 1.171, "step": 35382 }, { "epoch": 0.67, "learning_rate": 1.3143906223740965e-06, "loss": 1.0063, "step": 35383 }, { "epoch": 0.67, "learning_rate": 1.3142561307915459e-06, "loss": 0.8878, "step": 35384 }, { "epoch": 0.67, "learning_rate": 1.314121643636527e-06, "loss": 0.9683, "step": 35385 }, { "epoch": 0.67, "learning_rate": 1.3139871609095398e-06, "loss": 0.993, "step": 35386 }, { "epoch": 0.67, "learning_rate": 1.3138526826110897e-06, "loss": 1.113, "step": 35387 }, { "epoch": 0.67, "learning_rate": 1.3137182087416769e-06, "loss": 1.0518, "step": 35388 }, { "epoch": 0.67, "learning_rate": 1.3135837393018036e-06, "loss": 0.8943, "step": 35389 }, { "epoch": 0.67, "learning_rate": 1.3134492742919725e-06, "loss": 1.0006, "step": 35390 }, { "epoch": 0.67, "learning_rate": 1.3133148137126855e-06, "loss": 0.8849, "step": 35391 }, { "epoch": 0.67, "learning_rate": 1.313180357564444e-06, "loss": 0.7917, "step": 35392 }, { "epoch": 0.67, "learning_rate": 1.3130459058477512e-06, "loss": 0.9858, "step": 35393 }, { "epoch": 0.67, "learning_rate": 1.3129114585631094e-06, "loss": 1.2033, "step": 35394 }, { "epoch": 0.67, "learning_rate": 1.3127770157110182e-06, "loss": 1.0384, "step": 35395 }, { "epoch": 0.67, "learning_rate": 1.3126425772919825e-06, "loss": 1.0226, "step": 35396 }, { "epoch": 0.67, "learning_rate": 1.3125081433065026e-06, "loss": 1.0233, "step": 35397 }, { "epoch": 0.67, "learning_rate": 1.3123737137550796e-06, "loss": 0.7754, "step": 35398 }, { "epoch": 0.67, "learning_rate": 1.3122392886382191e-06, "loss": 1.043, "step": 35399 }, { "epoch": 0.67, "learning_rate": 1.312104867956419e-06, "loss": 1.1596, "step": 35400 }, { "epoch": 0.67, "learning_rate": 1.3119704517101833e-06, "loss": 0.7803, "step": 35401 }, { "epoch": 0.67, "learning_rate": 1.3118360399000139e-06, "loss": 0.9338, "step": 35402 }, { "epoch": 0.67, "learning_rate": 1.3117016325264118e-06, "loss": 0.7566, "step": 35403 }, { "epoch": 0.67, "learning_rate": 1.3115672295898796e-06, "loss": 0.6444, "step": 35404 }, { "epoch": 0.67, "learning_rate": 1.3114328310909186e-06, "loss": 0.9713, "step": 35405 }, { "epoch": 0.67, "learning_rate": 1.3112984370300322e-06, "loss": 0.9565, "step": 35406 }, { "epoch": 0.67, "learning_rate": 1.3111640474077188e-06, "loss": 0.7931, "step": 35407 }, { "epoch": 0.67, "learning_rate": 1.3110296622244847e-06, "loss": 0.8123, "step": 35408 }, { "epoch": 0.67, "learning_rate": 1.3108952814808282e-06, "loss": 0.7921, "step": 35409 }, { "epoch": 0.67, "learning_rate": 1.3107609051772524e-06, "loss": 0.7012, "step": 35410 }, { "epoch": 0.67, "learning_rate": 1.3106265333142588e-06, "loss": 0.9175, "step": 35411 }, { "epoch": 0.67, "learning_rate": 1.3104921658923493e-06, "loss": 1.077, "step": 35412 }, { "epoch": 0.67, "learning_rate": 1.3103578029120256e-06, "loss": 1.0039, "step": 35413 }, { "epoch": 0.67, "learning_rate": 1.3102234443737894e-06, "loss": 0.914, "step": 35414 }, { "epoch": 0.67, "learning_rate": 1.3100890902781432e-06, "loss": 0.9656, "step": 35415 }, { "epoch": 0.67, "learning_rate": 1.3099547406255858e-06, "loss": 0.7462, "step": 35416 }, { "epoch": 0.67, "learning_rate": 1.3098203954166232e-06, "loss": 0.8827, "step": 35417 }, { "epoch": 0.67, "learning_rate": 1.3096860546517537e-06, "loss": 1.0172, "step": 35418 }, { "epoch": 0.67, "learning_rate": 1.3095517183314788e-06, "loss": 0.8836, "step": 35419 }, { "epoch": 0.67, "learning_rate": 1.3094173864563037e-06, "loss": 0.967, "step": 35420 }, { "epoch": 0.67, "learning_rate": 1.3092830590267262e-06, "loss": 0.8682, "step": 35421 }, { "epoch": 0.67, "learning_rate": 1.3091487360432491e-06, "loss": 0.9574, "step": 35422 }, { "epoch": 0.67, "learning_rate": 1.3090144175063747e-06, "loss": 0.9395, "step": 35423 }, { "epoch": 0.67, "learning_rate": 1.3088801034166032e-06, "loss": 1.1509, "step": 35424 }, { "epoch": 0.67, "learning_rate": 1.3087457937744374e-06, "loss": 0.9125, "step": 35425 }, { "epoch": 0.67, "learning_rate": 1.308611488580378e-06, "loss": 0.9797, "step": 35426 }, { "epoch": 0.67, "learning_rate": 1.3084771878349282e-06, "loss": 0.8896, "step": 35427 }, { "epoch": 0.67, "learning_rate": 1.3083428915385858e-06, "loss": 0.7507, "step": 35428 }, { "epoch": 0.67, "learning_rate": 1.3082085996918565e-06, "loss": 0.8851, "step": 35429 }, { "epoch": 0.67, "learning_rate": 1.3080743122952382e-06, "loss": 1.0363, "step": 35430 }, { "epoch": 0.67, "learning_rate": 1.3079400293492345e-06, "loss": 1.0117, "step": 35431 }, { "epoch": 0.67, "learning_rate": 1.3078057508543463e-06, "loss": 0.8471, "step": 35432 }, { "epoch": 0.67, "learning_rate": 1.3076714768110746e-06, "loss": 0.8994, "step": 35433 }, { "epoch": 0.67, "learning_rate": 1.307537207219921e-06, "loss": 0.9138, "step": 35434 }, { "epoch": 0.67, "learning_rate": 1.3074029420813872e-06, "loss": 0.8332, "step": 35435 }, { "epoch": 0.67, "learning_rate": 1.3072686813959752e-06, "loss": 0.7795, "step": 35436 }, { "epoch": 0.67, "learning_rate": 1.307134425164183e-06, "loss": 0.9453, "step": 35437 }, { "epoch": 0.67, "learning_rate": 1.3070001733865164e-06, "loss": 0.9317, "step": 35438 }, { "epoch": 0.67, "learning_rate": 1.3068659260634737e-06, "loss": 0.7053, "step": 35439 }, { "epoch": 0.67, "learning_rate": 1.3067316831955562e-06, "loss": 0.9309, "step": 35440 }, { "epoch": 0.67, "learning_rate": 1.3065974447832676e-06, "loss": 0.8622, "step": 35441 }, { "epoch": 0.67, "learning_rate": 1.306463210827107e-06, "loss": 0.6953, "step": 35442 }, { "epoch": 0.67, "learning_rate": 1.3063289813275759e-06, "loss": 0.9056, "step": 35443 }, { "epoch": 0.67, "learning_rate": 1.3061947562851756e-06, "loss": 0.7631, "step": 35444 }, { "epoch": 0.67, "learning_rate": 1.3060605357004081e-06, "loss": 1.0464, "step": 35445 }, { "epoch": 0.67, "learning_rate": 1.305926319573773e-06, "loss": 0.8334, "step": 35446 }, { "epoch": 0.67, "learning_rate": 1.3057921079057733e-06, "loss": 0.8791, "step": 35447 }, { "epoch": 0.67, "learning_rate": 1.30565790069691e-06, "loss": 0.8124, "step": 35448 }, { "epoch": 0.67, "learning_rate": 1.3055236979476816e-06, "loss": 0.8443, "step": 35449 }, { "epoch": 0.67, "learning_rate": 1.3053894996585924e-06, "loss": 1.1025, "step": 35450 }, { "epoch": 0.67, "learning_rate": 1.305255305830142e-06, "loss": 0.8414, "step": 35451 }, { "epoch": 0.67, "learning_rate": 1.3051211164628312e-06, "loss": 0.95, "step": 35452 }, { "epoch": 0.67, "learning_rate": 1.3049869315571617e-06, "loss": 0.8551, "step": 35453 }, { "epoch": 0.67, "learning_rate": 1.3048527511136344e-06, "loss": 0.8414, "step": 35454 }, { "epoch": 0.67, "learning_rate": 1.30471857513275e-06, "loss": 0.942, "step": 35455 }, { "epoch": 0.67, "learning_rate": 1.3045844036150101e-06, "loss": 1.0247, "step": 35456 }, { "epoch": 0.67, "learning_rate": 1.3044502365609163e-06, "loss": 0.8692, "step": 35457 }, { "epoch": 0.67, "learning_rate": 1.3043160739709667e-06, "loss": 0.9241, "step": 35458 }, { "epoch": 0.67, "learning_rate": 1.3041819158456661e-06, "loss": 0.6889, "step": 35459 }, { "epoch": 0.67, "learning_rate": 1.3040477621855127e-06, "loss": 0.938, "step": 35460 }, { "epoch": 0.67, "learning_rate": 1.3039136129910073e-06, "loss": 0.9089, "step": 35461 }, { "epoch": 0.67, "learning_rate": 1.3037794682626537e-06, "loss": 1.0834, "step": 35462 }, { "epoch": 0.67, "learning_rate": 1.3036453280009497e-06, "loss": 1.1074, "step": 35463 }, { "epoch": 0.67, "learning_rate": 1.3035111922063976e-06, "loss": 1.0067, "step": 35464 }, { "epoch": 0.67, "learning_rate": 1.303377060879498e-06, "loss": 0.8994, "step": 35465 }, { "epoch": 0.67, "learning_rate": 1.3032429340207516e-06, "loss": 0.8757, "step": 35466 }, { "epoch": 0.67, "learning_rate": 1.3031088116306596e-06, "loss": 0.7999, "step": 35467 }, { "epoch": 0.67, "learning_rate": 1.3029746937097226e-06, "loss": 0.9504, "step": 35468 }, { "epoch": 0.67, "learning_rate": 1.3028405802584423e-06, "loss": 0.9957, "step": 35469 }, { "epoch": 0.67, "learning_rate": 1.3027064712773166e-06, "loss": 0.7374, "step": 35470 }, { "epoch": 0.67, "learning_rate": 1.3025723667668502e-06, "loss": 0.8103, "step": 35471 }, { "epoch": 0.67, "learning_rate": 1.3024382667275409e-06, "loss": 0.9865, "step": 35472 }, { "epoch": 0.67, "learning_rate": 1.3023041711598906e-06, "loss": 0.835, "step": 35473 }, { "epoch": 0.67, "learning_rate": 1.3021700800643994e-06, "loss": 0.9331, "step": 35474 }, { "epoch": 0.67, "learning_rate": 1.3020359934415687e-06, "loss": 1.0721, "step": 35475 }, { "epoch": 0.67, "learning_rate": 1.3019019112918984e-06, "loss": 1.1801, "step": 35476 }, { "epoch": 0.67, "learning_rate": 1.30176783361589e-06, "loss": 0.8386, "step": 35477 }, { "epoch": 0.67, "learning_rate": 1.301633760414045e-06, "loss": 0.7922, "step": 35478 }, { "epoch": 0.67, "learning_rate": 1.3014996916868605e-06, "loss": 0.7505, "step": 35479 }, { "epoch": 0.67, "learning_rate": 1.3013656274348414e-06, "loss": 0.9586, "step": 35480 }, { "epoch": 0.67, "learning_rate": 1.3012315676584853e-06, "loss": 1.2667, "step": 35481 }, { "epoch": 0.67, "learning_rate": 1.301097512358293e-06, "loss": 0.9164, "step": 35482 }, { "epoch": 0.67, "learning_rate": 1.3009634615347677e-06, "loss": 0.9374, "step": 35483 }, { "epoch": 0.67, "learning_rate": 1.3008294151884068e-06, "loss": 0.9082, "step": 35484 }, { "epoch": 0.67, "learning_rate": 1.3006953733197125e-06, "loss": 0.887, "step": 35485 }, { "epoch": 0.67, "learning_rate": 1.3005613359291847e-06, "loss": 0.7728, "step": 35486 }, { "epoch": 0.67, "learning_rate": 1.3004273030173243e-06, "loss": 0.9747, "step": 35487 }, { "epoch": 0.67, "learning_rate": 1.300293274584631e-06, "loss": 0.9424, "step": 35488 }, { "epoch": 0.67, "learning_rate": 1.3001592506316063e-06, "loss": 0.7775, "step": 35489 }, { "epoch": 0.67, "learning_rate": 1.3000252311587511e-06, "loss": 0.8434, "step": 35490 }, { "epoch": 0.67, "learning_rate": 1.2998912161665628e-06, "loss": 0.9326, "step": 35491 }, { "epoch": 0.67, "learning_rate": 1.299757205655546e-06, "loss": 0.8439, "step": 35492 }, { "epoch": 0.67, "learning_rate": 1.2996231996261981e-06, "loss": 0.9215, "step": 35493 }, { "epoch": 0.67, "learning_rate": 1.2994891980790203e-06, "loss": 0.8266, "step": 35494 }, { "epoch": 0.67, "learning_rate": 1.2993552010145127e-06, "loss": 0.7768, "step": 35495 }, { "epoch": 0.67, "learning_rate": 1.2992212084331763e-06, "loss": 0.8446, "step": 35496 }, { "epoch": 0.67, "learning_rate": 1.2990872203355112e-06, "loss": 0.7562, "step": 35497 }, { "epoch": 0.67, "learning_rate": 1.2989532367220176e-06, "loss": 0.7333, "step": 35498 }, { "epoch": 0.67, "learning_rate": 1.2988192575931963e-06, "loss": 0.8516, "step": 35499 }, { "epoch": 0.67, "learning_rate": 1.2986852829495455e-06, "loss": 1.0697, "step": 35500 }, { "epoch": 0.67, "learning_rate": 1.298551312791569e-06, "loss": 0.994, "step": 35501 }, { "epoch": 0.67, "learning_rate": 1.2984173471197635e-06, "loss": 0.8967, "step": 35502 }, { "epoch": 0.67, "learning_rate": 1.2982833859346304e-06, "loss": 0.9365, "step": 35503 }, { "epoch": 0.67, "learning_rate": 1.2981494292366722e-06, "loss": 0.7143, "step": 35504 }, { "epoch": 0.67, "learning_rate": 1.2980154770263864e-06, "loss": 0.8196, "step": 35505 }, { "epoch": 0.67, "learning_rate": 1.2978815293042734e-06, "loss": 1.0043, "step": 35506 }, { "epoch": 0.67, "learning_rate": 1.2977475860708343e-06, "loss": 0.983, "step": 35507 }, { "epoch": 0.67, "learning_rate": 1.2976136473265688e-06, "loss": 0.8702, "step": 35508 }, { "epoch": 0.67, "learning_rate": 1.297479713071977e-06, "loss": 0.8296, "step": 35509 }, { "epoch": 0.67, "learning_rate": 1.2973457833075592e-06, "loss": 0.7284, "step": 35510 }, { "epoch": 0.67, "learning_rate": 1.2972118580338162e-06, "loss": 0.7487, "step": 35511 }, { "epoch": 0.67, "learning_rate": 1.2970779372512454e-06, "loss": 1.0265, "step": 35512 }, { "epoch": 0.67, "learning_rate": 1.2969440209603503e-06, "loss": 0.9164, "step": 35513 }, { "epoch": 0.67, "learning_rate": 1.2968101091616287e-06, "loss": 0.7362, "step": 35514 }, { "epoch": 0.67, "learning_rate": 1.2966762018555812e-06, "loss": 0.8594, "step": 35515 }, { "epoch": 0.67, "learning_rate": 1.2965422990427078e-06, "loss": 0.9917, "step": 35516 }, { "epoch": 0.67, "learning_rate": 1.2964084007235088e-06, "loss": 0.6548, "step": 35517 }, { "epoch": 0.67, "learning_rate": 1.2962745068984839e-06, "loss": 1.0373, "step": 35518 }, { "epoch": 0.67, "learning_rate": 1.296140617568133e-06, "loss": 1.1035, "step": 35519 }, { "epoch": 0.67, "learning_rate": 1.2960067327329567e-06, "loss": 0.8958, "step": 35520 }, { "epoch": 0.67, "learning_rate": 1.2958728523934527e-06, "loss": 0.8018, "step": 35521 }, { "epoch": 0.67, "learning_rate": 1.295738976550125e-06, "loss": 0.9526, "step": 35522 }, { "epoch": 0.67, "learning_rate": 1.2956051052034693e-06, "loss": 0.7908, "step": 35523 }, { "epoch": 0.67, "learning_rate": 1.2954712383539867e-06, "loss": 0.8942, "step": 35524 }, { "epoch": 0.67, "learning_rate": 1.2953373760021792e-06, "loss": 1.0899, "step": 35525 }, { "epoch": 0.67, "learning_rate": 1.2952035181485441e-06, "loss": 0.8764, "step": 35526 }, { "epoch": 0.67, "learning_rate": 1.2950696647935824e-06, "loss": 0.7421, "step": 35527 }, { "epoch": 0.67, "learning_rate": 1.2949358159377935e-06, "loss": 1.0629, "step": 35528 }, { "epoch": 0.67, "learning_rate": 1.294801971581677e-06, "loss": 0.8719, "step": 35529 }, { "epoch": 0.67, "learning_rate": 1.2946681317257332e-06, "loss": 0.924, "step": 35530 }, { "epoch": 0.67, "learning_rate": 1.2945342963704619e-06, "loss": 0.9142, "step": 35531 }, { "epoch": 0.67, "learning_rate": 1.2944004655163633e-06, "loss": 0.9962, "step": 35532 }, { "epoch": 0.67, "learning_rate": 1.2942666391639344e-06, "loss": 0.827, "step": 35533 }, { "epoch": 0.67, "learning_rate": 1.2941328173136791e-06, "loss": 0.8918, "step": 35534 }, { "epoch": 0.67, "learning_rate": 1.2939989999660935e-06, "loss": 0.8037, "step": 35535 }, { "epoch": 0.67, "learning_rate": 1.2938651871216789e-06, "loss": 1.048, "step": 35536 }, { "epoch": 0.67, "learning_rate": 1.2937313787809346e-06, "loss": 1.182, "step": 35537 }, { "epoch": 0.67, "learning_rate": 1.2935975749443607e-06, "loss": 1.0234, "step": 35538 }, { "epoch": 0.67, "learning_rate": 1.2934637756124563e-06, "loss": 0.7807, "step": 35539 }, { "epoch": 0.67, "learning_rate": 1.2933299807857208e-06, "loss": 0.8591, "step": 35540 }, { "epoch": 0.67, "learning_rate": 1.2931961904646557e-06, "loss": 0.7864, "step": 35541 }, { "epoch": 0.67, "learning_rate": 1.2930624046497564e-06, "loss": 0.8167, "step": 35542 }, { "epoch": 0.67, "learning_rate": 1.2929286233415278e-06, "loss": 0.9431, "step": 35543 }, { "epoch": 0.67, "learning_rate": 1.2927948465404651e-06, "loss": 1.0271, "step": 35544 }, { "epoch": 0.67, "learning_rate": 1.2926610742470689e-06, "loss": 0.8049, "step": 35545 }, { "epoch": 0.67, "learning_rate": 1.292527306461841e-06, "loss": 0.9203, "step": 35546 }, { "epoch": 0.67, "learning_rate": 1.292393543185278e-06, "loss": 1.0455, "step": 35547 }, { "epoch": 0.67, "learning_rate": 1.2922597844178804e-06, "loss": 0.8171, "step": 35548 }, { "epoch": 0.67, "learning_rate": 1.292126030160148e-06, "loss": 0.783, "step": 35549 }, { "epoch": 0.67, "learning_rate": 1.29199228041258e-06, "loss": 1.0844, "step": 35550 }, { "epoch": 0.67, "learning_rate": 1.2918585351756758e-06, "loss": 0.8335, "step": 35551 }, { "epoch": 0.67, "learning_rate": 1.2917247944499346e-06, "loss": 0.9508, "step": 35552 }, { "epoch": 0.67, "learning_rate": 1.291591058235857e-06, "loss": 1.0018, "step": 35553 }, { "epoch": 0.67, "learning_rate": 1.2914573265339395e-06, "loss": 0.7177, "step": 35554 }, { "epoch": 0.67, "learning_rate": 1.2913235993446852e-06, "loss": 0.8129, "step": 35555 }, { "epoch": 0.67, "learning_rate": 1.2911898766685904e-06, "loss": 1.1247, "step": 35556 }, { "epoch": 0.67, "learning_rate": 1.2910561585061558e-06, "loss": 0.9565, "step": 35557 }, { "epoch": 0.67, "learning_rate": 1.29092244485788e-06, "loss": 0.8966, "step": 35558 }, { "epoch": 0.67, "learning_rate": 1.2907887357242632e-06, "loss": 0.8885, "step": 35559 }, { "epoch": 0.67, "learning_rate": 1.2906550311058042e-06, "loss": 0.8254, "step": 35560 }, { "epoch": 0.67, "learning_rate": 1.2905213310030018e-06, "loss": 0.919, "step": 35561 }, { "epoch": 0.67, "learning_rate": 1.2903876354163568e-06, "loss": 0.9671, "step": 35562 }, { "epoch": 0.67, "learning_rate": 1.2902539443463655e-06, "loss": 0.9143, "step": 35563 }, { "epoch": 0.67, "learning_rate": 1.2901202577935306e-06, "loss": 1.0797, "step": 35564 }, { "epoch": 0.67, "learning_rate": 1.2899865757583489e-06, "loss": 0.8136, "step": 35565 }, { "epoch": 0.67, "learning_rate": 1.2898528982413188e-06, "loss": 1.1335, "step": 35566 }, { "epoch": 0.67, "learning_rate": 1.2897192252429431e-06, "loss": 0.9678, "step": 35567 }, { "epoch": 0.67, "learning_rate": 1.2895855567637177e-06, "loss": 1.107, "step": 35568 }, { "epoch": 0.67, "learning_rate": 1.2894518928041427e-06, "loss": 0.9447, "step": 35569 }, { "epoch": 0.67, "learning_rate": 1.2893182333647174e-06, "loss": 1.0533, "step": 35570 }, { "epoch": 0.67, "learning_rate": 1.2891845784459407e-06, "loss": 0.9644, "step": 35571 }, { "epoch": 0.67, "learning_rate": 1.2890509280483113e-06, "loss": 1.1429, "step": 35572 }, { "epoch": 0.67, "learning_rate": 1.288917282172329e-06, "loss": 0.8635, "step": 35573 }, { "epoch": 0.67, "learning_rate": 1.288783640818493e-06, "loss": 1.0917, "step": 35574 }, { "epoch": 0.67, "learning_rate": 1.2886500039873002e-06, "loss": 1.053, "step": 35575 }, { "epoch": 0.67, "learning_rate": 1.2885163716792529e-06, "loss": 0.9011, "step": 35576 }, { "epoch": 0.67, "learning_rate": 1.2883827438948471e-06, "loss": 0.8561, "step": 35577 }, { "epoch": 0.67, "learning_rate": 1.2882491206345834e-06, "loss": 0.9841, "step": 35578 }, { "epoch": 0.67, "learning_rate": 1.2881155018989603e-06, "loss": 0.7306, "step": 35579 }, { "epoch": 0.67, "learning_rate": 1.2879818876884765e-06, "loss": 0.9119, "step": 35580 }, { "epoch": 0.67, "learning_rate": 1.2878482780036314e-06, "loss": 1.1619, "step": 35581 }, { "epoch": 0.67, "learning_rate": 1.2877146728449237e-06, "loss": 0.7198, "step": 35582 }, { "epoch": 0.67, "learning_rate": 1.287581072212853e-06, "loss": 0.897, "step": 35583 }, { "epoch": 0.67, "learning_rate": 1.2874474761079154e-06, "loss": 0.795, "step": 35584 }, { "epoch": 0.67, "learning_rate": 1.2873138845306137e-06, "loss": 0.7035, "step": 35585 }, { "epoch": 0.67, "learning_rate": 1.287180297481444e-06, "loss": 0.9186, "step": 35586 }, { "epoch": 0.67, "learning_rate": 1.287046714960905e-06, "loss": 0.9637, "step": 35587 }, { "epoch": 0.67, "learning_rate": 1.2869131369694982e-06, "loss": 0.9397, "step": 35588 }, { "epoch": 0.67, "learning_rate": 1.2867795635077196e-06, "loss": 0.9565, "step": 35589 }, { "epoch": 0.67, "learning_rate": 1.2866459945760687e-06, "loss": 1.0841, "step": 35590 }, { "epoch": 0.67, "learning_rate": 1.2865124301750447e-06, "loss": 0.8175, "step": 35591 }, { "epoch": 0.67, "learning_rate": 1.286378870305146e-06, "loss": 1.028, "step": 35592 }, { "epoch": 0.67, "learning_rate": 1.2862453149668713e-06, "loss": 0.8898, "step": 35593 }, { "epoch": 0.67, "learning_rate": 1.2861117641607196e-06, "loss": 1.1309, "step": 35594 }, { "epoch": 0.67, "learning_rate": 1.2859782178871898e-06, "loss": 0.83, "step": 35595 }, { "epoch": 0.67, "learning_rate": 1.2858446761467797e-06, "loss": 0.9055, "step": 35596 }, { "epoch": 0.67, "learning_rate": 1.2857111389399884e-06, "loss": 0.9617, "step": 35597 }, { "epoch": 0.67, "learning_rate": 1.2855776062673142e-06, "loss": 0.9662, "step": 35598 }, { "epoch": 0.67, "learning_rate": 1.285444078129256e-06, "loss": 1.007, "step": 35599 }, { "epoch": 0.67, "learning_rate": 1.2853105545263123e-06, "loss": 1.2623, "step": 35600 }, { "epoch": 0.67, "learning_rate": 1.2851770354589822e-06, "loss": 1.1571, "step": 35601 }, { "epoch": 0.67, "learning_rate": 1.2850435209277642e-06, "loss": 0.8508, "step": 35602 }, { "epoch": 0.67, "learning_rate": 1.2849100109331547e-06, "loss": 1.012, "step": 35603 }, { "epoch": 0.67, "learning_rate": 1.2847765054756562e-06, "loss": 0.8307, "step": 35604 }, { "epoch": 0.67, "learning_rate": 1.2846430045557634e-06, "loss": 0.9216, "step": 35605 }, { "epoch": 0.67, "learning_rate": 1.2845095081739767e-06, "loss": 1.0923, "step": 35606 }, { "epoch": 0.67, "learning_rate": 1.2843760163307945e-06, "loss": 0.8663, "step": 35607 }, { "epoch": 0.67, "learning_rate": 1.2842425290267147e-06, "loss": 0.9813, "step": 35608 }, { "epoch": 0.67, "learning_rate": 1.2841090462622358e-06, "loss": 1.0317, "step": 35609 }, { "epoch": 0.67, "learning_rate": 1.2839755680378569e-06, "loss": 0.9785, "step": 35610 }, { "epoch": 0.67, "learning_rate": 1.2838420943540764e-06, "loss": 1.0659, "step": 35611 }, { "epoch": 0.67, "learning_rate": 1.2837086252113906e-06, "loss": 1.181, "step": 35612 }, { "epoch": 0.67, "learning_rate": 1.2835751606103006e-06, "loss": 1.109, "step": 35613 }, { "epoch": 0.67, "learning_rate": 1.2834417005513045e-06, "loss": 0.937, "step": 35614 }, { "epoch": 0.67, "learning_rate": 1.2833082450348978e-06, "loss": 1.0516, "step": 35615 }, { "epoch": 0.67, "learning_rate": 1.2831747940615828e-06, "loss": 0.7966, "step": 35616 }, { "epoch": 0.67, "learning_rate": 1.2830413476318548e-06, "loss": 0.7579, "step": 35617 }, { "epoch": 0.67, "learning_rate": 1.282907905746213e-06, "loss": 0.9999, "step": 35618 }, { "epoch": 0.67, "learning_rate": 1.2827744684051557e-06, "loss": 0.9277, "step": 35619 }, { "epoch": 0.67, "learning_rate": 1.2826410356091818e-06, "loss": 1.0864, "step": 35620 }, { "epoch": 0.67, "learning_rate": 1.2825076073587883e-06, "loss": 0.8058, "step": 35621 }, { "epoch": 0.67, "learning_rate": 1.2823741836544742e-06, "loss": 0.8481, "step": 35622 }, { "epoch": 0.67, "learning_rate": 1.282240764496739e-06, "loss": 0.6339, "step": 35623 }, { "epoch": 0.67, "learning_rate": 1.282107349886077e-06, "loss": 0.921, "step": 35624 }, { "epoch": 0.67, "learning_rate": 1.2819739398229907e-06, "loss": 0.7851, "step": 35625 }, { "epoch": 0.67, "learning_rate": 1.2818405343079757e-06, "loss": 0.8545, "step": 35626 }, { "epoch": 0.67, "learning_rate": 1.2817071333415303e-06, "loss": 0.9393, "step": 35627 }, { "epoch": 0.67, "learning_rate": 1.2815737369241538e-06, "loss": 0.944, "step": 35628 }, { "epoch": 0.67, "learning_rate": 1.2814403450563434e-06, "loss": 1.0327, "step": 35629 }, { "epoch": 0.67, "learning_rate": 1.2813069577385973e-06, "loss": 1.0209, "step": 35630 }, { "epoch": 0.67, "learning_rate": 1.2811735749714136e-06, "loss": 1.0045, "step": 35631 }, { "epoch": 0.67, "learning_rate": 1.2810401967552912e-06, "loss": 0.9475, "step": 35632 }, { "epoch": 0.67, "learning_rate": 1.2809068230907257e-06, "loss": 0.9479, "step": 35633 }, { "epoch": 0.67, "learning_rate": 1.2807734539782176e-06, "loss": 0.7872, "step": 35634 }, { "epoch": 0.67, "learning_rate": 1.2806400894182652e-06, "loss": 0.8892, "step": 35635 }, { "epoch": 0.67, "learning_rate": 1.2805067294113633e-06, "loss": 0.7912, "step": 35636 }, { "epoch": 0.67, "learning_rate": 1.2803733739580135e-06, "loss": 1.2247, "step": 35637 }, { "epoch": 0.67, "learning_rate": 1.2802400230587115e-06, "loss": 0.8634, "step": 35638 }, { "epoch": 0.67, "learning_rate": 1.2801066767139555e-06, "loss": 0.9871, "step": 35639 }, { "epoch": 0.67, "learning_rate": 1.279973334924244e-06, "loss": 1.0422, "step": 35640 }, { "epoch": 0.67, "learning_rate": 1.279839997690075e-06, "loss": 0.7534, "step": 35641 }, { "epoch": 0.67, "learning_rate": 1.2797066650119454e-06, "loss": 0.9194, "step": 35642 }, { "epoch": 0.67, "learning_rate": 1.279573336890354e-06, "loss": 1.0057, "step": 35643 }, { "epoch": 0.67, "learning_rate": 1.2794400133257995e-06, "loss": 1.0789, "step": 35644 }, { "epoch": 0.67, "learning_rate": 1.2793066943187765e-06, "loss": 0.6276, "step": 35645 }, { "epoch": 0.67, "learning_rate": 1.2791733798697866e-06, "loss": 1.1095, "step": 35646 }, { "epoch": 0.67, "learning_rate": 1.279040069979325e-06, "loss": 0.8474, "step": 35647 }, { "epoch": 0.67, "learning_rate": 1.2789067646478903e-06, "loss": 0.723, "step": 35648 }, { "epoch": 0.67, "learning_rate": 1.2787734638759809e-06, "loss": 1.0218, "step": 35649 }, { "epoch": 0.67, "learning_rate": 1.2786401676640931e-06, "loss": 1.1671, "step": 35650 }, { "epoch": 0.67, "learning_rate": 1.278506876012726e-06, "loss": 0.7873, "step": 35651 }, { "epoch": 0.67, "learning_rate": 1.2783735889223763e-06, "loss": 0.8176, "step": 35652 }, { "epoch": 0.67, "learning_rate": 1.2782403063935434e-06, "loss": 0.8132, "step": 35653 }, { "epoch": 0.67, "learning_rate": 1.2781070284267218e-06, "loss": 0.6398, "step": 35654 }, { "epoch": 0.67, "learning_rate": 1.2779737550224121e-06, "loss": 0.9302, "step": 35655 }, { "epoch": 0.67, "learning_rate": 1.277840486181112e-06, "loss": 1.0888, "step": 35656 }, { "epoch": 0.67, "learning_rate": 1.277707221903316e-06, "loss": 0.7956, "step": 35657 }, { "epoch": 0.67, "learning_rate": 1.2775739621895256e-06, "loss": 0.8162, "step": 35658 }, { "epoch": 0.67, "learning_rate": 1.2774407070402356e-06, "loss": 0.7648, "step": 35659 }, { "epoch": 0.67, "learning_rate": 1.2773074564559445e-06, "loss": 0.6353, "step": 35660 }, { "epoch": 0.67, "learning_rate": 1.2771742104371502e-06, "loss": 0.8752, "step": 35661 }, { "epoch": 0.67, "learning_rate": 1.2770409689843497e-06, "loss": 1.1421, "step": 35662 }, { "epoch": 0.67, "learning_rate": 1.2769077320980406e-06, "loss": 0.8148, "step": 35663 }, { "epoch": 0.67, "learning_rate": 1.2767744997787207e-06, "loss": 0.8517, "step": 35664 }, { "epoch": 0.67, "learning_rate": 1.276641272026888e-06, "loss": 0.7809, "step": 35665 }, { "epoch": 0.67, "learning_rate": 1.2765080488430377e-06, "loss": 0.784, "step": 35666 }, { "epoch": 0.67, "learning_rate": 1.2763748302276705e-06, "loss": 0.7833, "step": 35667 }, { "epoch": 0.67, "learning_rate": 1.2762416161812813e-06, "loss": 0.9183, "step": 35668 }, { "epoch": 0.67, "learning_rate": 1.2761084067043684e-06, "loss": 1.056, "step": 35669 }, { "epoch": 0.67, "learning_rate": 1.275975201797429e-06, "loss": 0.8799, "step": 35670 }, { "epoch": 0.67, "learning_rate": 1.275842001460961e-06, "loss": 0.7934, "step": 35671 }, { "epoch": 0.67, "learning_rate": 1.275708805695461e-06, "loss": 0.7804, "step": 35672 }, { "epoch": 0.67, "learning_rate": 1.2755756145014272e-06, "loss": 0.7803, "step": 35673 }, { "epoch": 0.67, "learning_rate": 1.2754424278793576e-06, "loss": 0.7533, "step": 35674 }, { "epoch": 0.67, "learning_rate": 1.2753092458297461e-06, "loss": 1.2011, "step": 35675 }, { "epoch": 0.67, "learning_rate": 1.2751760683530934e-06, "loss": 0.9405, "step": 35676 }, { "epoch": 0.67, "learning_rate": 1.2750428954498966e-06, "loss": 0.8772, "step": 35677 }, { "epoch": 0.67, "learning_rate": 1.27490972712065e-06, "loss": 0.9655, "step": 35678 }, { "epoch": 0.67, "learning_rate": 1.2747765633658554e-06, "loss": 0.7523, "step": 35679 }, { "epoch": 0.67, "learning_rate": 1.2746434041860063e-06, "loss": 0.9495, "step": 35680 }, { "epoch": 0.67, "learning_rate": 1.2745102495816008e-06, "loss": 1.0267, "step": 35681 }, { "epoch": 0.67, "learning_rate": 1.2743770995531367e-06, "loss": 1.0213, "step": 35682 }, { "epoch": 0.67, "learning_rate": 1.2742439541011112e-06, "loss": 0.8271, "step": 35683 }, { "epoch": 0.67, "learning_rate": 1.274110813226021e-06, "loss": 0.9267, "step": 35684 }, { "epoch": 0.67, "learning_rate": 1.2739776769283635e-06, "loss": 0.8142, "step": 35685 }, { "epoch": 0.67, "learning_rate": 1.2738445452086368e-06, "loss": 0.8322, "step": 35686 }, { "epoch": 0.67, "learning_rate": 1.273711418067335e-06, "loss": 1.0636, "step": 35687 }, { "epoch": 0.67, "learning_rate": 1.2735782955049586e-06, "loss": 1.0956, "step": 35688 }, { "epoch": 0.67, "learning_rate": 1.2734451775220027e-06, "loss": 0.9514, "step": 35689 }, { "epoch": 0.67, "learning_rate": 1.273312064118965e-06, "loss": 0.7188, "step": 35690 }, { "epoch": 0.67, "learning_rate": 1.2731789552963422e-06, "loss": 0.9181, "step": 35691 }, { "epoch": 0.67, "learning_rate": 1.2730458510546318e-06, "loss": 0.9129, "step": 35692 }, { "epoch": 0.67, "learning_rate": 1.2729127513943304e-06, "loss": 0.7735, "step": 35693 }, { "epoch": 0.67, "learning_rate": 1.272779656315935e-06, "loss": 1.0416, "step": 35694 }, { "epoch": 0.67, "learning_rate": 1.2726465658199441e-06, "loss": 0.8312, "step": 35695 }, { "epoch": 0.67, "learning_rate": 1.2725134799068512e-06, "loss": 0.865, "step": 35696 }, { "epoch": 0.67, "learning_rate": 1.2723803985771563e-06, "loss": 0.791, "step": 35697 }, { "epoch": 0.67, "learning_rate": 1.2722473218313564e-06, "loss": 0.7518, "step": 35698 }, { "epoch": 0.67, "learning_rate": 1.272114249669945e-06, "loss": 0.9332, "step": 35699 }, { "epoch": 0.67, "learning_rate": 1.2719811820934235e-06, "loss": 1.2783, "step": 35700 }, { "epoch": 0.67, "learning_rate": 1.271848119102286e-06, "loss": 0.9801, "step": 35701 }, { "epoch": 0.67, "learning_rate": 1.2717150606970296e-06, "loss": 0.7806, "step": 35702 }, { "epoch": 0.67, "learning_rate": 1.2715820068781519e-06, "loss": 0.9473, "step": 35703 }, { "epoch": 0.67, "learning_rate": 1.271448957646149e-06, "loss": 0.785, "step": 35704 }, { "epoch": 0.67, "learning_rate": 1.271315913001518e-06, "loss": 0.7315, "step": 35705 }, { "epoch": 0.67, "learning_rate": 1.2711828729447557e-06, "loss": 1.1921, "step": 35706 }, { "epoch": 0.67, "learning_rate": 1.27104983747636e-06, "loss": 0.9756, "step": 35707 }, { "epoch": 0.67, "learning_rate": 1.2709168065968245e-06, "loss": 0.9727, "step": 35708 }, { "epoch": 0.67, "learning_rate": 1.2707837803066496e-06, "loss": 0.8448, "step": 35709 }, { "epoch": 0.67, "learning_rate": 1.27065075860633e-06, "loss": 0.7747, "step": 35710 }, { "epoch": 0.67, "learning_rate": 1.2705177414963624e-06, "loss": 0.8676, "step": 35711 }, { "epoch": 0.67, "learning_rate": 1.270384728977244e-06, "loss": 0.924, "step": 35712 }, { "epoch": 0.67, "learning_rate": 1.2702517210494714e-06, "loss": 0.9971, "step": 35713 }, { "epoch": 0.67, "learning_rate": 1.270118717713541e-06, "loss": 0.9682, "step": 35714 }, { "epoch": 0.67, "learning_rate": 1.2699857189699495e-06, "loss": 0.9161, "step": 35715 }, { "epoch": 0.67, "learning_rate": 1.2698527248191947e-06, "loss": 0.9464, "step": 35716 }, { "epoch": 0.67, "learning_rate": 1.2697197352617702e-06, "loss": 0.9648, "step": 35717 }, { "epoch": 0.67, "learning_rate": 1.2695867502981754e-06, "loss": 1.0632, "step": 35718 }, { "epoch": 0.67, "learning_rate": 1.269453769928907e-06, "loss": 0.8077, "step": 35719 }, { "epoch": 0.67, "learning_rate": 1.2693207941544583e-06, "loss": 0.9286, "step": 35720 }, { "epoch": 0.67, "learning_rate": 1.2691878229753302e-06, "loss": 0.7566, "step": 35721 }, { "epoch": 0.67, "learning_rate": 1.269054856392016e-06, "loss": 0.7029, "step": 35722 }, { "epoch": 0.67, "learning_rate": 1.2689218944050133e-06, "loss": 0.9126, "step": 35723 }, { "epoch": 0.67, "learning_rate": 1.2687889370148184e-06, "loss": 0.9281, "step": 35724 }, { "epoch": 0.67, "learning_rate": 1.2686559842219282e-06, "loss": 1.1448, "step": 35725 }, { "epoch": 0.67, "learning_rate": 1.2685230360268384e-06, "loss": 0.7976, "step": 35726 }, { "epoch": 0.67, "learning_rate": 1.2683900924300457e-06, "loss": 0.7931, "step": 35727 }, { "epoch": 0.67, "learning_rate": 1.268257153432048e-06, "loss": 1.0112, "step": 35728 }, { "epoch": 0.67, "learning_rate": 1.2681242190333382e-06, "loss": 0.9517, "step": 35729 }, { "epoch": 0.67, "learning_rate": 1.2679912892344168e-06, "loss": 0.8276, "step": 35730 }, { "epoch": 0.67, "learning_rate": 1.2678583640357773e-06, "loss": 1.0821, "step": 35731 }, { "epoch": 0.67, "learning_rate": 1.2677254434379167e-06, "loss": 0.8219, "step": 35732 }, { "epoch": 0.67, "learning_rate": 1.2675925274413315e-06, "loss": 0.8964, "step": 35733 }, { "epoch": 0.67, "learning_rate": 1.267459616046518e-06, "loss": 0.9817, "step": 35734 }, { "epoch": 0.67, "learning_rate": 1.2673267092539726e-06, "loss": 0.8167, "step": 35735 }, { "epoch": 0.67, "learning_rate": 1.2671938070641915e-06, "loss": 1.1122, "step": 35736 }, { "epoch": 0.67, "learning_rate": 1.2670609094776718e-06, "loss": 1.1086, "step": 35737 }, { "epoch": 0.67, "learning_rate": 1.2669280164949068e-06, "loss": 0.9601, "step": 35738 }, { "epoch": 0.67, "learning_rate": 1.2667951281163959e-06, "loss": 0.8205, "step": 35739 }, { "epoch": 0.67, "learning_rate": 1.2666622443426351e-06, "loss": 0.8602, "step": 35740 }, { "epoch": 0.67, "learning_rate": 1.2665293651741178e-06, "loss": 0.7513, "step": 35741 }, { "epoch": 0.67, "learning_rate": 1.2663964906113442e-06, "loss": 0.8142, "step": 35742 }, { "epoch": 0.67, "learning_rate": 1.2662636206548069e-06, "loss": 1.0735, "step": 35743 }, { "epoch": 0.67, "learning_rate": 1.2661307553050033e-06, "loss": 1.0685, "step": 35744 }, { "epoch": 0.67, "learning_rate": 1.2659978945624301e-06, "loss": 0.8781, "step": 35745 }, { "epoch": 0.67, "learning_rate": 1.2658650384275827e-06, "loss": 0.9857, "step": 35746 }, { "epoch": 0.67, "learning_rate": 1.2657321869009575e-06, "loss": 0.9368, "step": 35747 }, { "epoch": 0.67, "learning_rate": 1.2655993399830504e-06, "loss": 0.8827, "step": 35748 }, { "epoch": 0.67, "learning_rate": 1.2654664976743586e-06, "loss": 0.9123, "step": 35749 }, { "epoch": 0.67, "learning_rate": 1.2653336599753752e-06, "loss": 1.2357, "step": 35750 }, { "epoch": 0.67, "learning_rate": 1.2652008268865996e-06, "loss": 0.7647, "step": 35751 }, { "epoch": 0.67, "learning_rate": 1.2650679984085254e-06, "loss": 0.8184, "step": 35752 }, { "epoch": 0.67, "learning_rate": 1.2649351745416495e-06, "loss": 0.9471, "step": 35753 }, { "epoch": 0.67, "learning_rate": 1.264802355286468e-06, "loss": 0.8303, "step": 35754 }, { "epoch": 0.67, "learning_rate": 1.264669540643476e-06, "loss": 0.8874, "step": 35755 }, { "epoch": 0.67, "learning_rate": 1.2645367306131707e-06, "loss": 1.2309, "step": 35756 }, { "epoch": 0.67, "learning_rate": 1.2644039251960471e-06, "loss": 0.9707, "step": 35757 }, { "epoch": 0.67, "learning_rate": 1.2642711243926025e-06, "loss": 0.7504, "step": 35758 }, { "epoch": 0.67, "learning_rate": 1.2641383282033298e-06, "loss": 0.7419, "step": 35759 }, { "epoch": 0.67, "learning_rate": 1.2640055366287274e-06, "loss": 0.8414, "step": 35760 }, { "epoch": 0.67, "learning_rate": 1.2638727496692912e-06, "loss": 0.9941, "step": 35761 }, { "epoch": 0.67, "learning_rate": 1.2637399673255147e-06, "loss": 1.0607, "step": 35762 }, { "epoch": 0.67, "learning_rate": 1.2636071895978968e-06, "loss": 0.9635, "step": 35763 }, { "epoch": 0.67, "learning_rate": 1.263474416486931e-06, "loss": 0.9135, "step": 35764 }, { "epoch": 0.67, "learning_rate": 1.263341647993114e-06, "loss": 1.0443, "step": 35765 }, { "epoch": 0.67, "learning_rate": 1.2632088841169412e-06, "loss": 0.8062, "step": 35766 }, { "epoch": 0.67, "learning_rate": 1.2630761248589086e-06, "loss": 0.8237, "step": 35767 }, { "epoch": 0.67, "learning_rate": 1.2629433702195118e-06, "loss": 0.9172, "step": 35768 }, { "epoch": 0.67, "learning_rate": 1.2628106201992463e-06, "loss": 1.2107, "step": 35769 }, { "epoch": 0.67, "learning_rate": 1.2626778747986093e-06, "loss": 0.888, "step": 35770 }, { "epoch": 0.67, "learning_rate": 1.262545134018093e-06, "loss": 0.9086, "step": 35771 }, { "epoch": 0.67, "learning_rate": 1.2624123978581972e-06, "loss": 0.7315, "step": 35772 }, { "epoch": 0.67, "learning_rate": 1.2622796663194148e-06, "loss": 0.6893, "step": 35773 }, { "epoch": 0.67, "learning_rate": 1.262146939402242e-06, "loss": 1.0971, "step": 35774 }, { "epoch": 0.67, "learning_rate": 1.2620142171071748e-06, "loss": 1.05, "step": 35775 }, { "epoch": 0.67, "learning_rate": 1.2618814994347084e-06, "loss": 0.7294, "step": 35776 }, { "epoch": 0.67, "learning_rate": 1.2617487863853384e-06, "loss": 0.7541, "step": 35777 }, { "epoch": 0.68, "learning_rate": 1.2616160779595603e-06, "loss": 1.1443, "step": 35778 }, { "epoch": 0.68, "learning_rate": 1.261483374157871e-06, "loss": 0.8109, "step": 35779 }, { "epoch": 0.68, "learning_rate": 1.261350674980763e-06, "loss": 1.0264, "step": 35780 }, { "epoch": 0.68, "learning_rate": 1.2612179804287345e-06, "loss": 1.1371, "step": 35781 }, { "epoch": 0.68, "learning_rate": 1.2610852905022809e-06, "loss": 0.6988, "step": 35782 }, { "epoch": 0.68, "learning_rate": 1.260952605201895e-06, "loss": 0.7477, "step": 35783 }, { "epoch": 0.68, "learning_rate": 1.260819924528076e-06, "loss": 0.8544, "step": 35784 }, { "epoch": 0.68, "learning_rate": 1.2606872484813165e-06, "loss": 0.834, "step": 35785 }, { "epoch": 0.68, "learning_rate": 1.2605545770621128e-06, "loss": 0.8609, "step": 35786 }, { "epoch": 0.68, "learning_rate": 1.2604219102709602e-06, "loss": 0.8366, "step": 35787 }, { "epoch": 0.68, "learning_rate": 1.2602892481083546e-06, "loss": 1.1076, "step": 35788 }, { "epoch": 0.68, "learning_rate": 1.2601565905747903e-06, "loss": 0.9285, "step": 35789 }, { "epoch": 0.68, "learning_rate": 1.2600239376707634e-06, "loss": 0.8283, "step": 35790 }, { "epoch": 0.68, "learning_rate": 1.2598912893967704e-06, "loss": 0.8405, "step": 35791 }, { "epoch": 0.68, "learning_rate": 1.2597586457533035e-06, "loss": 0.9588, "step": 35792 }, { "epoch": 0.68, "learning_rate": 1.259626006740861e-06, "loss": 1.1732, "step": 35793 }, { "epoch": 0.68, "learning_rate": 1.2594933723599368e-06, "loss": 1.0929, "step": 35794 }, { "epoch": 0.68, "learning_rate": 1.2593607426110257e-06, "loss": 0.8444, "step": 35795 }, { "epoch": 0.68, "learning_rate": 1.2592281174946238e-06, "loss": 0.6883, "step": 35796 }, { "epoch": 0.68, "learning_rate": 1.2590954970112262e-06, "loss": 0.8458, "step": 35797 }, { "epoch": 0.68, "learning_rate": 1.2589628811613277e-06, "loss": 0.8855, "step": 35798 }, { "epoch": 0.68, "learning_rate": 1.2588302699454238e-06, "loss": 1.0536, "step": 35799 }, { "epoch": 0.68, "learning_rate": 1.2586976633640107e-06, "loss": 1.0613, "step": 35800 }, { "epoch": 0.68, "learning_rate": 1.2585650614175804e-06, "loss": 0.967, "step": 35801 }, { "epoch": 0.68, "learning_rate": 1.2584324641066314e-06, "loss": 0.8593, "step": 35802 }, { "epoch": 0.68, "learning_rate": 1.258299871431658e-06, "loss": 0.7158, "step": 35803 }, { "epoch": 0.68, "learning_rate": 1.2581672833931532e-06, "loss": 0.6762, "step": 35804 }, { "epoch": 0.68, "learning_rate": 1.2580346999916154e-06, "loss": 0.9029, "step": 35805 }, { "epoch": 0.68, "learning_rate": 1.2579021212275372e-06, "loss": 1.0873, "step": 35806 }, { "epoch": 0.68, "learning_rate": 1.2577695471014144e-06, "loss": 0.7144, "step": 35807 }, { "epoch": 0.68, "learning_rate": 1.257636977613742e-06, "loss": 0.9101, "step": 35808 }, { "epoch": 0.68, "learning_rate": 1.257504412765015e-06, "loss": 1.0487, "step": 35809 }, { "epoch": 0.68, "learning_rate": 1.2573718525557283e-06, "loss": 0.8154, "step": 35810 }, { "epoch": 0.68, "learning_rate": 1.2572392969863773e-06, "loss": 0.9454, "step": 35811 }, { "epoch": 0.68, "learning_rate": 1.2571067460574571e-06, "loss": 1.2524, "step": 35812 }, { "epoch": 0.68, "learning_rate": 1.2569741997694607e-06, "loss": 1.0099, "step": 35813 }, { "epoch": 0.68, "learning_rate": 1.2568416581228866e-06, "loss": 0.9199, "step": 35814 }, { "epoch": 0.68, "learning_rate": 1.256709121118226e-06, "loss": 0.9716, "step": 35815 }, { "epoch": 0.68, "learning_rate": 1.256576588755976e-06, "loss": 0.9106, "step": 35816 }, { "epoch": 0.68, "learning_rate": 1.2564440610366308e-06, "loss": 0.8669, "step": 35817 }, { "epoch": 0.68, "learning_rate": 1.2563115379606853e-06, "loss": 0.7653, "step": 35818 }, { "epoch": 0.68, "learning_rate": 1.2561790195286345e-06, "loss": 1.1223, "step": 35819 }, { "epoch": 0.68, "learning_rate": 1.2560465057409727e-06, "loss": 0.9823, "step": 35820 }, { "epoch": 0.68, "learning_rate": 1.2559139965981965e-06, "loss": 0.9134, "step": 35821 }, { "epoch": 0.68, "learning_rate": 1.2557814921007972e-06, "loss": 0.7927, "step": 35822 }, { "epoch": 0.68, "learning_rate": 1.2556489922492726e-06, "loss": 0.8127, "step": 35823 }, { "epoch": 0.68, "learning_rate": 1.2555164970441174e-06, "loss": 0.7478, "step": 35824 }, { "epoch": 0.68, "learning_rate": 1.2553840064858237e-06, "loss": 1.0578, "step": 35825 }, { "epoch": 0.68, "learning_rate": 1.2552515205748897e-06, "loss": 0.7411, "step": 35826 }, { "epoch": 0.68, "learning_rate": 1.2551190393118074e-06, "loss": 0.8972, "step": 35827 }, { "epoch": 0.68, "learning_rate": 1.2549865626970726e-06, "loss": 0.8482, "step": 35828 }, { "epoch": 0.68, "learning_rate": 1.2548540907311795e-06, "loss": 0.7113, "step": 35829 }, { "epoch": 0.68, "learning_rate": 1.2547216234146237e-06, "loss": 0.7944, "step": 35830 }, { "epoch": 0.68, "learning_rate": 1.2545891607478997e-06, "loss": 1.053, "step": 35831 }, { "epoch": 0.68, "learning_rate": 1.2544567027314996e-06, "loss": 0.8169, "step": 35832 }, { "epoch": 0.68, "learning_rate": 1.2543242493659218e-06, "loss": 1.0486, "step": 35833 }, { "epoch": 0.68, "learning_rate": 1.2541918006516586e-06, "loss": 0.8601, "step": 35834 }, { "epoch": 0.68, "learning_rate": 1.2540593565892045e-06, "loss": 0.9219, "step": 35835 }, { "epoch": 0.68, "learning_rate": 1.2539269171790546e-06, "loss": 0.782, "step": 35836 }, { "epoch": 0.68, "learning_rate": 1.2537944824217039e-06, "loss": 1.0946, "step": 35837 }, { "epoch": 0.68, "learning_rate": 1.253662052317646e-06, "loss": 0.7881, "step": 35838 }, { "epoch": 0.68, "learning_rate": 1.2535296268673758e-06, "loss": 0.8756, "step": 35839 }, { "epoch": 0.68, "learning_rate": 1.253397206071389e-06, "loss": 0.9108, "step": 35840 }, { "epoch": 0.68, "learning_rate": 1.2532647899301764e-06, "loss": 0.9055, "step": 35841 }, { "epoch": 0.68, "learning_rate": 1.253132378444237e-06, "loss": 0.69, "step": 35842 }, { "epoch": 0.68, "learning_rate": 1.2529999716140624e-06, "loss": 1.1146, "step": 35843 }, { "epoch": 0.68, "learning_rate": 1.2528675694401462e-06, "loss": 1.1284, "step": 35844 }, { "epoch": 0.68, "learning_rate": 1.2527351719229863e-06, "loss": 0.9868, "step": 35845 }, { "epoch": 0.68, "learning_rate": 1.2526027790630744e-06, "loss": 0.7892, "step": 35846 }, { "epoch": 0.68, "learning_rate": 1.252470390860905e-06, "loss": 0.9306, "step": 35847 }, { "epoch": 0.68, "learning_rate": 1.2523380073169733e-06, "loss": 0.9083, "step": 35848 }, { "epoch": 0.68, "learning_rate": 1.2522056284317729e-06, "loss": 1.0934, "step": 35849 }, { "epoch": 0.68, "learning_rate": 1.252073254205799e-06, "loss": 0.9951, "step": 35850 }, { "epoch": 0.68, "learning_rate": 1.2519408846395447e-06, "loss": 1.042, "step": 35851 }, { "epoch": 0.68, "learning_rate": 1.251808519733506e-06, "loss": 0.8727, "step": 35852 }, { "epoch": 0.68, "learning_rate": 1.2516761594881743e-06, "loss": 1.0334, "step": 35853 }, { "epoch": 0.68, "learning_rate": 1.2515438039040473e-06, "loss": 0.8715, "step": 35854 }, { "epoch": 0.68, "learning_rate": 1.2514114529816166e-06, "loss": 1.0678, "step": 35855 }, { "epoch": 0.68, "learning_rate": 1.2512791067213769e-06, "loss": 1.0222, "step": 35856 }, { "epoch": 0.68, "learning_rate": 1.2511467651238232e-06, "loss": 1.0027, "step": 35857 }, { "epoch": 0.68, "learning_rate": 1.2510144281894487e-06, "loss": 0.8581, "step": 35858 }, { "epoch": 0.68, "learning_rate": 1.2508820959187484e-06, "loss": 0.7851, "step": 35859 }, { "epoch": 0.68, "learning_rate": 1.250749768312216e-06, "loss": 0.8467, "step": 35860 }, { "epoch": 0.68, "learning_rate": 1.2506174453703467e-06, "loss": 0.8758, "step": 35861 }, { "epoch": 0.68, "learning_rate": 1.2504851270936313e-06, "loss": 0.9611, "step": 35862 }, { "epoch": 0.68, "learning_rate": 1.2503528134825684e-06, "loss": 1.0833, "step": 35863 }, { "epoch": 0.68, "learning_rate": 1.2502205045376486e-06, "loss": 0.9456, "step": 35864 }, { "epoch": 0.68, "learning_rate": 1.2500882002593664e-06, "loss": 0.8287, "step": 35865 }, { "epoch": 0.68, "learning_rate": 1.2499559006482184e-06, "loss": 0.9074, "step": 35866 }, { "epoch": 0.68, "learning_rate": 1.2498236057046955e-06, "loss": 1.049, "step": 35867 }, { "epoch": 0.68, "learning_rate": 1.2496913154292933e-06, "loss": 0.8913, "step": 35868 }, { "epoch": 0.68, "learning_rate": 1.2495590298225052e-06, "loss": 1.0478, "step": 35869 }, { "epoch": 0.68, "learning_rate": 1.2494267488848253e-06, "loss": 0.8844, "step": 35870 }, { "epoch": 0.68, "learning_rate": 1.2492944726167475e-06, "loss": 0.8314, "step": 35871 }, { "epoch": 0.68, "learning_rate": 1.249162201018766e-06, "loss": 0.8004, "step": 35872 }, { "epoch": 0.68, "learning_rate": 1.2490299340913754e-06, "loss": 0.8157, "step": 35873 }, { "epoch": 0.68, "learning_rate": 1.2488976718350668e-06, "loss": 0.8322, "step": 35874 }, { "epoch": 0.68, "learning_rate": 1.2487654142503377e-06, "loss": 1.2097, "step": 35875 }, { "epoch": 0.68, "learning_rate": 1.2486331613376793e-06, "loss": 0.8946, "step": 35876 }, { "epoch": 0.68, "learning_rate": 1.248500913097586e-06, "loss": 0.9575, "step": 35877 }, { "epoch": 0.68, "learning_rate": 1.2483686695305524e-06, "loss": 0.7914, "step": 35878 }, { "epoch": 0.68, "learning_rate": 1.2482364306370717e-06, "loss": 0.8038, "step": 35879 }, { "epoch": 0.68, "learning_rate": 1.2481041964176378e-06, "loss": 0.7884, "step": 35880 }, { "epoch": 0.68, "learning_rate": 1.2479719668727441e-06, "loss": 1.088, "step": 35881 }, { "epoch": 0.68, "learning_rate": 1.247839742002886e-06, "loss": 1.0282, "step": 35882 }, { "epoch": 0.68, "learning_rate": 1.2477075218085537e-06, "loss": 1.0273, "step": 35883 }, { "epoch": 0.68, "learning_rate": 1.2475753062902447e-06, "loss": 0.8432, "step": 35884 }, { "epoch": 0.68, "learning_rate": 1.2474430954484515e-06, "loss": 0.9569, "step": 35885 }, { "epoch": 0.68, "learning_rate": 1.2473108892836655e-06, "loss": 0.9582, "step": 35886 }, { "epoch": 0.68, "learning_rate": 1.2471786877963844e-06, "loss": 0.8813, "step": 35887 }, { "epoch": 0.68, "learning_rate": 1.2470464909870985e-06, "loss": 1.0709, "step": 35888 }, { "epoch": 0.68, "learning_rate": 1.2469142988563027e-06, "loss": 0.7919, "step": 35889 }, { "epoch": 0.68, "learning_rate": 1.2467821114044903e-06, "loss": 0.6704, "step": 35890 }, { "epoch": 0.68, "learning_rate": 1.2466499286321552e-06, "loss": 0.6993, "step": 35891 }, { "epoch": 0.68, "learning_rate": 1.2465177505397907e-06, "loss": 0.9263, "step": 35892 }, { "epoch": 0.68, "learning_rate": 1.2463855771278907e-06, "loss": 0.9657, "step": 35893 }, { "epoch": 0.68, "learning_rate": 1.2462534083969493e-06, "loss": 0.9632, "step": 35894 }, { "epoch": 0.68, "learning_rate": 1.2461212443474576e-06, "loss": 0.8529, "step": 35895 }, { "epoch": 0.68, "learning_rate": 1.2459890849799125e-06, "loss": 0.9626, "step": 35896 }, { "epoch": 0.68, "learning_rate": 1.2458569302948048e-06, "loss": 0.9517, "step": 35897 }, { "epoch": 0.68, "learning_rate": 1.2457247802926286e-06, "loss": 0.9821, "step": 35898 }, { "epoch": 0.68, "learning_rate": 1.2455926349738778e-06, "loss": 0.9551, "step": 35899 }, { "epoch": 0.68, "learning_rate": 1.2454604943390457e-06, "loss": 1.1929, "step": 35900 }, { "epoch": 0.68, "learning_rate": 1.2453283583886256e-06, "loss": 0.9105, "step": 35901 }, { "epoch": 0.68, "learning_rate": 1.2451962271231109e-06, "loss": 0.9489, "step": 35902 }, { "epoch": 0.68, "learning_rate": 1.2450641005429961e-06, "loss": 1.0998, "step": 35903 }, { "epoch": 0.68, "learning_rate": 1.2449319786487712e-06, "loss": 0.9932, "step": 35904 }, { "epoch": 0.68, "learning_rate": 1.2447998614409331e-06, "loss": 0.9507, "step": 35905 }, { "epoch": 0.68, "learning_rate": 1.2446677489199748e-06, "loss": 0.9541, "step": 35906 }, { "epoch": 0.68, "learning_rate": 1.2445356410863865e-06, "loss": 0.9113, "step": 35907 }, { "epoch": 0.68, "learning_rate": 1.2444035379406658e-06, "loss": 0.8549, "step": 35908 }, { "epoch": 0.68, "learning_rate": 1.2442714394833027e-06, "loss": 0.8041, "step": 35909 }, { "epoch": 0.68, "learning_rate": 1.2441393457147916e-06, "loss": 0.8576, "step": 35910 }, { "epoch": 0.68, "learning_rate": 1.2440072566356257e-06, "loss": 0.9259, "step": 35911 }, { "epoch": 0.68, "learning_rate": 1.243875172246298e-06, "loss": 1.0853, "step": 35912 }, { "epoch": 0.68, "learning_rate": 1.2437430925473022e-06, "loss": 1.0783, "step": 35913 }, { "epoch": 0.68, "learning_rate": 1.2436110175391308e-06, "loss": 0.9973, "step": 35914 }, { "epoch": 0.68, "learning_rate": 1.2434789472222786e-06, "loss": 1.0149, "step": 35915 }, { "epoch": 0.68, "learning_rate": 1.2433468815972355e-06, "loss": 1.0134, "step": 35916 }, { "epoch": 0.68, "learning_rate": 1.2432148206644984e-06, "loss": 0.9377, "step": 35917 }, { "epoch": 0.68, "learning_rate": 1.2430827644245576e-06, "loss": 0.9251, "step": 35918 }, { "epoch": 0.68, "learning_rate": 1.2429507128779074e-06, "loss": 0.8909, "step": 35919 }, { "epoch": 0.68, "learning_rate": 1.2428186660250408e-06, "loss": 0.8916, "step": 35920 }, { "epoch": 0.68, "learning_rate": 1.2426866238664506e-06, "loss": 0.9965, "step": 35921 }, { "epoch": 0.68, "learning_rate": 1.24255458640263e-06, "loss": 0.9488, "step": 35922 }, { "epoch": 0.68, "learning_rate": 1.242422553634072e-06, "loss": 0.742, "step": 35923 }, { "epoch": 0.68, "learning_rate": 1.2422905255612707e-06, "loss": 0.8765, "step": 35924 }, { "epoch": 0.68, "learning_rate": 1.242158502184716e-06, "loss": 1.0546, "step": 35925 }, { "epoch": 0.68, "learning_rate": 1.242026483504904e-06, "loss": 0.9754, "step": 35926 }, { "epoch": 0.68, "learning_rate": 1.2418944695223272e-06, "loss": 0.9787, "step": 35927 }, { "epoch": 0.68, "learning_rate": 1.2417624602374762e-06, "loss": 0.9268, "step": 35928 }, { "epoch": 0.68, "learning_rate": 1.2416304556508473e-06, "loss": 0.7932, "step": 35929 }, { "epoch": 0.68, "learning_rate": 1.241498455762931e-06, "loss": 0.8467, "step": 35930 }, { "epoch": 0.68, "learning_rate": 1.2413664605742208e-06, "loss": 1.1504, "step": 35931 }, { "epoch": 0.68, "learning_rate": 1.2412344700852094e-06, "loss": 1.0248, "step": 35932 }, { "epoch": 0.68, "learning_rate": 1.2411024842963904e-06, "loss": 0.9283, "step": 35933 }, { "epoch": 0.68, "learning_rate": 1.2409705032082556e-06, "loss": 0.7781, "step": 35934 }, { "epoch": 0.68, "learning_rate": 1.2408385268212986e-06, "loss": 0.7821, "step": 35935 }, { "epoch": 0.68, "learning_rate": 1.240706555136013e-06, "loss": 0.7412, "step": 35936 }, { "epoch": 0.68, "learning_rate": 1.2405745881528884e-06, "loss": 0.9847, "step": 35937 }, { "epoch": 0.68, "learning_rate": 1.2404426258724216e-06, "loss": 1.1727, "step": 35938 }, { "epoch": 0.68, "learning_rate": 1.2403106682951024e-06, "loss": 0.9264, "step": 35939 }, { "epoch": 0.68, "learning_rate": 1.240178715421425e-06, "loss": 0.8408, "step": 35940 }, { "epoch": 0.68, "learning_rate": 1.240046767251881e-06, "loss": 0.8099, "step": 35941 }, { "epoch": 0.68, "learning_rate": 1.239914823786964e-06, "loss": 0.9131, "step": 35942 }, { "epoch": 0.68, "learning_rate": 1.2397828850271665e-06, "loss": 0.8247, "step": 35943 }, { "epoch": 0.68, "learning_rate": 1.239650950972981e-06, "loss": 0.9455, "step": 35944 }, { "epoch": 0.68, "learning_rate": 1.2395190216249011e-06, "loss": 0.815, "step": 35945 }, { "epoch": 0.68, "learning_rate": 1.2393870969834168e-06, "loss": 0.9804, "step": 35946 }, { "epoch": 0.68, "learning_rate": 1.2392551770490232e-06, "loss": 0.8469, "step": 35947 }, { "epoch": 0.68, "learning_rate": 1.2391232618222133e-06, "loss": 0.8198, "step": 35948 }, { "epoch": 0.68, "learning_rate": 1.2389913513034762e-06, "loss": 0.8209, "step": 35949 }, { "epoch": 0.68, "learning_rate": 1.2388594454933089e-06, "loss": 1.0651, "step": 35950 }, { "epoch": 0.68, "learning_rate": 1.2387275443922009e-06, "loss": 0.8221, "step": 35951 }, { "epoch": 0.68, "learning_rate": 1.2385956480006452e-06, "loss": 0.9901, "step": 35952 }, { "epoch": 0.68, "learning_rate": 1.238463756319135e-06, "loss": 0.9368, "step": 35953 }, { "epoch": 0.68, "learning_rate": 1.2383318693481625e-06, "loss": 0.8535, "step": 35954 }, { "epoch": 0.68, "learning_rate": 1.2381999870882199e-06, "loss": 0.8297, "step": 35955 }, { "epoch": 0.68, "learning_rate": 1.2380681095397998e-06, "loss": 1.2593, "step": 35956 }, { "epoch": 0.68, "learning_rate": 1.2379362367033958e-06, "loss": 0.9985, "step": 35957 }, { "epoch": 0.68, "learning_rate": 1.2378043685794974e-06, "loss": 0.7352, "step": 35958 }, { "epoch": 0.68, "learning_rate": 1.2376725051686006e-06, "loss": 0.9227, "step": 35959 }, { "epoch": 0.68, "learning_rate": 1.237540646471195e-06, "loss": 0.764, "step": 35960 }, { "epoch": 0.68, "learning_rate": 1.2374087924877736e-06, "loss": 0.7656, "step": 35961 }, { "epoch": 0.68, "learning_rate": 1.2372769432188294e-06, "loss": 1.2006, "step": 35962 }, { "epoch": 0.68, "learning_rate": 1.2371450986648545e-06, "loss": 0.8753, "step": 35963 }, { "epoch": 0.68, "learning_rate": 1.2370132588263408e-06, "loss": 0.9272, "step": 35964 }, { "epoch": 0.68, "learning_rate": 1.236881423703781e-06, "loss": 0.9604, "step": 35965 }, { "epoch": 0.68, "learning_rate": 1.2367495932976683e-06, "loss": 0.8734, "step": 35966 }, { "epoch": 0.68, "learning_rate": 1.2366177676084917e-06, "loss": 1.0153, "step": 35967 }, { "epoch": 0.68, "learning_rate": 1.2364859466367468e-06, "loss": 0.8681, "step": 35968 }, { "epoch": 0.68, "learning_rate": 1.2363541303829254e-06, "loss": 0.8708, "step": 35969 }, { "epoch": 0.68, "learning_rate": 1.2362223188475172e-06, "loss": 0.9166, "step": 35970 }, { "epoch": 0.68, "learning_rate": 1.236090512031018e-06, "loss": 0.7924, "step": 35971 }, { "epoch": 0.68, "learning_rate": 1.235958709933917e-06, "loss": 0.9498, "step": 35972 }, { "epoch": 0.68, "learning_rate": 1.2358269125567076e-06, "loss": 0.8017, "step": 35973 }, { "epoch": 0.68, "learning_rate": 1.2356951198998815e-06, "loss": 0.7995, "step": 35974 }, { "epoch": 0.68, "learning_rate": 1.2355633319639313e-06, "loss": 1.1125, "step": 35975 }, { "epoch": 0.68, "learning_rate": 1.2354315487493488e-06, "loss": 0.8971, "step": 35976 }, { "epoch": 0.68, "learning_rate": 1.235299770256626e-06, "loss": 0.9402, "step": 35977 }, { "epoch": 0.68, "learning_rate": 1.2351679964862562e-06, "loss": 1.0902, "step": 35978 }, { "epoch": 0.68, "learning_rate": 1.2350362274387284e-06, "loss": 0.9625, "step": 35979 }, { "epoch": 0.68, "learning_rate": 1.2349044631145381e-06, "loss": 0.9294, "step": 35980 }, { "epoch": 0.68, "learning_rate": 1.2347727035141753e-06, "loss": 0.98, "step": 35981 }, { "epoch": 0.68, "learning_rate": 1.2346409486381323e-06, "loss": 0.8058, "step": 35982 }, { "epoch": 0.68, "learning_rate": 1.234509198486901e-06, "loss": 0.9067, "step": 35983 }, { "epoch": 0.68, "learning_rate": 1.2343774530609737e-06, "loss": 0.9613, "step": 35984 }, { "epoch": 0.68, "learning_rate": 1.234245712360842e-06, "loss": 0.7669, "step": 35985 }, { "epoch": 0.68, "learning_rate": 1.2341139763869984e-06, "loss": 0.9021, "step": 35986 }, { "epoch": 0.68, "learning_rate": 1.233982245139935e-06, "loss": 0.9166, "step": 35987 }, { "epoch": 0.68, "learning_rate": 1.233850518620141e-06, "loss": 0.9536, "step": 35988 }, { "epoch": 0.68, "learning_rate": 1.2337187968281116e-06, "loss": 0.7772, "step": 35989 }, { "epoch": 0.68, "learning_rate": 1.2335870797643384e-06, "loss": 0.9553, "step": 35990 }, { "epoch": 0.68, "learning_rate": 1.23345536742931e-06, "loss": 0.823, "step": 35991 }, { "epoch": 0.68, "learning_rate": 1.233323659823523e-06, "loss": 0.7675, "step": 35992 }, { "epoch": 0.68, "learning_rate": 1.2331919569474652e-06, "loss": 0.9706, "step": 35993 }, { "epoch": 0.68, "learning_rate": 1.2330602588016296e-06, "loss": 1.0283, "step": 35994 }, { "epoch": 0.68, "learning_rate": 1.2329285653865084e-06, "loss": 1.1032, "step": 35995 }, { "epoch": 0.68, "learning_rate": 1.232796876702593e-06, "loss": 0.7668, "step": 35996 }, { "epoch": 0.68, "learning_rate": 1.2326651927503753e-06, "loss": 0.984, "step": 35997 }, { "epoch": 0.68, "learning_rate": 1.2325335135303468e-06, "loss": 0.8943, "step": 35998 }, { "epoch": 0.68, "learning_rate": 1.2324018390430003e-06, "loss": 1.1266, "step": 35999 }, { "epoch": 0.68, "learning_rate": 1.2322701692888244e-06, "loss": 1.0931, "step": 36000 }, { "epoch": 0.68, "learning_rate": 1.2321385042683152e-06, "loss": 0.943, "step": 36001 }, { "epoch": 0.68, "learning_rate": 1.2320068439819604e-06, "loss": 0.7437, "step": 36002 }, { "epoch": 0.68, "learning_rate": 1.2318751884302536e-06, "loss": 0.8538, "step": 36003 }, { "epoch": 0.68, "learning_rate": 1.2317435376136858e-06, "loss": 1.0052, "step": 36004 }, { "epoch": 0.68, "learning_rate": 1.2316118915327488e-06, "loss": 1.1004, "step": 36005 }, { "epoch": 0.68, "learning_rate": 1.231480250187934e-06, "loss": 1.1698, "step": 36006 }, { "epoch": 0.68, "learning_rate": 1.231348613579733e-06, "loss": 0.9825, "step": 36007 }, { "epoch": 0.68, "learning_rate": 1.2312169817086386e-06, "loss": 0.8348, "step": 36008 }, { "epoch": 0.68, "learning_rate": 1.2310853545751392e-06, "loss": 0.7639, "step": 36009 }, { "epoch": 0.68, "learning_rate": 1.2309537321797288e-06, "loss": 0.9387, "step": 36010 }, { "epoch": 0.68, "learning_rate": 1.2308221145228994e-06, "loss": 0.7248, "step": 36011 }, { "epoch": 0.68, "learning_rate": 1.2306905016051395e-06, "loss": 0.9118, "step": 36012 }, { "epoch": 0.68, "learning_rate": 1.2305588934269442e-06, "loss": 0.9154, "step": 36013 }, { "epoch": 0.68, "learning_rate": 1.230427289988802e-06, "loss": 0.8797, "step": 36014 }, { "epoch": 0.68, "learning_rate": 1.2302956912912053e-06, "loss": 0.8854, "step": 36015 }, { "epoch": 0.68, "learning_rate": 1.2301640973346458e-06, "loss": 0.709, "step": 36016 }, { "epoch": 0.68, "learning_rate": 1.2300325081196147e-06, "loss": 0.763, "step": 36017 }, { "epoch": 0.68, "learning_rate": 1.2299009236466029e-06, "loss": 1.1014, "step": 36018 }, { "epoch": 0.68, "learning_rate": 1.2297693439161023e-06, "loss": 1.2732, "step": 36019 }, { "epoch": 0.68, "learning_rate": 1.2296377689286052e-06, "loss": 0.812, "step": 36020 }, { "epoch": 0.68, "learning_rate": 1.2295061986845994e-06, "loss": 1.0179, "step": 36021 }, { "epoch": 0.68, "learning_rate": 1.2293746331845808e-06, "loss": 1.0239, "step": 36022 }, { "epoch": 0.68, "learning_rate": 1.229243072429037e-06, "loss": 1.0162, "step": 36023 }, { "epoch": 0.68, "learning_rate": 1.2291115164184608e-06, "loss": 0.8902, "step": 36024 }, { "epoch": 0.68, "learning_rate": 1.2289799651533433e-06, "loss": 1.1252, "step": 36025 }, { "epoch": 0.68, "learning_rate": 1.2288484186341756e-06, "loss": 0.7686, "step": 36026 }, { "epoch": 0.68, "learning_rate": 1.2287168768614488e-06, "loss": 0.9861, "step": 36027 }, { "epoch": 0.68, "learning_rate": 1.2285853398356546e-06, "loss": 0.8354, "step": 36028 }, { "epoch": 0.68, "learning_rate": 1.2284538075572844e-06, "loss": 0.9513, "step": 36029 }, { "epoch": 0.68, "learning_rate": 1.2283222800268265e-06, "loss": 0.8294, "step": 36030 }, { "epoch": 0.68, "learning_rate": 1.2281907572447758e-06, "loss": 1.0983, "step": 36031 }, { "epoch": 0.68, "learning_rate": 1.2280592392116223e-06, "loss": 0.8402, "step": 36032 }, { "epoch": 0.68, "learning_rate": 1.227927725927855e-06, "loss": 0.6992, "step": 36033 }, { "epoch": 0.68, "learning_rate": 1.2277962173939684e-06, "loss": 0.8932, "step": 36034 }, { "epoch": 0.68, "learning_rate": 1.2276647136104506e-06, "loss": 0.7437, "step": 36035 }, { "epoch": 0.68, "learning_rate": 1.2275332145777939e-06, "loss": 0.7603, "step": 36036 }, { "epoch": 0.68, "learning_rate": 1.227401720296489e-06, "loss": 1.1005, "step": 36037 }, { "epoch": 0.68, "learning_rate": 1.2272702307670272e-06, "loss": 0.9572, "step": 36038 }, { "epoch": 0.68, "learning_rate": 1.2271387459898992e-06, "loss": 1.0245, "step": 36039 }, { "epoch": 0.68, "learning_rate": 1.2270072659655962e-06, "loss": 1.0142, "step": 36040 }, { "epoch": 0.68, "learning_rate": 1.22687579069461e-06, "loss": 0.8916, "step": 36041 }, { "epoch": 0.68, "learning_rate": 1.2267443201774287e-06, "loss": 0.8633, "step": 36042 }, { "epoch": 0.68, "learning_rate": 1.226612854414547e-06, "loss": 0.9867, "step": 36043 }, { "epoch": 0.68, "learning_rate": 1.226481393406453e-06, "loss": 0.7828, "step": 36044 }, { "epoch": 0.68, "learning_rate": 1.226349937153638e-06, "loss": 0.8672, "step": 36045 }, { "epoch": 0.68, "learning_rate": 1.2262184856565937e-06, "loss": 0.9472, "step": 36046 }, { "epoch": 0.68, "learning_rate": 1.2260870389158103e-06, "loss": 0.717, "step": 36047 }, { "epoch": 0.68, "learning_rate": 1.2259555969317789e-06, "loss": 0.9505, "step": 36048 }, { "epoch": 0.68, "learning_rate": 1.2258241597049902e-06, "loss": 1.0964, "step": 36049 }, { "epoch": 0.68, "learning_rate": 1.225692727235936e-06, "loss": 1.2026, "step": 36050 }, { "epoch": 0.68, "learning_rate": 1.2255612995251042e-06, "loss": 0.5494, "step": 36051 }, { "epoch": 0.68, "learning_rate": 1.2254298765729883e-06, "loss": 0.8443, "step": 36052 }, { "epoch": 0.68, "learning_rate": 1.2252984583800792e-06, "loss": 0.8873, "step": 36053 }, { "epoch": 0.68, "learning_rate": 1.2251670449468647e-06, "loss": 0.7941, "step": 36054 }, { "epoch": 0.68, "learning_rate": 1.2250356362738392e-06, "loss": 0.9062, "step": 36055 }, { "epoch": 0.68, "learning_rate": 1.2249042323614906e-06, "loss": 1.0307, "step": 36056 }, { "epoch": 0.68, "learning_rate": 1.2247728332103106e-06, "loss": 0.9243, "step": 36057 }, { "epoch": 0.68, "learning_rate": 1.2246414388207898e-06, "loss": 0.8979, "step": 36058 }, { "epoch": 0.68, "learning_rate": 1.2245100491934183e-06, "loss": 0.8837, "step": 36059 }, { "epoch": 0.68, "learning_rate": 1.2243786643286875e-06, "loss": 0.7963, "step": 36060 }, { "epoch": 0.68, "learning_rate": 1.2242472842270877e-06, "loss": 0.9222, "step": 36061 }, { "epoch": 0.68, "learning_rate": 1.2241159088891105e-06, "loss": 1.1744, "step": 36062 }, { "epoch": 0.68, "learning_rate": 1.2239845383152441e-06, "loss": 1.1057, "step": 36063 }, { "epoch": 0.68, "learning_rate": 1.2238531725059804e-06, "loss": 0.9202, "step": 36064 }, { "epoch": 0.68, "learning_rate": 1.2237218114618103e-06, "loss": 0.8338, "step": 36065 }, { "epoch": 0.68, "learning_rate": 1.2235904551832232e-06, "loss": 0.9084, "step": 36066 }, { "epoch": 0.68, "learning_rate": 1.2234591036707103e-06, "loss": 0.8798, "step": 36067 }, { "epoch": 0.68, "learning_rate": 1.2233277569247623e-06, "loss": 0.7189, "step": 36068 }, { "epoch": 0.68, "learning_rate": 1.22319641494587e-06, "loss": 1.1705, "step": 36069 }, { "epoch": 0.68, "learning_rate": 1.2230650777345212e-06, "loss": 0.9002, "step": 36070 }, { "epoch": 0.68, "learning_rate": 1.2229337452912102e-06, "loss": 1.0096, "step": 36071 }, { "epoch": 0.68, "learning_rate": 1.2228024176164246e-06, "loss": 0.7119, "step": 36072 }, { "epoch": 0.68, "learning_rate": 1.2226710947106546e-06, "loss": 0.7806, "step": 36073 }, { "epoch": 0.68, "learning_rate": 1.2225397765743934e-06, "loss": 1.0891, "step": 36074 }, { "epoch": 0.68, "learning_rate": 1.2224084632081287e-06, "loss": 0.9726, "step": 36075 }, { "epoch": 0.68, "learning_rate": 1.2222771546123515e-06, "loss": 0.7543, "step": 36076 }, { "epoch": 0.68, "learning_rate": 1.2221458507875522e-06, "loss": 0.8273, "step": 36077 }, { "epoch": 0.68, "learning_rate": 1.2220145517342214e-06, "loss": 1.0769, "step": 36078 }, { "epoch": 0.68, "learning_rate": 1.2218832574528486e-06, "loss": 0.8978, "step": 36079 }, { "epoch": 0.68, "learning_rate": 1.2217519679439249e-06, "loss": 0.7732, "step": 36080 }, { "epoch": 0.68, "learning_rate": 1.2216206832079411e-06, "loss": 1.1239, "step": 36081 }, { "epoch": 0.68, "learning_rate": 1.2214894032453845e-06, "loss": 0.9482, "step": 36082 }, { "epoch": 0.68, "learning_rate": 1.221358128056749e-06, "loss": 0.7442, "step": 36083 }, { "epoch": 0.68, "learning_rate": 1.2212268576425223e-06, "loss": 0.8671, "step": 36084 }, { "epoch": 0.68, "learning_rate": 1.2210955920031954e-06, "loss": 0.9481, "step": 36085 }, { "epoch": 0.68, "learning_rate": 1.220964331139258e-06, "loss": 0.7771, "step": 36086 }, { "epoch": 0.68, "learning_rate": 1.2208330750512006e-06, "loss": 1.0145, "step": 36087 }, { "epoch": 0.68, "learning_rate": 1.2207018237395135e-06, "loss": 1.0704, "step": 36088 }, { "epoch": 0.68, "learning_rate": 1.2205705772046867e-06, "loss": 0.8702, "step": 36089 }, { "epoch": 0.68, "learning_rate": 1.2204393354472108e-06, "loss": 0.8531, "step": 36090 }, { "epoch": 0.68, "learning_rate": 1.2203080984675733e-06, "loss": 1.0276, "step": 36091 }, { "epoch": 0.68, "learning_rate": 1.2201768662662683e-06, "loss": 0.9191, "step": 36092 }, { "epoch": 0.68, "learning_rate": 1.2200456388437824e-06, "loss": 0.9749, "step": 36093 }, { "epoch": 0.68, "learning_rate": 1.219914416200606e-06, "loss": 0.9807, "step": 36094 }, { "epoch": 0.68, "learning_rate": 1.2197831983372318e-06, "loss": 0.9167, "step": 36095 }, { "epoch": 0.68, "learning_rate": 1.2196519852541469e-06, "loss": 0.9185, "step": 36096 }, { "epoch": 0.68, "learning_rate": 1.2195207769518422e-06, "loss": 0.7145, "step": 36097 }, { "epoch": 0.68, "learning_rate": 1.2193895734308078e-06, "loss": 0.8735, "step": 36098 }, { "epoch": 0.68, "learning_rate": 1.2192583746915335e-06, "loss": 0.8256, "step": 36099 }, { "epoch": 0.68, "learning_rate": 1.2191271807345089e-06, "loss": 0.9354, "step": 36100 }, { "epoch": 0.68, "learning_rate": 1.2189959915602245e-06, "loss": 0.9682, "step": 36101 }, { "epoch": 0.68, "learning_rate": 1.2188648071691705e-06, "loss": 0.7144, "step": 36102 }, { "epoch": 0.68, "learning_rate": 1.2187336275618342e-06, "loss": 0.8386, "step": 36103 }, { "epoch": 0.68, "learning_rate": 1.2186024527387092e-06, "loss": 0.7705, "step": 36104 }, { "epoch": 0.68, "learning_rate": 1.218471282700282e-06, "loss": 1.0909, "step": 36105 }, { "epoch": 0.68, "learning_rate": 1.218340117447044e-06, "loss": 1.2303, "step": 36106 }, { "epoch": 0.68, "learning_rate": 1.2182089569794849e-06, "loss": 0.8163, "step": 36107 }, { "epoch": 0.68, "learning_rate": 1.2180778012980943e-06, "loss": 0.9165, "step": 36108 }, { "epoch": 0.68, "learning_rate": 1.2179466504033616e-06, "loss": 0.866, "step": 36109 }, { "epoch": 0.68, "learning_rate": 1.2178155042957768e-06, "loss": 0.7681, "step": 36110 }, { "epoch": 0.68, "learning_rate": 1.217684362975831e-06, "loss": 0.7536, "step": 36111 }, { "epoch": 0.68, "learning_rate": 1.21755322644401e-06, "loss": 1.0782, "step": 36112 }, { "epoch": 0.68, "learning_rate": 1.217422094700808e-06, "loss": 1.1516, "step": 36113 }, { "epoch": 0.68, "learning_rate": 1.2172909677467118e-06, "loss": 1.0531, "step": 36114 }, { "epoch": 0.68, "learning_rate": 1.2171598455822105e-06, "loss": 0.8011, "step": 36115 }, { "epoch": 0.68, "learning_rate": 1.2170287282077973e-06, "loss": 0.8625, "step": 36116 }, { "epoch": 0.68, "learning_rate": 1.2168976156239584e-06, "loss": 0.9576, "step": 36117 }, { "epoch": 0.68, "learning_rate": 1.2167665078311844e-06, "loss": 1.1326, "step": 36118 }, { "epoch": 0.68, "learning_rate": 1.216635404829965e-06, "loss": 1.0025, "step": 36119 }, { "epoch": 0.68, "learning_rate": 1.2165043066207893e-06, "loss": 0.902, "step": 36120 }, { "epoch": 0.68, "learning_rate": 1.2163732132041475e-06, "loss": 0.7138, "step": 36121 }, { "epoch": 0.68, "learning_rate": 1.2162421245805289e-06, "loss": 0.8578, "step": 36122 }, { "epoch": 0.68, "learning_rate": 1.2161110407504237e-06, "loss": 0.7047, "step": 36123 }, { "epoch": 0.68, "learning_rate": 1.2159799617143183e-06, "loss": 0.9395, "step": 36124 }, { "epoch": 0.68, "learning_rate": 1.2158488874727065e-06, "loss": 1.134, "step": 36125 }, { "epoch": 0.68, "learning_rate": 1.2157178180260748e-06, "loss": 0.9228, "step": 36126 }, { "epoch": 0.68, "learning_rate": 1.215586753374913e-06, "loss": 0.8677, "step": 36127 }, { "epoch": 0.68, "learning_rate": 1.2154556935197112e-06, "loss": 0.8664, "step": 36128 }, { "epoch": 0.68, "learning_rate": 1.2153246384609581e-06, "loss": 0.7651, "step": 36129 }, { "epoch": 0.68, "learning_rate": 1.2151935881991439e-06, "loss": 0.8605, "step": 36130 }, { "epoch": 0.68, "learning_rate": 1.2150625427347573e-06, "loss": 1.0231, "step": 36131 }, { "epoch": 0.68, "learning_rate": 1.2149315020682886e-06, "loss": 1.0086, "step": 36132 }, { "epoch": 0.68, "learning_rate": 1.2148004662002244e-06, "loss": 0.9314, "step": 36133 }, { "epoch": 0.68, "learning_rate": 1.2146694351310576e-06, "loss": 0.7485, "step": 36134 }, { "epoch": 0.68, "learning_rate": 1.214538408861275e-06, "loss": 0.8061, "step": 36135 }, { "epoch": 0.68, "learning_rate": 1.2144073873913656e-06, "loss": 0.9294, "step": 36136 }, { "epoch": 0.68, "learning_rate": 1.2142763707218214e-06, "loss": 0.8803, "step": 36137 }, { "epoch": 0.68, "learning_rate": 1.2141453588531288e-06, "loss": 0.8979, "step": 36138 }, { "epoch": 0.68, "learning_rate": 1.214014351785778e-06, "loss": 0.9752, "step": 36139 }, { "epoch": 0.68, "learning_rate": 1.2138833495202584e-06, "loss": 0.9635, "step": 36140 }, { "epoch": 0.68, "learning_rate": 1.2137523520570588e-06, "loss": 0.7803, "step": 36141 }, { "epoch": 0.68, "learning_rate": 1.2136213593966687e-06, "loss": 0.8513, "step": 36142 }, { "epoch": 0.68, "learning_rate": 1.2134903715395765e-06, "loss": 1.0238, "step": 36143 }, { "epoch": 0.68, "learning_rate": 1.2133593884862733e-06, "loss": 0.8255, "step": 36144 }, { "epoch": 0.68, "learning_rate": 1.2132284102372444e-06, "loss": 1.0305, "step": 36145 }, { "epoch": 0.68, "learning_rate": 1.2130974367929832e-06, "loss": 0.7097, "step": 36146 }, { "epoch": 0.68, "learning_rate": 1.212966468153976e-06, "loss": 1.0358, "step": 36147 }, { "epoch": 0.68, "learning_rate": 1.2128355043207122e-06, "loss": 0.7817, "step": 36148 }, { "epoch": 0.68, "learning_rate": 1.2127045452936815e-06, "loss": 0.9974, "step": 36149 }, { "epoch": 0.68, "learning_rate": 1.2125735910733722e-06, "loss": 1.1501, "step": 36150 }, { "epoch": 0.68, "learning_rate": 1.2124426416602738e-06, "loss": 0.9926, "step": 36151 }, { "epoch": 0.68, "learning_rate": 1.212311697054875e-06, "loss": 0.7691, "step": 36152 }, { "epoch": 0.68, "learning_rate": 1.2121807572576657e-06, "loss": 0.9565, "step": 36153 }, { "epoch": 0.68, "learning_rate": 1.2120498222691323e-06, "loss": 0.7531, "step": 36154 }, { "epoch": 0.68, "learning_rate": 1.2119188920897674e-06, "loss": 0.8873, "step": 36155 }, { "epoch": 0.68, "learning_rate": 1.2117879667200565e-06, "loss": 1.0912, "step": 36156 }, { "epoch": 0.68, "learning_rate": 1.2116570461604893e-06, "loss": 1.0447, "step": 36157 }, { "epoch": 0.68, "learning_rate": 1.2115261304115569e-06, "loss": 0.6796, "step": 36158 }, { "epoch": 0.68, "learning_rate": 1.2113952194737454e-06, "loss": 0.8804, "step": 36159 }, { "epoch": 0.68, "learning_rate": 1.2112643133475448e-06, "loss": 0.9349, "step": 36160 }, { "epoch": 0.68, "learning_rate": 1.2111334120334436e-06, "loss": 0.9685, "step": 36161 }, { "epoch": 0.68, "learning_rate": 1.2110025155319308e-06, "loss": 0.9485, "step": 36162 }, { "epoch": 0.68, "learning_rate": 1.210871623843495e-06, "loss": 0.9524, "step": 36163 }, { "epoch": 0.68, "learning_rate": 1.2107407369686252e-06, "loss": 0.89, "step": 36164 }, { "epoch": 0.68, "learning_rate": 1.2106098549078108e-06, "loss": 0.9802, "step": 36165 }, { "epoch": 0.68, "learning_rate": 1.2104789776615378e-06, "loss": 0.8519, "step": 36166 }, { "epoch": 0.68, "learning_rate": 1.2103481052302987e-06, "loss": 0.7425, "step": 36167 }, { "epoch": 0.68, "learning_rate": 1.210217237614579e-06, "loss": 1.0041, "step": 36168 }, { "epoch": 0.68, "learning_rate": 1.210086374814869e-06, "loss": 1.1457, "step": 36169 }, { "epoch": 0.68, "learning_rate": 1.2099555168316568e-06, "loss": 0.9554, "step": 36170 }, { "epoch": 0.68, "learning_rate": 1.209824663665431e-06, "loss": 0.8852, "step": 36171 }, { "epoch": 0.68, "learning_rate": 1.2096938153166804e-06, "loss": 0.9641, "step": 36172 }, { "epoch": 0.68, "learning_rate": 1.2095629717858938e-06, "loss": 0.803, "step": 36173 }, { "epoch": 0.68, "learning_rate": 1.2094321330735602e-06, "loss": 0.9698, "step": 36174 }, { "epoch": 0.68, "learning_rate": 1.2093012991801653e-06, "loss": 0.8821, "step": 36175 }, { "epoch": 0.68, "learning_rate": 1.2091704701062019e-06, "loss": 0.9749, "step": 36176 }, { "epoch": 0.68, "learning_rate": 1.2090396458521555e-06, "loss": 0.7296, "step": 36177 }, { "epoch": 0.68, "learning_rate": 1.2089088264185146e-06, "loss": 0.8481, "step": 36178 }, { "epoch": 0.68, "learning_rate": 1.20877801180577e-06, "loss": 0.9122, "step": 36179 }, { "epoch": 0.68, "learning_rate": 1.2086472020144083e-06, "loss": 0.7788, "step": 36180 }, { "epoch": 0.68, "learning_rate": 1.2085163970449182e-06, "loss": 1.0615, "step": 36181 }, { "epoch": 0.68, "learning_rate": 1.2083855968977884e-06, "loss": 1.0119, "step": 36182 }, { "epoch": 0.68, "learning_rate": 1.208254801573507e-06, "loss": 0.8797, "step": 36183 }, { "epoch": 0.68, "learning_rate": 1.2081240110725627e-06, "loss": 0.9474, "step": 36184 }, { "epoch": 0.68, "learning_rate": 1.2079932253954435e-06, "loss": 0.7731, "step": 36185 }, { "epoch": 0.68, "learning_rate": 1.207862444542639e-06, "loss": 0.9174, "step": 36186 }, { "epoch": 0.68, "learning_rate": 1.2077316685146346e-06, "loss": 0.8876, "step": 36187 }, { "epoch": 0.68, "learning_rate": 1.2076008973119225e-06, "loss": 1.0233, "step": 36188 }, { "epoch": 0.68, "learning_rate": 1.2074701309349882e-06, "loss": 0.9506, "step": 36189 }, { "epoch": 0.68, "learning_rate": 1.2073393693843205e-06, "loss": 0.9522, "step": 36190 }, { "epoch": 0.68, "learning_rate": 1.2072086126604083e-06, "loss": 1.0555, "step": 36191 }, { "epoch": 0.68, "learning_rate": 1.2070778607637393e-06, "loss": 0.9005, "step": 36192 }, { "epoch": 0.68, "learning_rate": 1.2069471136948018e-06, "loss": 1.0922, "step": 36193 }, { "epoch": 0.68, "learning_rate": 1.2068163714540844e-06, "loss": 1.1309, "step": 36194 }, { "epoch": 0.68, "learning_rate": 1.206685634042076e-06, "loss": 1.0035, "step": 36195 }, { "epoch": 0.68, "learning_rate": 1.2065549014592617e-06, "loss": 0.8026, "step": 36196 }, { "epoch": 0.68, "learning_rate": 1.2064241737061336e-06, "loss": 0.8693, "step": 36197 }, { "epoch": 0.68, "learning_rate": 1.2062934507831772e-06, "loss": 0.835, "step": 36198 }, { "epoch": 0.68, "learning_rate": 1.2061627326908804e-06, "loss": 0.8845, "step": 36199 }, { "epoch": 0.68, "learning_rate": 1.2060320194297339e-06, "loss": 1.4014, "step": 36200 }, { "epoch": 0.68, "learning_rate": 1.2059013110002236e-06, "loss": 0.9831, "step": 36201 }, { "epoch": 0.68, "learning_rate": 1.205770607402838e-06, "loss": 0.7406, "step": 36202 }, { "epoch": 0.68, "learning_rate": 1.2056399086380651e-06, "loss": 0.7352, "step": 36203 }, { "epoch": 0.68, "learning_rate": 1.2055092147063934e-06, "loss": 0.8001, "step": 36204 }, { "epoch": 0.68, "learning_rate": 1.2053785256083103e-06, "loss": 0.7947, "step": 36205 }, { "epoch": 0.68, "learning_rate": 1.2052478413443044e-06, "loss": 0.6176, "step": 36206 }, { "epoch": 0.68, "learning_rate": 1.2051171619148642e-06, "loss": 0.8243, "step": 36207 }, { "epoch": 0.68, "learning_rate": 1.2049864873204748e-06, "loss": 0.8026, "step": 36208 }, { "epoch": 0.68, "learning_rate": 1.2048558175616282e-06, "loss": 0.8056, "step": 36209 }, { "epoch": 0.68, "learning_rate": 1.2047251526388092e-06, "loss": 0.9522, "step": 36210 }, { "epoch": 0.68, "learning_rate": 1.2045944925525069e-06, "loss": 0.9663, "step": 36211 }, { "epoch": 0.68, "learning_rate": 1.2044638373032089e-06, "loss": 1.1949, "step": 36212 }, { "epoch": 0.68, "learning_rate": 1.2043331868914032e-06, "loss": 0.9813, "step": 36213 }, { "epoch": 0.68, "learning_rate": 1.2042025413175775e-06, "loss": 0.9995, "step": 36214 }, { "epoch": 0.68, "learning_rate": 1.2040719005822201e-06, "loss": 0.7262, "step": 36215 }, { "epoch": 0.68, "learning_rate": 1.2039412646858195e-06, "loss": 1.0237, "step": 36216 }, { "epoch": 0.68, "learning_rate": 1.2038106336288605e-06, "loss": 0.7386, "step": 36217 }, { "epoch": 0.68, "learning_rate": 1.2036800074118346e-06, "loss": 1.0619, "step": 36218 }, { "epoch": 0.68, "learning_rate": 1.2035493860352268e-06, "loss": 1.0661, "step": 36219 }, { "epoch": 0.68, "learning_rate": 1.203418769499525e-06, "loss": 0.7834, "step": 36220 }, { "epoch": 0.68, "learning_rate": 1.2032881578052197e-06, "loss": 0.9141, "step": 36221 }, { "epoch": 0.68, "learning_rate": 1.2031575509527957e-06, "loss": 0.9554, "step": 36222 }, { "epoch": 0.68, "learning_rate": 1.2030269489427416e-06, "loss": 0.8627, "step": 36223 }, { "epoch": 0.68, "learning_rate": 1.2028963517755452e-06, "loss": 0.8962, "step": 36224 }, { "epoch": 0.68, "learning_rate": 1.202765759451694e-06, "loss": 0.9164, "step": 36225 }, { "epoch": 0.68, "learning_rate": 1.2026351719716755e-06, "loss": 0.8489, "step": 36226 }, { "epoch": 0.68, "learning_rate": 1.2025045893359777e-06, "loss": 0.7918, "step": 36227 }, { "epoch": 0.68, "learning_rate": 1.2023740115450892e-06, "loss": 0.9595, "step": 36228 }, { "epoch": 0.68, "learning_rate": 1.2022434385994938e-06, "loss": 0.8701, "step": 36229 }, { "epoch": 0.68, "learning_rate": 1.202112870499684e-06, "loss": 1.0367, "step": 36230 }, { "epoch": 0.68, "learning_rate": 1.201982307246144e-06, "loss": 1.0573, "step": 36231 }, { "epoch": 0.68, "learning_rate": 1.201851748839362e-06, "loss": 0.9701, "step": 36232 }, { "epoch": 0.68, "learning_rate": 1.2017211952798258e-06, "loss": 0.6636, "step": 36233 }, { "epoch": 0.68, "learning_rate": 1.201590646568023e-06, "loss": 0.8379, "step": 36234 }, { "epoch": 0.68, "learning_rate": 1.2014601027044408e-06, "loss": 0.8446, "step": 36235 }, { "epoch": 0.68, "learning_rate": 1.201329563689567e-06, "loss": 0.9548, "step": 36236 }, { "epoch": 0.68, "learning_rate": 1.2011990295238893e-06, "loss": 1.0377, "step": 36237 }, { "epoch": 0.68, "learning_rate": 1.2010685002078931e-06, "loss": 0.9621, "step": 36238 }, { "epoch": 0.68, "learning_rate": 1.2009379757420689e-06, "loss": 0.8201, "step": 36239 }, { "epoch": 0.68, "learning_rate": 1.2008074561269018e-06, "loss": 0.9766, "step": 36240 }, { "epoch": 0.68, "learning_rate": 1.2006769413628788e-06, "loss": 0.8033, "step": 36241 }, { "epoch": 0.68, "learning_rate": 1.20054643145049e-06, "loss": 0.7922, "step": 36242 }, { "epoch": 0.68, "learning_rate": 1.2004159263902202e-06, "loss": 1.1329, "step": 36243 }, { "epoch": 0.68, "learning_rate": 1.2002854261825575e-06, "loss": 0.987, "step": 36244 }, { "epoch": 0.68, "learning_rate": 1.2001549308279888e-06, "loss": 0.9482, "step": 36245 }, { "epoch": 0.68, "learning_rate": 1.2000244403270022e-06, "loss": 0.8992, "step": 36246 }, { "epoch": 0.68, "learning_rate": 1.1998939546800843e-06, "loss": 0.8861, "step": 36247 }, { "epoch": 0.68, "learning_rate": 1.1997634738877226e-06, "loss": 0.848, "step": 36248 }, { "epoch": 0.68, "learning_rate": 1.1996329979504051e-06, "loss": 0.8488, "step": 36249 }, { "epoch": 0.68, "learning_rate": 1.1995025268686162e-06, "loss": 1.1447, "step": 36250 }, { "epoch": 0.68, "learning_rate": 1.199372060642847e-06, "loss": 1.1331, "step": 36251 }, { "epoch": 0.68, "learning_rate": 1.1992415992735814e-06, "loss": 0.8455, "step": 36252 }, { "epoch": 0.68, "learning_rate": 1.199111142761308e-06, "loss": 0.9292, "step": 36253 }, { "epoch": 0.68, "learning_rate": 1.1989806911065138e-06, "loss": 0.9404, "step": 36254 }, { "epoch": 0.68, "learning_rate": 1.1988502443096856e-06, "loss": 0.6931, "step": 36255 }, { "epoch": 0.68, "learning_rate": 1.198719802371311e-06, "loss": 1.2945, "step": 36256 }, { "epoch": 0.68, "learning_rate": 1.1985893652918765e-06, "loss": 0.979, "step": 36257 }, { "epoch": 0.68, "learning_rate": 1.1984589330718702e-06, "loss": 0.7043, "step": 36258 }, { "epoch": 0.68, "learning_rate": 1.1983285057117766e-06, "loss": 1.0178, "step": 36259 }, { "epoch": 0.68, "learning_rate": 1.1981980832120866e-06, "loss": 0.9425, "step": 36260 }, { "epoch": 0.68, "learning_rate": 1.1980676655732837e-06, "loss": 0.8831, "step": 36261 }, { "epoch": 0.68, "learning_rate": 1.1979372527958555e-06, "loss": 1.086, "step": 36262 }, { "epoch": 0.68, "learning_rate": 1.1978068448802915e-06, "loss": 0.8654, "step": 36263 }, { "epoch": 0.68, "learning_rate": 1.197676441827076e-06, "loss": 1.0674, "step": 36264 }, { "epoch": 0.68, "learning_rate": 1.1975460436366967e-06, "loss": 1.0358, "step": 36265 }, { "epoch": 0.68, "learning_rate": 1.1974156503096405e-06, "loss": 0.639, "step": 36266 }, { "epoch": 0.68, "learning_rate": 1.1972852618463942e-06, "loss": 0.9261, "step": 36267 }, { "epoch": 0.68, "learning_rate": 1.197154878247445e-06, "loss": 0.9523, "step": 36268 }, { "epoch": 0.68, "learning_rate": 1.1970244995132793e-06, "loss": 0.8692, "step": 36269 }, { "epoch": 0.68, "learning_rate": 1.1968941256443853e-06, "loss": 0.9568, "step": 36270 }, { "epoch": 0.68, "learning_rate": 1.1967637566412469e-06, "loss": 0.9138, "step": 36271 }, { "epoch": 0.68, "learning_rate": 1.196633392504354e-06, "loss": 0.984, "step": 36272 }, { "epoch": 0.68, "learning_rate": 1.1965030332341917e-06, "loss": 1.1643, "step": 36273 }, { "epoch": 0.68, "learning_rate": 1.1963726788312469e-06, "loss": 1.0793, "step": 36274 }, { "epoch": 0.68, "learning_rate": 1.1962423292960065e-06, "loss": 1.1563, "step": 36275 }, { "epoch": 0.68, "learning_rate": 1.1961119846289573e-06, "loss": 1.0671, "step": 36276 }, { "epoch": 0.68, "learning_rate": 1.195981644830586e-06, "loss": 0.8547, "step": 36277 }, { "epoch": 0.68, "learning_rate": 1.1958513099013794e-06, "loss": 1.0554, "step": 36278 }, { "epoch": 0.68, "learning_rate": 1.1957209798418248e-06, "loss": 0.8752, "step": 36279 }, { "epoch": 0.68, "learning_rate": 1.1955906546524062e-06, "loss": 1.1456, "step": 36280 }, { "epoch": 0.68, "learning_rate": 1.195460334333614e-06, "loss": 0.887, "step": 36281 }, { "epoch": 0.68, "learning_rate": 1.1953300188859317e-06, "loss": 0.8975, "step": 36282 }, { "epoch": 0.68, "learning_rate": 1.1951997083098466e-06, "loss": 0.8217, "step": 36283 }, { "epoch": 0.68, "learning_rate": 1.1950694026058477e-06, "loss": 0.6878, "step": 36284 }, { "epoch": 0.68, "learning_rate": 1.1949391017744183e-06, "loss": 0.763, "step": 36285 }, { "epoch": 0.68, "learning_rate": 1.1948088058160464e-06, "loss": 0.9962, "step": 36286 }, { "epoch": 0.68, "learning_rate": 1.1946785147312187e-06, "loss": 1.1414, "step": 36287 }, { "epoch": 0.68, "learning_rate": 1.194548228520421e-06, "loss": 0.8618, "step": 36288 }, { "epoch": 0.68, "learning_rate": 1.1944179471841405e-06, "loss": 0.8834, "step": 36289 }, { "epoch": 0.68, "learning_rate": 1.1942876707228631e-06, "loss": 0.7663, "step": 36290 }, { "epoch": 0.68, "learning_rate": 1.1941573991370767e-06, "loss": 0.7826, "step": 36291 }, { "epoch": 0.68, "learning_rate": 1.1940271324272645e-06, "loss": 0.8859, "step": 36292 }, { "epoch": 0.68, "learning_rate": 1.1938968705939168e-06, "loss": 1.1486, "step": 36293 }, { "epoch": 0.68, "learning_rate": 1.1937666136375173e-06, "loss": 1.0836, "step": 36294 }, { "epoch": 0.68, "learning_rate": 1.193636361558553e-06, "loss": 0.9788, "step": 36295 }, { "epoch": 0.68, "learning_rate": 1.1935061143575108e-06, "loss": 0.6974, "step": 36296 }, { "epoch": 0.68, "learning_rate": 1.1933758720348764e-06, "loss": 0.699, "step": 36297 }, { "epoch": 0.68, "learning_rate": 1.1932456345911375e-06, "loss": 0.9205, "step": 36298 }, { "epoch": 0.68, "learning_rate": 1.1931154020267777e-06, "loss": 0.8963, "step": 36299 }, { "epoch": 0.68, "learning_rate": 1.1929851743422865e-06, "loss": 1.1514, "step": 36300 }, { "epoch": 0.68, "learning_rate": 1.1928549515381478e-06, "loss": 0.7954, "step": 36301 }, { "epoch": 0.68, "learning_rate": 1.1927247336148484e-06, "loss": 0.708, "step": 36302 }, { "epoch": 0.68, "learning_rate": 1.1925945205728747e-06, "loss": 0.909, "step": 36303 }, { "epoch": 0.68, "learning_rate": 1.1924643124127134e-06, "loss": 0.9965, "step": 36304 }, { "epoch": 0.68, "learning_rate": 1.19233410913485e-06, "loss": 0.9116, "step": 36305 }, { "epoch": 0.68, "learning_rate": 1.1922039107397708e-06, "loss": 0.9578, "step": 36306 }, { "epoch": 0.68, "learning_rate": 1.1920737172279633e-06, "loss": 0.8471, "step": 36307 }, { "epoch": 0.69, "learning_rate": 1.1919435285999106e-06, "loss": 0.8726, "step": 36308 }, { "epoch": 0.69, "learning_rate": 1.1918133448561014e-06, "loss": 0.9659, "step": 36309 }, { "epoch": 0.69, "learning_rate": 1.1916831659970221e-06, "loss": 0.7728, "step": 36310 }, { "epoch": 0.69, "learning_rate": 1.191552992023156e-06, "loss": 1.0199, "step": 36311 }, { "epoch": 0.69, "learning_rate": 1.1914228229349926e-06, "loss": 1.2845, "step": 36312 }, { "epoch": 0.69, "learning_rate": 1.1912926587330153e-06, "loss": 1.0151, "step": 36313 }, { "epoch": 0.69, "learning_rate": 1.1911624994177113e-06, "loss": 1.0382, "step": 36314 }, { "epoch": 0.69, "learning_rate": 1.191032344989566e-06, "loss": 0.9122, "step": 36315 }, { "epoch": 0.69, "learning_rate": 1.1909021954490663e-06, "loss": 0.7539, "step": 36316 }, { "epoch": 0.69, "learning_rate": 1.190772050796697e-06, "loss": 0.847, "step": 36317 }, { "epoch": 0.69, "learning_rate": 1.1906419110329453e-06, "loss": 1.0667, "step": 36318 }, { "epoch": 0.69, "learning_rate": 1.1905117761582974e-06, "loss": 1.1006, "step": 36319 }, { "epoch": 0.69, "learning_rate": 1.1903816461732364e-06, "loss": 1.007, "step": 36320 }, { "epoch": 0.69, "learning_rate": 1.1902515210782524e-06, "loss": 0.7982, "step": 36321 }, { "epoch": 0.69, "learning_rate": 1.1901214008738277e-06, "loss": 1.0685, "step": 36322 }, { "epoch": 0.69, "learning_rate": 1.1899912855604496e-06, "loss": 0.8538, "step": 36323 }, { "epoch": 0.69, "learning_rate": 1.189861175138604e-06, "loss": 0.7841, "step": 36324 }, { "epoch": 0.69, "learning_rate": 1.1897310696087763e-06, "loss": 1.0867, "step": 36325 }, { "epoch": 0.69, "learning_rate": 1.1896009689714527e-06, "loss": 0.8983, "step": 36326 }, { "epoch": 0.69, "learning_rate": 1.189470873227119e-06, "loss": 0.9857, "step": 36327 }, { "epoch": 0.69, "learning_rate": 1.189340782376262e-06, "loss": 0.762, "step": 36328 }, { "epoch": 0.69, "learning_rate": 1.1892106964193641e-06, "loss": 0.6146, "step": 36329 }, { "epoch": 0.69, "learning_rate": 1.1890806153569145e-06, "loss": 1.0101, "step": 36330 }, { "epoch": 0.69, "learning_rate": 1.1889505391893985e-06, "loss": 0.9272, "step": 36331 }, { "epoch": 0.69, "learning_rate": 1.188820467917299e-06, "loss": 1.0905, "step": 36332 }, { "epoch": 0.69, "learning_rate": 1.1886904015411058e-06, "loss": 0.7292, "step": 36333 }, { "epoch": 0.69, "learning_rate": 1.1885603400613013e-06, "loss": 0.9672, "step": 36334 }, { "epoch": 0.69, "learning_rate": 1.1884302834783726e-06, "loss": 0.8134, "step": 36335 }, { "epoch": 0.69, "learning_rate": 1.1883002317928046e-06, "loss": 0.8021, "step": 36336 }, { "epoch": 0.69, "learning_rate": 1.1881701850050835e-06, "loss": 0.945, "step": 36337 }, { "epoch": 0.69, "learning_rate": 1.1880401431156949e-06, "loss": 1.0408, "step": 36338 }, { "epoch": 0.69, "learning_rate": 1.1879101061251238e-06, "loss": 0.8774, "step": 36339 }, { "epoch": 0.69, "learning_rate": 1.1877800740338574e-06, "loss": 0.8506, "step": 36340 }, { "epoch": 0.69, "learning_rate": 1.187650046842378e-06, "loss": 0.7726, "step": 36341 }, { "epoch": 0.69, "learning_rate": 1.1875200245511748e-06, "loss": 0.9362, "step": 36342 }, { "epoch": 0.69, "learning_rate": 1.1873900071607306e-06, "loss": 0.8923, "step": 36343 }, { "epoch": 0.69, "learning_rate": 1.1872599946715322e-06, "loss": 1.0312, "step": 36344 }, { "epoch": 0.69, "learning_rate": 1.1871299870840645e-06, "loss": 0.7753, "step": 36345 }, { "epoch": 0.69, "learning_rate": 1.1869999843988132e-06, "loss": 0.6382, "step": 36346 }, { "epoch": 0.69, "learning_rate": 1.1868699866162637e-06, "loss": 0.9549, "step": 36347 }, { "epoch": 0.69, "learning_rate": 1.1867399937369014e-06, "loss": 0.8273, "step": 36348 }, { "epoch": 0.69, "learning_rate": 1.1866100057612126e-06, "loss": 0.9459, "step": 36349 }, { "epoch": 0.69, "learning_rate": 1.18648002268968e-06, "loss": 1.1289, "step": 36350 }, { "epoch": 0.69, "learning_rate": 1.186350044522792e-06, "loss": 0.9603, "step": 36351 }, { "epoch": 0.69, "learning_rate": 1.1862200712610331e-06, "loss": 0.8962, "step": 36352 }, { "epoch": 0.69, "learning_rate": 1.1860901029048862e-06, "loss": 1.0266, "step": 36353 }, { "epoch": 0.69, "learning_rate": 1.1859601394548407e-06, "loss": 0.9373, "step": 36354 }, { "epoch": 0.69, "learning_rate": 1.1858301809113786e-06, "loss": 1.0415, "step": 36355 }, { "epoch": 0.69, "learning_rate": 1.1857002272749867e-06, "loss": 1.0804, "step": 36356 }, { "epoch": 0.69, "learning_rate": 1.1855702785461496e-06, "loss": 0.974, "step": 36357 }, { "epoch": 0.69, "learning_rate": 1.185440334725353e-06, "loss": 0.9715, "step": 36358 }, { "epoch": 0.69, "learning_rate": 1.1853103958130816e-06, "loss": 1.0157, "step": 36359 }, { "epoch": 0.69, "learning_rate": 1.185180461809821e-06, "loss": 0.7668, "step": 36360 }, { "epoch": 0.69, "learning_rate": 1.185050532716057e-06, "loss": 0.9975, "step": 36361 }, { "epoch": 0.69, "learning_rate": 1.1849206085322724e-06, "loss": 0.8596, "step": 36362 }, { "epoch": 0.69, "learning_rate": 1.1847906892589556e-06, "loss": 0.9006, "step": 36363 }, { "epoch": 0.69, "learning_rate": 1.1846607748965891e-06, "loss": 0.9521, "step": 36364 }, { "epoch": 0.69, "learning_rate": 1.184530865445659e-06, "loss": 0.9211, "step": 36365 }, { "epoch": 0.69, "learning_rate": 1.1844009609066504e-06, "loss": 1.0128, "step": 36366 }, { "epoch": 0.69, "learning_rate": 1.1842710612800481e-06, "loss": 1.163, "step": 36367 }, { "epoch": 0.69, "learning_rate": 1.1841411665663377e-06, "loss": 1.0887, "step": 36368 }, { "epoch": 0.69, "learning_rate": 1.1840112767660033e-06, "loss": 0.7089, "step": 36369 }, { "epoch": 0.69, "learning_rate": 1.1838813918795316e-06, "loss": 0.7475, "step": 36370 }, { "epoch": 0.69, "learning_rate": 1.1837515119074048e-06, "loss": 0.9221, "step": 36371 }, { "epoch": 0.69, "learning_rate": 1.1836216368501101e-06, "loss": 0.7983, "step": 36372 }, { "epoch": 0.69, "learning_rate": 1.183491766708133e-06, "loss": 0.9681, "step": 36373 }, { "epoch": 0.69, "learning_rate": 1.1833619014819553e-06, "loss": 1.009, "step": 36374 }, { "epoch": 0.69, "learning_rate": 1.1832320411720657e-06, "loss": 0.9542, "step": 36375 }, { "epoch": 0.69, "learning_rate": 1.1831021857789465e-06, "loss": 0.883, "step": 36376 }, { "epoch": 0.69, "learning_rate": 1.1829723353030833e-06, "loss": 1.019, "step": 36377 }, { "epoch": 0.69, "learning_rate": 1.182842489744961e-06, "loss": 0.8934, "step": 36378 }, { "epoch": 0.69, "learning_rate": 1.1827126491050644e-06, "loss": 0.8466, "step": 36379 }, { "epoch": 0.69, "learning_rate": 1.1825828133838784e-06, "loss": 0.947, "step": 36380 }, { "epoch": 0.69, "learning_rate": 1.1824529825818882e-06, "loss": 1.1895, "step": 36381 }, { "epoch": 0.69, "learning_rate": 1.1823231566995785e-06, "loss": 0.8732, "step": 36382 }, { "epoch": 0.69, "learning_rate": 1.1821933357374321e-06, "loss": 0.8886, "step": 36383 }, { "epoch": 0.69, "learning_rate": 1.1820635196959373e-06, "loss": 0.7721, "step": 36384 }, { "epoch": 0.69, "learning_rate": 1.1819337085755758e-06, "loss": 0.8153, "step": 36385 }, { "epoch": 0.69, "learning_rate": 1.1818039023768338e-06, "loss": 0.8329, "step": 36386 }, { "epoch": 0.69, "learning_rate": 1.1816741011001953e-06, "loss": 0.9089, "step": 36387 }, { "epoch": 0.69, "learning_rate": 1.1815443047461452e-06, "loss": 1.1666, "step": 36388 }, { "epoch": 0.69, "learning_rate": 1.1814145133151683e-06, "loss": 0.8972, "step": 36389 }, { "epoch": 0.69, "learning_rate": 1.1812847268077494e-06, "loss": 0.7162, "step": 36390 }, { "epoch": 0.69, "learning_rate": 1.1811549452243737e-06, "loss": 0.7828, "step": 36391 }, { "epoch": 0.69, "learning_rate": 1.181025168565523e-06, "loss": 0.9023, "step": 36392 }, { "epoch": 0.69, "learning_rate": 1.180895396831685e-06, "loss": 0.8913, "step": 36393 }, { "epoch": 0.69, "learning_rate": 1.180765630023344e-06, "loss": 1.0089, "step": 36394 }, { "epoch": 0.69, "learning_rate": 1.180635868140982e-06, "loss": 0.944, "step": 36395 }, { "epoch": 0.69, "learning_rate": 1.1805061111850869e-06, "loss": 0.8836, "step": 36396 }, { "epoch": 0.69, "learning_rate": 1.1803763591561404e-06, "loss": 0.8779, "step": 36397 }, { "epoch": 0.69, "learning_rate": 1.1802466120546286e-06, "loss": 0.8491, "step": 36398 }, { "epoch": 0.69, "learning_rate": 1.180116869881035e-06, "loss": 0.9598, "step": 36399 }, { "epoch": 0.69, "learning_rate": 1.1799871326358448e-06, "loss": 1.2478, "step": 36400 }, { "epoch": 0.69, "learning_rate": 1.179857400319542e-06, "loss": 0.8607, "step": 36401 }, { "epoch": 0.69, "learning_rate": 1.1797276729326116e-06, "loss": 0.7886, "step": 36402 }, { "epoch": 0.69, "learning_rate": 1.1795979504755381e-06, "loss": 1.0587, "step": 36403 }, { "epoch": 0.69, "learning_rate": 1.1794682329488036e-06, "loss": 0.8831, "step": 36404 }, { "epoch": 0.69, "learning_rate": 1.1793385203528962e-06, "loss": 1.0356, "step": 36405 }, { "epoch": 0.69, "learning_rate": 1.1792088126882971e-06, "loss": 0.9735, "step": 36406 }, { "epoch": 0.69, "learning_rate": 1.1790791099554921e-06, "loss": 1.0741, "step": 36407 }, { "epoch": 0.69, "learning_rate": 1.178949412154965e-06, "loss": 0.9399, "step": 36408 }, { "epoch": 0.69, "learning_rate": 1.1788197192872004e-06, "loss": 0.9355, "step": 36409 }, { "epoch": 0.69, "learning_rate": 1.1786900313526825e-06, "loss": 0.8706, "step": 36410 }, { "epoch": 0.69, "learning_rate": 1.1785603483518954e-06, "loss": 0.8296, "step": 36411 }, { "epoch": 0.69, "learning_rate": 1.1784306702853244e-06, "loss": 0.9163, "step": 36412 }, { "epoch": 0.69, "learning_rate": 1.178300997153451e-06, "loss": 0.9298, "step": 36413 }, { "epoch": 0.69, "learning_rate": 1.1781713289567618e-06, "loss": 0.8554, "step": 36414 }, { "epoch": 0.69, "learning_rate": 1.1780416656957413e-06, "loss": 0.8573, "step": 36415 }, { "epoch": 0.69, "learning_rate": 1.177912007370871e-06, "loss": 0.9269, "step": 36416 }, { "epoch": 0.69, "learning_rate": 1.1777823539826385e-06, "loss": 0.8997, "step": 36417 }, { "epoch": 0.69, "learning_rate": 1.1776527055315255e-06, "loss": 1.2917, "step": 36418 }, { "epoch": 0.69, "learning_rate": 1.1775230620180164e-06, "loss": 0.9888, "step": 36419 }, { "epoch": 0.69, "learning_rate": 1.177393423442596e-06, "loss": 1.0183, "step": 36420 }, { "epoch": 0.69, "learning_rate": 1.1772637898057477e-06, "loss": 0.8588, "step": 36421 }, { "epoch": 0.69, "learning_rate": 1.177134161107956e-06, "loss": 0.7172, "step": 36422 }, { "epoch": 0.69, "learning_rate": 1.1770045373497047e-06, "loss": 0.7256, "step": 36423 }, { "epoch": 0.69, "learning_rate": 1.1768749185314786e-06, "loss": 0.9163, "step": 36424 }, { "epoch": 0.69, "learning_rate": 1.1767453046537594e-06, "loss": 1.1161, "step": 36425 }, { "epoch": 0.69, "learning_rate": 1.1766156957170347e-06, "loss": 0.89, "step": 36426 }, { "epoch": 0.69, "learning_rate": 1.1764860917217853e-06, "loss": 0.8218, "step": 36427 }, { "epoch": 0.69, "learning_rate": 1.1763564926684962e-06, "loss": 0.8375, "step": 36428 }, { "epoch": 0.69, "learning_rate": 1.1762268985576514e-06, "loss": 0.7328, "step": 36429 }, { "epoch": 0.69, "learning_rate": 1.1760973093897346e-06, "loss": 0.8746, "step": 36430 }, { "epoch": 0.69, "learning_rate": 1.1759677251652303e-06, "loss": 1.1641, "step": 36431 }, { "epoch": 0.69, "learning_rate": 1.1758381458846213e-06, "loss": 1.1185, "step": 36432 }, { "epoch": 0.69, "learning_rate": 1.1757085715483934e-06, "loss": 0.821, "step": 36433 }, { "epoch": 0.69, "learning_rate": 1.175579002157027e-06, "loss": 0.7701, "step": 36434 }, { "epoch": 0.69, "learning_rate": 1.1754494377110093e-06, "loss": 0.9314, "step": 36435 }, { "epoch": 0.69, "learning_rate": 1.1753198782108236e-06, "loss": 0.8839, "step": 36436 }, { "epoch": 0.69, "learning_rate": 1.1751903236569508e-06, "loss": 1.0355, "step": 36437 }, { "epoch": 0.69, "learning_rate": 1.1750607740498788e-06, "loss": 1.0093, "step": 36438 }, { "epoch": 0.69, "learning_rate": 1.174931229390088e-06, "loss": 0.8499, "step": 36439 }, { "epoch": 0.69, "learning_rate": 1.1748016896780637e-06, "loss": 0.8924, "step": 36440 }, { "epoch": 0.69, "learning_rate": 1.1746721549142892e-06, "loss": 0.9626, "step": 36441 }, { "epoch": 0.69, "learning_rate": 1.1745426250992482e-06, "loss": 0.8442, "step": 36442 }, { "epoch": 0.69, "learning_rate": 1.174413100233424e-06, "loss": 1.0461, "step": 36443 }, { "epoch": 0.69, "learning_rate": 1.1742835803173012e-06, "loss": 1.0186, "step": 36444 }, { "epoch": 0.69, "learning_rate": 1.1741540653513637e-06, "loss": 0.805, "step": 36445 }, { "epoch": 0.69, "learning_rate": 1.174024555336092e-06, "loss": 0.8389, "step": 36446 }, { "epoch": 0.69, "learning_rate": 1.1738950502719742e-06, "loss": 0.8192, "step": 36447 }, { "epoch": 0.69, "learning_rate": 1.1737655501594909e-06, "loss": 0.7737, "step": 36448 }, { "epoch": 0.69, "learning_rate": 1.173636054999126e-06, "loss": 1.0602, "step": 36449 }, { "epoch": 0.69, "learning_rate": 1.1735065647913636e-06, "loss": 1.0327, "step": 36450 }, { "epoch": 0.69, "learning_rate": 1.1733770795366867e-06, "loss": 0.8098, "step": 36451 }, { "epoch": 0.69, "learning_rate": 1.1732475992355794e-06, "loss": 0.7371, "step": 36452 }, { "epoch": 0.69, "learning_rate": 1.1731181238885247e-06, "loss": 0.9695, "step": 36453 }, { "epoch": 0.69, "learning_rate": 1.1729886534960073e-06, "loss": 0.9291, "step": 36454 }, { "epoch": 0.69, "learning_rate": 1.1728591880585077e-06, "loss": 0.7958, "step": 36455 }, { "epoch": 0.69, "learning_rate": 1.172729727576512e-06, "loss": 1.1616, "step": 36456 }, { "epoch": 0.69, "learning_rate": 1.1726002720505038e-06, "loss": 0.926, "step": 36457 }, { "epoch": 0.69, "learning_rate": 1.1724708214809639e-06, "loss": 0.8226, "step": 36458 }, { "epoch": 0.69, "learning_rate": 1.1723413758683789e-06, "loss": 1.0691, "step": 36459 }, { "epoch": 0.69, "learning_rate": 1.1722119352132295e-06, "loss": 0.6876, "step": 36460 }, { "epoch": 0.69, "learning_rate": 1.1720824995159999e-06, "loss": 0.9063, "step": 36461 }, { "epoch": 0.69, "learning_rate": 1.1719530687771739e-06, "loss": 1.1976, "step": 36462 }, { "epoch": 0.69, "learning_rate": 1.171823642997234e-06, "loss": 1.0875, "step": 36463 }, { "epoch": 0.69, "learning_rate": 1.1716942221766641e-06, "loss": 0.9107, "step": 36464 }, { "epoch": 0.69, "learning_rate": 1.1715648063159475e-06, "loss": 0.8095, "step": 36465 }, { "epoch": 0.69, "learning_rate": 1.1714353954155678e-06, "loss": 0.9263, "step": 36466 }, { "epoch": 0.69, "learning_rate": 1.171305989476006e-06, "loss": 0.8221, "step": 36467 }, { "epoch": 0.69, "learning_rate": 1.1711765884977486e-06, "loss": 0.8266, "step": 36468 }, { "epoch": 0.69, "learning_rate": 1.171047192481276e-06, "loss": 1.0511, "step": 36469 }, { "epoch": 0.69, "learning_rate": 1.1709178014270725e-06, "loss": 1.0092, "step": 36470 }, { "epoch": 0.69, "learning_rate": 1.1707884153356214e-06, "loss": 0.9387, "step": 36471 }, { "epoch": 0.69, "learning_rate": 1.1706590342074052e-06, "loss": 0.9079, "step": 36472 }, { "epoch": 0.69, "learning_rate": 1.1705296580429076e-06, "loss": 0.8201, "step": 36473 }, { "epoch": 0.69, "learning_rate": 1.1704002868426117e-06, "loss": 0.8823, "step": 36474 }, { "epoch": 0.69, "learning_rate": 1.1702709206070012e-06, "loss": 0.9958, "step": 36475 }, { "epoch": 0.69, "learning_rate": 1.1701415593365564e-06, "loss": 0.8011, "step": 36476 }, { "epoch": 0.69, "learning_rate": 1.1700122030317632e-06, "loss": 0.9463, "step": 36477 }, { "epoch": 0.69, "learning_rate": 1.1698828516931044e-06, "loss": 0.8562, "step": 36478 }, { "epoch": 0.69, "learning_rate": 1.1697535053210607e-06, "loss": 1.084, "step": 36479 }, { "epoch": 0.69, "learning_rate": 1.1696241639161183e-06, "loss": 1.1424, "step": 36480 }, { "epoch": 0.69, "learning_rate": 1.1694948274787574e-06, "loss": 0.8612, "step": 36481 }, { "epoch": 0.69, "learning_rate": 1.1693654960094622e-06, "loss": 0.9542, "step": 36482 }, { "epoch": 0.69, "learning_rate": 1.1692361695087155e-06, "loss": 0.8822, "step": 36483 }, { "epoch": 0.69, "learning_rate": 1.1691068479770001e-06, "loss": 0.7681, "step": 36484 }, { "epoch": 0.69, "learning_rate": 1.1689775314147989e-06, "loss": 0.9694, "step": 36485 }, { "epoch": 0.69, "learning_rate": 1.1688482198225948e-06, "loss": 0.8651, "step": 36486 }, { "epoch": 0.69, "learning_rate": 1.1687189132008716e-06, "loss": 1.1431, "step": 36487 }, { "epoch": 0.69, "learning_rate": 1.1685896115501092e-06, "loss": 0.9517, "step": 36488 }, { "epoch": 0.69, "learning_rate": 1.1684603148707943e-06, "loss": 0.886, "step": 36489 }, { "epoch": 0.69, "learning_rate": 1.1683310231634067e-06, "loss": 0.898, "step": 36490 }, { "epoch": 0.69, "learning_rate": 1.1682017364284295e-06, "loss": 0.9157, "step": 36491 }, { "epoch": 0.69, "learning_rate": 1.168072454666348e-06, "loss": 0.9934, "step": 36492 }, { "epoch": 0.69, "learning_rate": 1.167943177877642e-06, "loss": 0.8494, "step": 36493 }, { "epoch": 0.69, "learning_rate": 1.1678139060627955e-06, "loss": 0.9557, "step": 36494 }, { "epoch": 0.69, "learning_rate": 1.167684639222291e-06, "loss": 0.8626, "step": 36495 }, { "epoch": 0.69, "learning_rate": 1.1675553773566111e-06, "loss": 0.8965, "step": 36496 }, { "epoch": 0.69, "learning_rate": 1.1674261204662388e-06, "loss": 0.9366, "step": 36497 }, { "epoch": 0.69, "learning_rate": 1.1672968685516564e-06, "loss": 0.831, "step": 36498 }, { "epoch": 0.69, "learning_rate": 1.1671676216133476e-06, "loss": 1.0008, "step": 36499 }, { "epoch": 0.69, "learning_rate": 1.167038379651792e-06, "loss": 1.2711, "step": 36500 }, { "epoch": 0.69, "learning_rate": 1.166909142667476e-06, "loss": 1.0092, "step": 36501 }, { "epoch": 0.69, "learning_rate": 1.1667799106608798e-06, "loss": 0.8409, "step": 36502 }, { "epoch": 0.69, "learning_rate": 1.1666506836324864e-06, "loss": 0.8601, "step": 36503 }, { "epoch": 0.69, "learning_rate": 1.1665214615827786e-06, "loss": 0.6704, "step": 36504 }, { "epoch": 0.69, "learning_rate": 1.1663922445122385e-06, "loss": 0.9747, "step": 36505 }, { "epoch": 0.69, "learning_rate": 1.1662630324213492e-06, "loss": 0.9837, "step": 36506 }, { "epoch": 0.69, "learning_rate": 1.1661338253105925e-06, "loss": 0.8641, "step": 36507 }, { "epoch": 0.69, "learning_rate": 1.1660046231804522e-06, "loss": 0.7696, "step": 36508 }, { "epoch": 0.69, "learning_rate": 1.1658754260314081e-06, "loss": 0.9049, "step": 36509 }, { "epoch": 0.69, "learning_rate": 1.1657462338639459e-06, "loss": 0.9225, "step": 36510 }, { "epoch": 0.69, "learning_rate": 1.1656170466785455e-06, "loss": 0.9617, "step": 36511 }, { "epoch": 0.69, "learning_rate": 1.1654878644756892e-06, "loss": 0.9875, "step": 36512 }, { "epoch": 0.69, "learning_rate": 1.1653586872558622e-06, "loss": 0.868, "step": 36513 }, { "epoch": 0.69, "learning_rate": 1.165229515019544e-06, "loss": 0.8843, "step": 36514 }, { "epoch": 0.69, "learning_rate": 1.1651003477672176e-06, "loss": 0.7462, "step": 36515 }, { "epoch": 0.69, "learning_rate": 1.164971185499366e-06, "loss": 1.0317, "step": 36516 }, { "epoch": 0.69, "learning_rate": 1.1648420282164707e-06, "loss": 0.8842, "step": 36517 }, { "epoch": 0.69, "learning_rate": 1.1647128759190147e-06, "loss": 1.0473, "step": 36518 }, { "epoch": 0.69, "learning_rate": 1.1645837286074796e-06, "loss": 0.9677, "step": 36519 }, { "epoch": 0.69, "learning_rate": 1.164454586282349e-06, "loss": 0.9396, "step": 36520 }, { "epoch": 0.69, "learning_rate": 1.1643254489441019e-06, "loss": 0.7138, "step": 36521 }, { "epoch": 0.69, "learning_rate": 1.1641963165932246e-06, "loss": 0.8138, "step": 36522 }, { "epoch": 0.69, "learning_rate": 1.1640671892301965e-06, "loss": 0.8955, "step": 36523 }, { "epoch": 0.69, "learning_rate": 1.1639380668555005e-06, "loss": 1.0519, "step": 36524 }, { "epoch": 0.69, "learning_rate": 1.163808949469619e-06, "loss": 1.1088, "step": 36525 }, { "epoch": 0.69, "learning_rate": 1.1636798370730335e-06, "loss": 1.0311, "step": 36526 }, { "epoch": 0.69, "learning_rate": 1.1635507296662268e-06, "loss": 1.1107, "step": 36527 }, { "epoch": 0.69, "learning_rate": 1.1634216272496807e-06, "loss": 0.8226, "step": 36528 }, { "epoch": 0.69, "learning_rate": 1.1632925298238779e-06, "loss": 0.8887, "step": 36529 }, { "epoch": 0.69, "learning_rate": 1.163163437389299e-06, "loss": 0.9042, "step": 36530 }, { "epoch": 0.69, "learning_rate": 1.1630343499464269e-06, "loss": 1.1144, "step": 36531 }, { "epoch": 0.69, "learning_rate": 1.1629052674957437e-06, "loss": 0.7454, "step": 36532 }, { "epoch": 0.69, "learning_rate": 1.162776190037731e-06, "loss": 0.8665, "step": 36533 }, { "epoch": 0.69, "learning_rate": 1.1626471175728713e-06, "loss": 0.8345, "step": 36534 }, { "epoch": 0.69, "learning_rate": 1.1625180501016458e-06, "loss": 0.8751, "step": 36535 }, { "epoch": 0.69, "learning_rate": 1.1623889876245384e-06, "loss": 0.8191, "step": 36536 }, { "epoch": 0.69, "learning_rate": 1.1622599301420273e-06, "loss": 0.8925, "step": 36537 }, { "epoch": 0.69, "learning_rate": 1.1621308776545976e-06, "loss": 0.9517, "step": 36538 }, { "epoch": 0.69, "learning_rate": 1.1620018301627308e-06, "loss": 0.9412, "step": 36539 }, { "epoch": 0.69, "learning_rate": 1.1618727876669066e-06, "loss": 0.8835, "step": 36540 }, { "epoch": 0.69, "learning_rate": 1.1617437501676104e-06, "loss": 0.8881, "step": 36541 }, { "epoch": 0.69, "learning_rate": 1.1616147176653208e-06, "loss": 0.6802, "step": 36542 }, { "epoch": 0.69, "learning_rate": 1.161485690160521e-06, "loss": 1.136, "step": 36543 }, { "epoch": 0.69, "learning_rate": 1.1613566676536924e-06, "loss": 0.8566, "step": 36544 }, { "epoch": 0.69, "learning_rate": 1.1612276501453171e-06, "loss": 0.9205, "step": 36545 }, { "epoch": 0.69, "learning_rate": 1.1610986376358765e-06, "loss": 0.8401, "step": 36546 }, { "epoch": 0.69, "learning_rate": 1.1609696301258527e-06, "loss": 0.7688, "step": 36547 }, { "epoch": 0.69, "learning_rate": 1.1608406276157282e-06, "loss": 0.7129, "step": 36548 }, { "epoch": 0.69, "learning_rate": 1.1607116301059818e-06, "loss": 0.9384, "step": 36549 }, { "epoch": 0.69, "learning_rate": 1.1605826375970991e-06, "loss": 0.9785, "step": 36550 }, { "epoch": 0.69, "learning_rate": 1.1604536500895586e-06, "loss": 0.933, "step": 36551 }, { "epoch": 0.69, "learning_rate": 1.1603246675838434e-06, "loss": 0.7791, "step": 36552 }, { "epoch": 0.69, "learning_rate": 1.1601956900804346e-06, "loss": 0.8116, "step": 36553 }, { "epoch": 0.69, "learning_rate": 1.1600667175798142e-06, "loss": 0.7772, "step": 36554 }, { "epoch": 0.69, "learning_rate": 1.1599377500824631e-06, "loss": 1.0933, "step": 36555 }, { "epoch": 0.69, "learning_rate": 1.159808787588864e-06, "loss": 1.0621, "step": 36556 }, { "epoch": 0.69, "learning_rate": 1.1596798300994982e-06, "loss": 0.8926, "step": 36557 }, { "epoch": 0.69, "learning_rate": 1.1595508776148454e-06, "loss": 0.7648, "step": 36558 }, { "epoch": 0.69, "learning_rate": 1.1594219301353893e-06, "loss": 0.844, "step": 36559 }, { "epoch": 0.69, "learning_rate": 1.1592929876616112e-06, "loss": 0.6156, "step": 36560 }, { "epoch": 0.69, "learning_rate": 1.1591640501939908e-06, "loss": 0.9952, "step": 36561 }, { "epoch": 0.69, "learning_rate": 1.159035117733012e-06, "loss": 1.0161, "step": 36562 }, { "epoch": 0.69, "learning_rate": 1.1589061902791544e-06, "loss": 0.9014, "step": 36563 }, { "epoch": 0.69, "learning_rate": 1.1587772678328996e-06, "loss": 0.8086, "step": 36564 }, { "epoch": 0.69, "learning_rate": 1.1586483503947297e-06, "loss": 0.9413, "step": 36565 }, { "epoch": 0.69, "learning_rate": 1.1585194379651255e-06, "loss": 0.8962, "step": 36566 }, { "epoch": 0.69, "learning_rate": 1.1583905305445687e-06, "loss": 0.8044, "step": 36567 }, { "epoch": 0.69, "learning_rate": 1.1582616281335404e-06, "loss": 0.959, "step": 36568 }, { "epoch": 0.69, "learning_rate": 1.1581327307325229e-06, "loss": 1.1655, "step": 36569 }, { "epoch": 0.69, "learning_rate": 1.158003838341995e-06, "loss": 0.9402, "step": 36570 }, { "epoch": 0.69, "learning_rate": 1.1578749509624415e-06, "loss": 1.0253, "step": 36571 }, { "epoch": 0.69, "learning_rate": 1.157746068594341e-06, "loss": 0.9044, "step": 36572 }, { "epoch": 0.69, "learning_rate": 1.157617191238175e-06, "loss": 0.8575, "step": 36573 }, { "epoch": 0.69, "learning_rate": 1.1574883188944258e-06, "loss": 0.9149, "step": 36574 }, { "epoch": 0.69, "learning_rate": 1.1573594515635737e-06, "loss": 0.8034, "step": 36575 }, { "epoch": 0.69, "learning_rate": 1.1572305892461004e-06, "loss": 0.9977, "step": 36576 }, { "epoch": 0.69, "learning_rate": 1.1571017319424867e-06, "loss": 0.925, "step": 36577 }, { "epoch": 0.69, "learning_rate": 1.1569728796532152e-06, "loss": 0.8174, "step": 36578 }, { "epoch": 0.69, "learning_rate": 1.1568440323787638e-06, "loss": 0.6996, "step": 36579 }, { "epoch": 0.69, "learning_rate": 1.1567151901196164e-06, "loss": 0.9375, "step": 36580 }, { "epoch": 0.69, "learning_rate": 1.1565863528762544e-06, "loss": 1.0045, "step": 36581 }, { "epoch": 0.69, "learning_rate": 1.1564575206491558e-06, "loss": 0.9562, "step": 36582 }, { "epoch": 0.69, "learning_rate": 1.1563286934388057e-06, "loss": 0.6805, "step": 36583 }, { "epoch": 0.69, "learning_rate": 1.1561998712456818e-06, "loss": 0.8872, "step": 36584 }, { "epoch": 0.69, "learning_rate": 1.1560710540702665e-06, "loss": 0.9902, "step": 36585 }, { "epoch": 0.69, "learning_rate": 1.1559422419130408e-06, "loss": 0.8878, "step": 36586 }, { "epoch": 0.69, "learning_rate": 1.1558134347744855e-06, "loss": 1.1321, "step": 36587 }, { "epoch": 0.69, "learning_rate": 1.1556846326550817e-06, "loss": 1.0229, "step": 36588 }, { "epoch": 0.69, "learning_rate": 1.1555558355553101e-06, "loss": 1.0449, "step": 36589 }, { "epoch": 0.69, "learning_rate": 1.1554270434756526e-06, "loss": 0.7906, "step": 36590 }, { "epoch": 0.69, "learning_rate": 1.1552982564165877e-06, "loss": 0.7867, "step": 36591 }, { "epoch": 0.69, "learning_rate": 1.1551694743785996e-06, "loss": 0.9079, "step": 36592 }, { "epoch": 0.69, "learning_rate": 1.1550406973621666e-06, "loss": 1.0347, "step": 36593 }, { "epoch": 0.69, "learning_rate": 1.1549119253677704e-06, "loss": 0.9361, "step": 36594 }, { "epoch": 0.69, "learning_rate": 1.1547831583958918e-06, "loss": 0.9016, "step": 36595 }, { "epoch": 0.69, "learning_rate": 1.1546543964470116e-06, "loss": 0.8684, "step": 36596 }, { "epoch": 0.69, "learning_rate": 1.1545256395216106e-06, "loss": 0.8584, "step": 36597 }, { "epoch": 0.69, "learning_rate": 1.1543968876201697e-06, "loss": 0.8862, "step": 36598 }, { "epoch": 0.69, "learning_rate": 1.1542681407431706e-06, "loss": 0.7816, "step": 36599 }, { "epoch": 0.69, "learning_rate": 1.154139398891091e-06, "loss": 0.9738, "step": 36600 }, { "epoch": 0.69, "learning_rate": 1.1540106620644145e-06, "loss": 0.7564, "step": 36601 }, { "epoch": 0.69, "learning_rate": 1.153881930263622e-06, "loss": 0.827, "step": 36602 }, { "epoch": 0.69, "learning_rate": 1.1537532034891912e-06, "loss": 1.1174, "step": 36603 }, { "epoch": 0.69, "learning_rate": 1.1536244817416064e-06, "loss": 0.8671, "step": 36604 }, { "epoch": 0.69, "learning_rate": 1.1534957650213457e-06, "loss": 0.86, "step": 36605 }, { "epoch": 0.69, "learning_rate": 1.1533670533288905e-06, "loss": 1.0546, "step": 36606 }, { "epoch": 0.69, "learning_rate": 1.1532383466647216e-06, "loss": 0.9654, "step": 36607 }, { "epoch": 0.69, "learning_rate": 1.1531096450293192e-06, "loss": 0.8296, "step": 36608 }, { "epoch": 0.69, "learning_rate": 1.152980948423164e-06, "loss": 1.0988, "step": 36609 }, { "epoch": 0.69, "learning_rate": 1.1528522568467367e-06, "loss": 0.7602, "step": 36610 }, { "epoch": 0.69, "learning_rate": 1.1527235703005188e-06, "loss": 0.8516, "step": 36611 }, { "epoch": 0.69, "learning_rate": 1.152594888784988e-06, "loss": 0.8582, "step": 36612 }, { "epoch": 0.69, "learning_rate": 1.1524662123006283e-06, "loss": 0.7909, "step": 36613 }, { "epoch": 0.69, "learning_rate": 1.1523375408479172e-06, "loss": 0.7955, "step": 36614 }, { "epoch": 0.69, "learning_rate": 1.1522088744273368e-06, "loss": 0.817, "step": 36615 }, { "epoch": 0.69, "learning_rate": 1.1520802130393674e-06, "loss": 0.9288, "step": 36616 }, { "epoch": 0.69, "learning_rate": 1.1519515566844888e-06, "loss": 0.9415, "step": 36617 }, { "epoch": 0.69, "learning_rate": 1.1518229053631816e-06, "loss": 1.074, "step": 36618 }, { "epoch": 0.69, "learning_rate": 1.1516942590759267e-06, "loss": 1.1081, "step": 36619 }, { "epoch": 0.69, "learning_rate": 1.1515656178232049e-06, "loss": 0.9384, "step": 36620 }, { "epoch": 0.69, "learning_rate": 1.1514369816054938e-06, "loss": 0.8959, "step": 36621 }, { "epoch": 0.69, "learning_rate": 1.1513083504232764e-06, "loss": 0.9836, "step": 36622 }, { "epoch": 0.69, "learning_rate": 1.1511797242770336e-06, "loss": 0.8978, "step": 36623 }, { "epoch": 0.69, "learning_rate": 1.1510511031672423e-06, "loss": 0.9083, "step": 36624 }, { "epoch": 0.69, "learning_rate": 1.1509224870943866e-06, "loss": 0.9476, "step": 36625 }, { "epoch": 0.69, "learning_rate": 1.150793876058944e-06, "loss": 1.0057, "step": 36626 }, { "epoch": 0.69, "learning_rate": 1.150665270061396e-06, "loss": 0.7246, "step": 36627 }, { "epoch": 0.69, "learning_rate": 1.1505366691022224e-06, "loss": 0.9796, "step": 36628 }, { "epoch": 0.69, "learning_rate": 1.1504080731819035e-06, "loss": 0.955, "step": 36629 }, { "epoch": 0.69, "learning_rate": 1.1502794823009192e-06, "loss": 0.8804, "step": 36630 }, { "epoch": 0.69, "learning_rate": 1.1501508964597502e-06, "loss": 1.0047, "step": 36631 }, { "epoch": 0.69, "learning_rate": 1.1500223156588774e-06, "loss": 1.1735, "step": 36632 }, { "epoch": 0.69, "learning_rate": 1.1498937398987778e-06, "loss": 0.9299, "step": 36633 }, { "epoch": 0.69, "learning_rate": 1.1497651691799356e-06, "loss": 0.9323, "step": 36634 }, { "epoch": 0.69, "learning_rate": 1.1496366035028278e-06, "loss": 0.8267, "step": 36635 }, { "epoch": 0.69, "learning_rate": 1.1495080428679355e-06, "loss": 0.863, "step": 36636 }, { "epoch": 0.69, "learning_rate": 1.1493794872757388e-06, "loss": 1.001, "step": 36637 }, { "epoch": 0.69, "learning_rate": 1.1492509367267177e-06, "loss": 0.9829, "step": 36638 }, { "epoch": 0.69, "learning_rate": 1.1491223912213523e-06, "loss": 0.7568, "step": 36639 }, { "epoch": 0.69, "learning_rate": 1.1489938507601223e-06, "loss": 0.6754, "step": 36640 }, { "epoch": 0.69, "learning_rate": 1.1488653153435087e-06, "loss": 0.9146, "step": 36641 }, { "epoch": 0.69, "learning_rate": 1.1487367849719889e-06, "loss": 0.7567, "step": 36642 }, { "epoch": 0.69, "learning_rate": 1.1486082596460455e-06, "loss": 1.0358, "step": 36643 }, { "epoch": 0.69, "learning_rate": 1.1484797393661581e-06, "loss": 0.9177, "step": 36644 }, { "epoch": 0.69, "learning_rate": 1.1483512241328044e-06, "loss": 0.953, "step": 36645 }, { "epoch": 0.69, "learning_rate": 1.1482227139464674e-06, "loss": 0.6848, "step": 36646 }, { "epoch": 0.69, "learning_rate": 1.1480942088076243e-06, "loss": 0.9659, "step": 36647 }, { "epoch": 0.69, "learning_rate": 1.147965708716756e-06, "loss": 0.7372, "step": 36648 }, { "epoch": 0.69, "learning_rate": 1.1478372136743427e-06, "loss": 0.9624, "step": 36649 }, { "epoch": 0.69, "learning_rate": 1.1477087236808635e-06, "loss": 1.0142, "step": 36650 }, { "epoch": 0.69, "learning_rate": 1.1475802387367985e-06, "loss": 0.9653, "step": 36651 }, { "epoch": 0.69, "learning_rate": 1.1474517588426273e-06, "loss": 0.7517, "step": 36652 }, { "epoch": 0.69, "learning_rate": 1.1473232839988307e-06, "loss": 0.7384, "step": 36653 }, { "epoch": 0.69, "learning_rate": 1.1471948142058858e-06, "loss": 0.9028, "step": 36654 }, { "epoch": 0.69, "learning_rate": 1.147066349464276e-06, "loss": 0.9073, "step": 36655 }, { "epoch": 0.69, "learning_rate": 1.1469378897744777e-06, "loss": 0.9658, "step": 36656 }, { "epoch": 0.69, "learning_rate": 1.1468094351369718e-06, "loss": 1.0443, "step": 36657 }, { "epoch": 0.69, "learning_rate": 1.146680985552238e-06, "loss": 0.8334, "step": 36658 }, { "epoch": 0.69, "learning_rate": 1.1465525410207562e-06, "loss": 0.9735, "step": 36659 }, { "epoch": 0.69, "learning_rate": 1.1464241015430055e-06, "loss": 0.8193, "step": 36660 }, { "epoch": 0.69, "learning_rate": 1.1462956671194657e-06, "loss": 0.9506, "step": 36661 }, { "epoch": 0.69, "learning_rate": 1.1461672377506175e-06, "loss": 1.1313, "step": 36662 }, { "epoch": 0.69, "learning_rate": 1.146038813436937e-06, "loss": 1.0196, "step": 36663 }, { "epoch": 0.69, "learning_rate": 1.1459103941789077e-06, "loss": 0.8873, "step": 36664 }, { "epoch": 0.69, "learning_rate": 1.1457819799770079e-06, "loss": 0.8238, "step": 36665 }, { "epoch": 0.69, "learning_rate": 1.1456535708317148e-06, "loss": 0.8407, "step": 36666 }, { "epoch": 0.69, "learning_rate": 1.1455251667435117e-06, "loss": 0.9166, "step": 36667 }, { "epoch": 0.69, "learning_rate": 1.1453967677128753e-06, "loss": 1.0242, "step": 36668 }, { "epoch": 0.69, "learning_rate": 1.1452683737402856e-06, "loss": 0.851, "step": 36669 }, { "epoch": 0.69, "learning_rate": 1.1451399848262225e-06, "loss": 0.8712, "step": 36670 }, { "epoch": 0.69, "learning_rate": 1.1450116009711648e-06, "loss": 0.861, "step": 36671 }, { "epoch": 0.69, "learning_rate": 1.1448832221755926e-06, "loss": 0.9819, "step": 36672 }, { "epoch": 0.69, "learning_rate": 1.1447548484399848e-06, "loss": 0.7977, "step": 36673 }, { "epoch": 0.69, "learning_rate": 1.1446264797648215e-06, "loss": 1.003, "step": 36674 }, { "epoch": 0.69, "learning_rate": 1.1444981161505798e-06, "loss": 1.0305, "step": 36675 }, { "epoch": 0.69, "learning_rate": 1.1443697575977426e-06, "loss": 0.8955, "step": 36676 }, { "epoch": 0.69, "learning_rate": 1.144241404106786e-06, "loss": 0.8417, "step": 36677 }, { "epoch": 0.69, "learning_rate": 1.14411305567819e-06, "loss": 0.8508, "step": 36678 }, { "epoch": 0.69, "learning_rate": 1.143984712312435e-06, "loss": 1.017, "step": 36679 }, { "epoch": 0.69, "learning_rate": 1.1438563740099991e-06, "loss": 0.9604, "step": 36680 }, { "epoch": 0.69, "learning_rate": 1.1437280407713622e-06, "loss": 1.0812, "step": 36681 }, { "epoch": 0.69, "learning_rate": 1.143599712597003e-06, "loss": 0.9352, "step": 36682 }, { "epoch": 0.69, "learning_rate": 1.1434713894874016e-06, "loss": 0.7001, "step": 36683 }, { "epoch": 0.69, "learning_rate": 1.1433430714430349e-06, "loss": 0.8, "step": 36684 }, { "epoch": 0.69, "learning_rate": 1.1432147584643846e-06, "loss": 0.8267, "step": 36685 }, { "epoch": 0.69, "learning_rate": 1.1430864505519295e-06, "loss": 0.7628, "step": 36686 }, { "epoch": 0.69, "learning_rate": 1.1429581477061464e-06, "loss": 0.9192, "step": 36687 }, { "epoch": 0.69, "learning_rate": 1.1428298499275177e-06, "loss": 1.0123, "step": 36688 }, { "epoch": 0.69, "learning_rate": 1.1427015572165195e-06, "loss": 0.8753, "step": 36689 }, { "epoch": 0.69, "learning_rate": 1.142573269573632e-06, "loss": 0.9324, "step": 36690 }, { "epoch": 0.69, "learning_rate": 1.1424449869993348e-06, "loss": 0.8486, "step": 36691 }, { "epoch": 0.69, "learning_rate": 1.1423167094941063e-06, "loss": 0.8488, "step": 36692 }, { "epoch": 0.69, "learning_rate": 1.1421884370584255e-06, "loss": 0.9501, "step": 36693 }, { "epoch": 0.69, "learning_rate": 1.1420601696927714e-06, "loss": 1.3199, "step": 36694 }, { "epoch": 0.69, "learning_rate": 1.1419319073976238e-06, "loss": 0.8903, "step": 36695 }, { "epoch": 0.69, "learning_rate": 1.1418036501734591e-06, "loss": 0.777, "step": 36696 }, { "epoch": 0.69, "learning_rate": 1.1416753980207598e-06, "loss": 0.9662, "step": 36697 }, { "epoch": 0.69, "learning_rate": 1.141547150940002e-06, "loss": 0.8763, "step": 36698 }, { "epoch": 0.69, "learning_rate": 1.1414189089316655e-06, "loss": 1.075, "step": 36699 }, { "epoch": 0.69, "learning_rate": 1.1412906719962288e-06, "loss": 1.2403, "step": 36700 }, { "epoch": 0.69, "learning_rate": 1.1411624401341714e-06, "loss": 0.9355, "step": 36701 }, { "epoch": 0.69, "learning_rate": 1.1410342133459717e-06, "loss": 1.0569, "step": 36702 }, { "epoch": 0.69, "learning_rate": 1.140905991632109e-06, "loss": 0.9911, "step": 36703 }, { "epoch": 0.69, "learning_rate": 1.140777774993062e-06, "loss": 0.8532, "step": 36704 }, { "epoch": 0.69, "learning_rate": 1.1406495634293075e-06, "loss": 0.8603, "step": 36705 }, { "epoch": 0.69, "learning_rate": 1.1405213569413267e-06, "loss": 1.0193, "step": 36706 }, { "epoch": 0.69, "learning_rate": 1.1403931555295986e-06, "loss": 1.0095, "step": 36707 }, { "epoch": 0.69, "learning_rate": 1.1402649591945986e-06, "loss": 1.0398, "step": 36708 }, { "epoch": 0.69, "learning_rate": 1.1401367679368095e-06, "loss": 0.9363, "step": 36709 }, { "epoch": 0.69, "learning_rate": 1.1400085817567072e-06, "loss": 0.8381, "step": 36710 }, { "epoch": 0.69, "learning_rate": 1.1398804006547712e-06, "loss": 0.87, "step": 36711 }, { "epoch": 0.69, "learning_rate": 1.1397522246314798e-06, "loss": 1.1819, "step": 36712 }, { "epoch": 0.69, "learning_rate": 1.1396240536873121e-06, "loss": 1.0138, "step": 36713 }, { "epoch": 0.69, "learning_rate": 1.1394958878227467e-06, "loss": 0.7179, "step": 36714 }, { "epoch": 0.69, "learning_rate": 1.1393677270382617e-06, "loss": 0.9081, "step": 36715 }, { "epoch": 0.69, "learning_rate": 1.1392395713343365e-06, "loss": 0.9238, "step": 36716 }, { "epoch": 0.69, "learning_rate": 1.1391114207114475e-06, "loss": 0.7629, "step": 36717 }, { "epoch": 0.69, "learning_rate": 1.1389832751700766e-06, "loss": 1.0565, "step": 36718 }, { "epoch": 0.69, "learning_rate": 1.1388551347106997e-06, "loss": 0.7955, "step": 36719 }, { "epoch": 0.69, "learning_rate": 1.1387269993337954e-06, "loss": 0.9297, "step": 36720 }, { "epoch": 0.69, "learning_rate": 1.1385988690398434e-06, "loss": 1.0355, "step": 36721 }, { "epoch": 0.69, "learning_rate": 1.1384707438293211e-06, "loss": 0.8835, "step": 36722 }, { "epoch": 0.69, "learning_rate": 1.1383426237027073e-06, "loss": 0.8251, "step": 36723 }, { "epoch": 0.69, "learning_rate": 1.1382145086604804e-06, "loss": 0.7745, "step": 36724 }, { "epoch": 0.69, "learning_rate": 1.1380863987031199e-06, "loss": 1.3751, "step": 36725 }, { "epoch": 0.69, "learning_rate": 1.137958293831101e-06, "loss": 0.857, "step": 36726 }, { "epoch": 0.69, "learning_rate": 1.137830194044905e-06, "loss": 0.8966, "step": 36727 }, { "epoch": 0.69, "learning_rate": 1.1377020993450103e-06, "loss": 0.9392, "step": 36728 }, { "epoch": 0.69, "learning_rate": 1.1375740097318921e-06, "loss": 0.7022, "step": 36729 }, { "epoch": 0.69, "learning_rate": 1.1374459252060329e-06, "loss": 0.9947, "step": 36730 }, { "epoch": 0.69, "learning_rate": 1.137317845767908e-06, "loss": 1.0001, "step": 36731 }, { "epoch": 0.69, "learning_rate": 1.137189771417996e-06, "loss": 0.9406, "step": 36732 }, { "epoch": 0.69, "learning_rate": 1.1370617021567761e-06, "loss": 0.9797, "step": 36733 }, { "epoch": 0.69, "learning_rate": 1.136933637984726e-06, "loss": 0.7375, "step": 36734 }, { "epoch": 0.69, "learning_rate": 1.1368055789023236e-06, "loss": 0.847, "step": 36735 }, { "epoch": 0.69, "learning_rate": 1.1366775249100476e-06, "loss": 0.7606, "step": 36736 }, { "epoch": 0.69, "learning_rate": 1.1365494760083767e-06, "loss": 0.7894, "step": 36737 }, { "epoch": 0.69, "learning_rate": 1.1364214321977865e-06, "loss": 1.0309, "step": 36738 }, { "epoch": 0.69, "learning_rate": 1.1362933934787588e-06, "loss": 0.7702, "step": 36739 }, { "epoch": 0.69, "learning_rate": 1.1361653598517685e-06, "loss": 1.0005, "step": 36740 }, { "epoch": 0.69, "learning_rate": 1.1360373313172952e-06, "loss": 1.0067, "step": 36741 }, { "epoch": 0.69, "learning_rate": 1.1359093078758166e-06, "loss": 0.8696, "step": 36742 }, { "epoch": 0.69, "learning_rate": 1.1357812895278108e-06, "loss": 0.9641, "step": 36743 }, { "epoch": 0.69, "learning_rate": 1.135653276273756e-06, "loss": 1.1749, "step": 36744 }, { "epoch": 0.69, "learning_rate": 1.1355252681141298e-06, "loss": 0.9876, "step": 36745 }, { "epoch": 0.69, "learning_rate": 1.1353972650494113e-06, "loss": 0.9507, "step": 36746 }, { "epoch": 0.69, "learning_rate": 1.1352692670800761e-06, "loss": 0.7848, "step": 36747 }, { "epoch": 0.69, "learning_rate": 1.1351412742066042e-06, "loss": 0.9113, "step": 36748 }, { "epoch": 0.69, "learning_rate": 1.1350132864294741e-06, "loss": 0.7592, "step": 36749 }, { "epoch": 0.69, "learning_rate": 1.1348853037491605e-06, "loss": 0.9092, "step": 36750 }, { "epoch": 0.69, "learning_rate": 1.1347573261661452e-06, "loss": 0.8503, "step": 36751 }, { "epoch": 0.69, "learning_rate": 1.1346293536809033e-06, "loss": 0.9421, "step": 36752 }, { "epoch": 0.69, "learning_rate": 1.1345013862939135e-06, "loss": 0.8821, "step": 36753 }, { "epoch": 0.69, "learning_rate": 1.1343734240056536e-06, "loss": 0.8665, "step": 36754 }, { "epoch": 0.69, "learning_rate": 1.1342454668166016e-06, "loss": 0.8106, "step": 36755 }, { "epoch": 0.69, "learning_rate": 1.134117514727235e-06, "loss": 1.0999, "step": 36756 }, { "epoch": 0.69, "learning_rate": 1.133989567738032e-06, "loss": 1.1389, "step": 36757 }, { "epoch": 0.69, "learning_rate": 1.1338616258494708e-06, "loss": 1.0075, "step": 36758 }, { "epoch": 0.69, "learning_rate": 1.1337336890620265e-06, "loss": 0.7454, "step": 36759 }, { "epoch": 0.69, "learning_rate": 1.1336057573761807e-06, "loss": 0.815, "step": 36760 }, { "epoch": 0.69, "learning_rate": 1.1334778307924079e-06, "loss": 0.8342, "step": 36761 }, { "epoch": 0.69, "learning_rate": 1.1333499093111875e-06, "loss": 0.8344, "step": 36762 }, { "epoch": 0.69, "learning_rate": 1.1332219929329964e-06, "loss": 0.8727, "step": 36763 }, { "epoch": 0.69, "learning_rate": 1.1330940816583121e-06, "loss": 0.7935, "step": 36764 }, { "epoch": 0.69, "learning_rate": 1.132966175487614e-06, "loss": 0.966, "step": 36765 }, { "epoch": 0.69, "learning_rate": 1.1328382744213761e-06, "loss": 0.7486, "step": 36766 }, { "epoch": 0.69, "learning_rate": 1.13271037846008e-06, "loss": 0.7418, "step": 36767 }, { "epoch": 0.69, "learning_rate": 1.1325824876042007e-06, "loss": 0.9781, "step": 36768 }, { "epoch": 0.69, "learning_rate": 1.1324546018542157e-06, "loss": 0.9304, "step": 36769 }, { "epoch": 0.69, "learning_rate": 1.1323267212106048e-06, "loss": 0.7634, "step": 36770 }, { "epoch": 0.69, "learning_rate": 1.1321988456738434e-06, "loss": 0.9901, "step": 36771 }, { "epoch": 0.69, "learning_rate": 1.1320709752444092e-06, "loss": 0.8664, "step": 36772 }, { "epoch": 0.69, "learning_rate": 1.1319431099227805e-06, "loss": 0.8124, "step": 36773 }, { "epoch": 0.69, "learning_rate": 1.1318152497094338e-06, "loss": 1.1425, "step": 36774 }, { "epoch": 0.69, "learning_rate": 1.1316873946048473e-06, "loss": 1.0403, "step": 36775 }, { "epoch": 0.69, "learning_rate": 1.131559544609498e-06, "loss": 1.0001, "step": 36776 }, { "epoch": 0.69, "learning_rate": 1.1314316997238642e-06, "loss": 0.8394, "step": 36777 }, { "epoch": 0.69, "learning_rate": 1.1313038599484209e-06, "loss": 0.9487, "step": 36778 }, { "epoch": 0.69, "learning_rate": 1.1311760252836487e-06, "loss": 0.8117, "step": 36779 }, { "epoch": 0.69, "learning_rate": 1.1310481957300224e-06, "loss": 1.1139, "step": 36780 }, { "epoch": 0.69, "learning_rate": 1.1309203712880201e-06, "loss": 1.1564, "step": 36781 }, { "epoch": 0.69, "learning_rate": 1.1307925519581192e-06, "loss": 1.1223, "step": 36782 }, { "epoch": 0.69, "learning_rate": 1.130664737740797e-06, "loss": 1.1018, "step": 36783 }, { "epoch": 0.69, "learning_rate": 1.1305369286365306e-06, "loss": 0.7932, "step": 36784 }, { "epoch": 0.69, "learning_rate": 1.130409124645797e-06, "loss": 0.8513, "step": 36785 }, { "epoch": 0.69, "learning_rate": 1.1302813257690753e-06, "loss": 0.8969, "step": 36786 }, { "epoch": 0.69, "learning_rate": 1.1301535320068387e-06, "loss": 1.105, "step": 36787 }, { "epoch": 0.69, "learning_rate": 1.130025743359569e-06, "loss": 0.7552, "step": 36788 }, { "epoch": 0.69, "learning_rate": 1.1298979598277404e-06, "loss": 0.755, "step": 36789 }, { "epoch": 0.69, "learning_rate": 1.1297701814118294e-06, "loss": 0.7895, "step": 36790 }, { "epoch": 0.69, "learning_rate": 1.1296424081123166e-06, "loss": 0.931, "step": 36791 }, { "epoch": 0.69, "learning_rate": 1.1295146399296763e-06, "loss": 0.8301, "step": 36792 }, { "epoch": 0.69, "learning_rate": 1.1293868768643863e-06, "loss": 0.782, "step": 36793 }, { "epoch": 0.69, "learning_rate": 1.1292591189169236e-06, "loss": 1.0955, "step": 36794 }, { "epoch": 0.69, "learning_rate": 1.129131366087765e-06, "loss": 0.9424, "step": 36795 }, { "epoch": 0.69, "learning_rate": 1.129003618377388e-06, "loss": 0.9525, "step": 36796 }, { "epoch": 0.69, "learning_rate": 1.1288758757862697e-06, "loss": 0.9578, "step": 36797 }, { "epoch": 0.69, "learning_rate": 1.1287481383148877e-06, "loss": 0.7775, "step": 36798 }, { "epoch": 0.69, "learning_rate": 1.1286204059637163e-06, "loss": 0.8419, "step": 36799 }, { "epoch": 0.69, "learning_rate": 1.128492678733236e-06, "loss": 1.0621, "step": 36800 }, { "epoch": 0.69, "learning_rate": 1.128364956623921e-06, "loss": 0.9125, "step": 36801 }, { "epoch": 0.69, "learning_rate": 1.1282372396362492e-06, "loss": 0.9486, "step": 36802 }, { "epoch": 0.69, "learning_rate": 1.1281095277706975e-06, "loss": 0.9906, "step": 36803 }, { "epoch": 0.69, "learning_rate": 1.127981821027743e-06, "loss": 0.737, "step": 36804 }, { "epoch": 0.69, "learning_rate": 1.1278541194078618e-06, "loss": 1.0993, "step": 36805 }, { "epoch": 0.69, "learning_rate": 1.1277264229115317e-06, "loss": 1.1484, "step": 36806 }, { "epoch": 0.69, "learning_rate": 1.1275987315392298e-06, "loss": 0.9891, "step": 36807 }, { "epoch": 0.69, "learning_rate": 1.1274710452914303e-06, "loss": 0.9779, "step": 36808 }, { "epoch": 0.69, "learning_rate": 1.1273433641686137e-06, "loss": 0.9677, "step": 36809 }, { "epoch": 0.69, "learning_rate": 1.1272156881712543e-06, "loss": 0.7716, "step": 36810 }, { "epoch": 0.69, "learning_rate": 1.127088017299828e-06, "loss": 1.0303, "step": 36811 }, { "epoch": 0.69, "learning_rate": 1.126960351554815e-06, "loss": 1.0811, "step": 36812 }, { "epoch": 0.69, "learning_rate": 1.1268326909366892e-06, "loss": 0.8182, "step": 36813 }, { "epoch": 0.69, "learning_rate": 1.1267050354459278e-06, "loss": 0.7687, "step": 36814 }, { "epoch": 0.69, "learning_rate": 1.1265773850830077e-06, "loss": 0.9109, "step": 36815 }, { "epoch": 0.69, "learning_rate": 1.1264497398484056e-06, "loss": 0.8087, "step": 36816 }, { "epoch": 0.69, "learning_rate": 1.126322099742598e-06, "loss": 1.0071, "step": 36817 }, { "epoch": 0.69, "learning_rate": 1.1261944647660616e-06, "loss": 1.0779, "step": 36818 }, { "epoch": 0.69, "learning_rate": 1.126066834919274e-06, "loss": 1.0101, "step": 36819 }, { "epoch": 0.69, "learning_rate": 1.1259392102027086e-06, "loss": 1.1396, "step": 36820 }, { "epoch": 0.69, "learning_rate": 1.1258115906168462e-06, "loss": 0.9656, "step": 36821 }, { "epoch": 0.69, "learning_rate": 1.1256839761621602e-06, "loss": 0.9661, "step": 36822 }, { "epoch": 0.69, "learning_rate": 1.1255563668391278e-06, "loss": 0.8044, "step": 36823 }, { "epoch": 0.69, "learning_rate": 1.125428762648226e-06, "loss": 0.9921, "step": 36824 }, { "epoch": 0.69, "learning_rate": 1.125301163589931e-06, "loss": 0.9786, "step": 36825 }, { "epoch": 0.69, "learning_rate": 1.1251735696647195e-06, "loss": 0.7693, "step": 36826 }, { "epoch": 0.69, "learning_rate": 1.1250459808730677e-06, "loss": 0.8002, "step": 36827 }, { "epoch": 0.69, "learning_rate": 1.1249183972154525e-06, "loss": 0.8864, "step": 36828 }, { "epoch": 0.69, "learning_rate": 1.1247908186923486e-06, "loss": 0.7945, "step": 36829 }, { "epoch": 0.69, "learning_rate": 1.1246632453042354e-06, "loss": 0.7761, "step": 36830 }, { "epoch": 0.69, "learning_rate": 1.1245356770515861e-06, "loss": 1.0078, "step": 36831 }, { "epoch": 0.69, "learning_rate": 1.1244081139348778e-06, "loss": 1.1403, "step": 36832 }, { "epoch": 0.69, "learning_rate": 1.1242805559545895e-06, "loss": 0.8706, "step": 36833 }, { "epoch": 0.69, "learning_rate": 1.124153003111194e-06, "loss": 0.9967, "step": 36834 }, { "epoch": 0.69, "learning_rate": 1.1240254554051694e-06, "loss": 0.8089, "step": 36835 }, { "epoch": 0.69, "learning_rate": 1.1238979128369912e-06, "loss": 0.9171, "step": 36836 }, { "epoch": 0.69, "learning_rate": 1.1237703754071363e-06, "loss": 1.0102, "step": 36837 }, { "epoch": 0.7, "learning_rate": 1.1236428431160806e-06, "loss": 0.9987, "step": 36838 }, { "epoch": 0.7, "learning_rate": 1.1235153159643e-06, "loss": 0.8548, "step": 36839 }, { "epoch": 0.7, "learning_rate": 1.1233877939522721e-06, "loss": 0.8269, "step": 36840 }, { "epoch": 0.7, "learning_rate": 1.1232602770804704e-06, "loss": 0.9539, "step": 36841 }, { "epoch": 0.7, "learning_rate": 1.1231327653493742e-06, "loss": 0.8154, "step": 36842 }, { "epoch": 0.7, "learning_rate": 1.1230052587594573e-06, "loss": 0.9415, "step": 36843 }, { "epoch": 0.7, "learning_rate": 1.1228777573111965e-06, "loss": 1.1713, "step": 36844 }, { "epoch": 0.7, "learning_rate": 1.1227502610050678e-06, "loss": 0.7108, "step": 36845 }, { "epoch": 0.7, "learning_rate": 1.1226227698415473e-06, "loss": 0.8024, "step": 36846 }, { "epoch": 0.7, "learning_rate": 1.1224952838211114e-06, "loss": 0.8687, "step": 36847 }, { "epoch": 0.7, "learning_rate": 1.1223678029442358e-06, "loss": 0.9418, "step": 36848 }, { "epoch": 0.7, "learning_rate": 1.1222403272113975e-06, "loss": 0.7932, "step": 36849 }, { "epoch": 0.7, "learning_rate": 1.1221128566230697e-06, "loss": 1.1683, "step": 36850 }, { "epoch": 0.7, "learning_rate": 1.1219853911797322e-06, "loss": 0.6806, "step": 36851 }, { "epoch": 0.7, "learning_rate": 1.1218579308818577e-06, "loss": 0.8942, "step": 36852 }, { "epoch": 0.7, "learning_rate": 1.121730475729923e-06, "loss": 1.0016, "step": 36853 }, { "epoch": 0.7, "learning_rate": 1.121603025724406e-06, "loss": 0.8959, "step": 36854 }, { "epoch": 0.7, "learning_rate": 1.12147558086578e-06, "loss": 1.0614, "step": 36855 }, { "epoch": 0.7, "learning_rate": 1.1213481411545223e-06, "loss": 0.8788, "step": 36856 }, { "epoch": 0.7, "learning_rate": 1.1212207065911082e-06, "loss": 0.9808, "step": 36857 }, { "epoch": 0.7, "learning_rate": 1.1210932771760137e-06, "loss": 0.7832, "step": 36858 }, { "epoch": 0.7, "learning_rate": 1.1209658529097144e-06, "loss": 0.8586, "step": 36859 }, { "epoch": 0.7, "learning_rate": 1.1208384337926868e-06, "loss": 0.6716, "step": 36860 }, { "epoch": 0.7, "learning_rate": 1.1207110198254067e-06, "loss": 1.0148, "step": 36861 }, { "epoch": 0.7, "learning_rate": 1.1205836110083476e-06, "loss": 1.232, "step": 36862 }, { "epoch": 0.7, "learning_rate": 1.1204562073419889e-06, "loss": 0.9229, "step": 36863 }, { "epoch": 0.7, "learning_rate": 1.1203288088268035e-06, "loss": 0.6954, "step": 36864 }, { "epoch": 0.7, "learning_rate": 1.1202014154632682e-06, "loss": 0.7855, "step": 36865 }, { "epoch": 0.7, "learning_rate": 1.1200740272518585e-06, "loss": 0.8583, "step": 36866 }, { "epoch": 0.7, "learning_rate": 1.11994664419305e-06, "loss": 0.8158, "step": 36867 }, { "epoch": 0.7, "learning_rate": 1.119819266287318e-06, "loss": 1.0836, "step": 36868 }, { "epoch": 0.7, "learning_rate": 1.1196918935351389e-06, "loss": 1.1514, "step": 36869 }, { "epoch": 0.7, "learning_rate": 1.119564525936989e-06, "loss": 0.8672, "step": 36870 }, { "epoch": 0.7, "learning_rate": 1.1194371634933406e-06, "loss": 0.7948, "step": 36871 }, { "epoch": 0.7, "learning_rate": 1.1193098062046739e-06, "loss": 0.821, "step": 36872 }, { "epoch": 0.7, "learning_rate": 1.1191824540714607e-06, "loss": 0.8121, "step": 36873 }, { "epoch": 0.7, "learning_rate": 1.119055107094177e-06, "loss": 0.9931, "step": 36874 }, { "epoch": 0.7, "learning_rate": 1.1189277652733013e-06, "loss": 0.8489, "step": 36875 }, { "epoch": 0.7, "learning_rate": 1.1188004286093058e-06, "loss": 1.0137, "step": 36876 }, { "epoch": 0.7, "learning_rate": 1.118673097102667e-06, "loss": 0.8303, "step": 36877 }, { "epoch": 0.7, "learning_rate": 1.118545770753861e-06, "loss": 0.8598, "step": 36878 }, { "epoch": 0.7, "learning_rate": 1.1184184495633623e-06, "loss": 0.8972, "step": 36879 }, { "epoch": 0.7, "learning_rate": 1.118291133531647e-06, "loss": 0.8665, "step": 36880 }, { "epoch": 0.7, "learning_rate": 1.11816382265919e-06, "loss": 1.0854, "step": 36881 }, { "epoch": 0.7, "learning_rate": 1.1180365169464683e-06, "loss": 0.8111, "step": 36882 }, { "epoch": 0.7, "learning_rate": 1.1179092163939536e-06, "loss": 0.8557, "step": 36883 }, { "epoch": 0.7, "learning_rate": 1.1177819210021255e-06, "loss": 0.8685, "step": 36884 }, { "epoch": 0.7, "learning_rate": 1.1176546307714565e-06, "loss": 0.8425, "step": 36885 }, { "epoch": 0.7, "learning_rate": 1.1175273457024225e-06, "loss": 1.0251, "step": 36886 }, { "epoch": 0.7, "learning_rate": 1.1174000657954993e-06, "loss": 0.8284, "step": 36887 }, { "epoch": 0.7, "learning_rate": 1.1172727910511616e-06, "loss": 1.0189, "step": 36888 }, { "epoch": 0.7, "learning_rate": 1.1171455214698849e-06, "loss": 1.0103, "step": 36889 }, { "epoch": 0.7, "learning_rate": 1.1170182570521445e-06, "loss": 0.7549, "step": 36890 }, { "epoch": 0.7, "learning_rate": 1.1168909977984165e-06, "loss": 0.8363, "step": 36891 }, { "epoch": 0.7, "learning_rate": 1.1167637437091734e-06, "loss": 0.9568, "step": 36892 }, { "epoch": 0.7, "learning_rate": 1.1166364947848934e-06, "loss": 1.0056, "step": 36893 }, { "epoch": 0.7, "learning_rate": 1.1165092510260497e-06, "loss": 1.0945, "step": 36894 }, { "epoch": 0.7, "learning_rate": 1.1163820124331174e-06, "loss": 1.0391, "step": 36895 }, { "epoch": 0.7, "learning_rate": 1.1162547790065736e-06, "loss": 0.7839, "step": 36896 }, { "epoch": 0.7, "learning_rate": 1.1161275507468914e-06, "loss": 1.122, "step": 36897 }, { "epoch": 0.7, "learning_rate": 1.1160003276545464e-06, "loss": 0.7933, "step": 36898 }, { "epoch": 0.7, "learning_rate": 1.1158731097300138e-06, "loss": 0.8076, "step": 36899 }, { "epoch": 0.7, "learning_rate": 1.1157458969737686e-06, "loss": 0.9618, "step": 36900 }, { "epoch": 0.7, "learning_rate": 1.1156186893862854e-06, "loss": 0.927, "step": 36901 }, { "epoch": 0.7, "learning_rate": 1.1154914869680403e-06, "loss": 0.9567, "step": 36902 }, { "epoch": 0.7, "learning_rate": 1.115364289719508e-06, "loss": 0.9771, "step": 36903 }, { "epoch": 0.7, "learning_rate": 1.115237097641161e-06, "loss": 0.8861, "step": 36904 }, { "epoch": 0.7, "learning_rate": 1.1151099107334783e-06, "loss": 1.1436, "step": 36905 }, { "epoch": 0.7, "learning_rate": 1.1149827289969317e-06, "loss": 1.0267, "step": 36906 }, { "epoch": 0.7, "learning_rate": 1.1148555524319974e-06, "loss": 0.919, "step": 36907 }, { "epoch": 0.7, "learning_rate": 1.1147283810391497e-06, "loss": 1.075, "step": 36908 }, { "epoch": 0.7, "learning_rate": 1.1146012148188636e-06, "loss": 0.8318, "step": 36909 }, { "epoch": 0.7, "learning_rate": 1.1144740537716145e-06, "loss": 0.6911, "step": 36910 }, { "epoch": 0.7, "learning_rate": 1.1143468978978766e-06, "loss": 0.8354, "step": 36911 }, { "epoch": 0.7, "learning_rate": 1.1142197471981259e-06, "loss": 0.9757, "step": 36912 }, { "epoch": 0.7, "learning_rate": 1.1140926016728343e-06, "loss": 0.972, "step": 36913 }, { "epoch": 0.7, "learning_rate": 1.11396546132248e-06, "loss": 0.8726, "step": 36914 }, { "epoch": 0.7, "learning_rate": 1.1138383261475357e-06, "loss": 0.8585, "step": 36915 }, { "epoch": 0.7, "learning_rate": 1.1137111961484755e-06, "loss": 0.7289, "step": 36916 }, { "epoch": 0.7, "learning_rate": 1.113584071325777e-06, "loss": 0.6993, "step": 36917 }, { "epoch": 0.7, "learning_rate": 1.113456951679912e-06, "loss": 0.8089, "step": 36918 }, { "epoch": 0.7, "learning_rate": 1.1133298372113567e-06, "loss": 1.0427, "step": 36919 }, { "epoch": 0.7, "learning_rate": 1.1132027279205849e-06, "loss": 0.9364, "step": 36920 }, { "epoch": 0.7, "learning_rate": 1.1130756238080715e-06, "loss": 0.8494, "step": 36921 }, { "epoch": 0.7, "learning_rate": 1.1129485248742913e-06, "loss": 0.7729, "step": 36922 }, { "epoch": 0.7, "learning_rate": 1.1128214311197189e-06, "loss": 0.7304, "step": 36923 }, { "epoch": 0.7, "learning_rate": 1.1126943425448293e-06, "loss": 0.8943, "step": 36924 }, { "epoch": 0.7, "learning_rate": 1.1125672591500952e-06, "loss": 0.8773, "step": 36925 }, { "epoch": 0.7, "learning_rate": 1.1124401809359938e-06, "loss": 1.135, "step": 36926 }, { "epoch": 0.7, "learning_rate": 1.1123131079029978e-06, "loss": 0.8201, "step": 36927 }, { "epoch": 0.7, "learning_rate": 1.1121860400515816e-06, "loss": 1.0335, "step": 36928 }, { "epoch": 0.7, "learning_rate": 1.1120589773822205e-06, "loss": 0.8826, "step": 36929 }, { "epoch": 0.7, "learning_rate": 1.1119319198953885e-06, "loss": 0.8813, "step": 36930 }, { "epoch": 0.7, "learning_rate": 1.1118048675915603e-06, "loss": 1.1625, "step": 36931 }, { "epoch": 0.7, "learning_rate": 1.1116778204712098e-06, "loss": 0.8416, "step": 36932 }, { "epoch": 0.7, "learning_rate": 1.1115507785348128e-06, "loss": 1.0054, "step": 36933 }, { "epoch": 0.7, "learning_rate": 1.111423741782841e-06, "loss": 0.9091, "step": 36934 }, { "epoch": 0.7, "learning_rate": 1.111296710215772e-06, "loss": 0.9442, "step": 36935 }, { "epoch": 0.7, "learning_rate": 1.1111696838340777e-06, "loss": 1.0142, "step": 36936 }, { "epoch": 0.7, "learning_rate": 1.1110426626382323e-06, "loss": 1.0638, "step": 36937 }, { "epoch": 0.7, "learning_rate": 1.1109156466287128e-06, "loss": 1.1235, "step": 36938 }, { "epoch": 0.7, "learning_rate": 1.1107886358059908e-06, "loss": 0.6929, "step": 36939 }, { "epoch": 0.7, "learning_rate": 1.1106616301705414e-06, "loss": 0.8403, "step": 36940 }, { "epoch": 0.7, "learning_rate": 1.110534629722839e-06, "loss": 0.9533, "step": 36941 }, { "epoch": 0.7, "learning_rate": 1.1104076344633575e-06, "loss": 0.8464, "step": 36942 }, { "epoch": 0.7, "learning_rate": 1.1102806443925713e-06, "loss": 0.9374, "step": 36943 }, { "epoch": 0.7, "learning_rate": 1.1101536595109547e-06, "loss": 1.0642, "step": 36944 }, { "epoch": 0.7, "learning_rate": 1.1100266798189825e-06, "loss": 0.8117, "step": 36945 }, { "epoch": 0.7, "learning_rate": 1.1098997053171262e-06, "loss": 0.9603, "step": 36946 }, { "epoch": 0.7, "learning_rate": 1.1097727360058637e-06, "loss": 1.1084, "step": 36947 }, { "epoch": 0.7, "learning_rate": 1.1096457718856666e-06, "loss": 0.8708, "step": 36948 }, { "epoch": 0.7, "learning_rate": 1.109518812957009e-06, "loss": 1.2247, "step": 36949 }, { "epoch": 0.7, "learning_rate": 1.1093918592203657e-06, "loss": 0.9406, "step": 36950 }, { "epoch": 0.7, "learning_rate": 1.1092649106762106e-06, "loss": 0.9643, "step": 36951 }, { "epoch": 0.7, "learning_rate": 1.1091379673250176e-06, "loss": 0.9369, "step": 36952 }, { "epoch": 0.7, "learning_rate": 1.109011029167261e-06, "loss": 0.7877, "step": 36953 }, { "epoch": 0.7, "learning_rate": 1.1088840962034154e-06, "loss": 0.7903, "step": 36954 }, { "epoch": 0.7, "learning_rate": 1.108757168433952e-06, "loss": 0.8524, "step": 36955 }, { "epoch": 0.7, "learning_rate": 1.1086302458593488e-06, "loss": 0.9459, "step": 36956 }, { "epoch": 0.7, "learning_rate": 1.1085033284800763e-06, "loss": 0.7497, "step": 36957 }, { "epoch": 0.7, "learning_rate": 1.108376416296609e-06, "loss": 0.9012, "step": 36958 }, { "epoch": 0.7, "learning_rate": 1.1082495093094234e-06, "loss": 0.8134, "step": 36959 }, { "epoch": 0.7, "learning_rate": 1.1081226075189902e-06, "loss": 0.7885, "step": 36960 }, { "epoch": 0.7, "learning_rate": 1.1079957109257847e-06, "loss": 0.8625, "step": 36961 }, { "epoch": 0.7, "learning_rate": 1.1078688195302806e-06, "loss": 1.0509, "step": 36962 }, { "epoch": 0.7, "learning_rate": 1.1077419333329517e-06, "loss": 0.942, "step": 36963 }, { "epoch": 0.7, "learning_rate": 1.1076150523342716e-06, "loss": 0.7964, "step": 36964 }, { "epoch": 0.7, "learning_rate": 1.1074881765347142e-06, "loss": 0.9682, "step": 36965 }, { "epoch": 0.7, "learning_rate": 1.1073613059347543e-06, "loss": 0.9236, "step": 36966 }, { "epoch": 0.7, "learning_rate": 1.1072344405348625e-06, "loss": 0.6923, "step": 36967 }, { "epoch": 0.7, "learning_rate": 1.1071075803355167e-06, "loss": 1.0277, "step": 36968 }, { "epoch": 0.7, "learning_rate": 1.1069807253371875e-06, "loss": 1.0609, "step": 36969 }, { "epoch": 0.7, "learning_rate": 1.1068538755403496e-06, "loss": 1.0697, "step": 36970 }, { "epoch": 0.7, "learning_rate": 1.1067270309454763e-06, "loss": 1.0264, "step": 36971 }, { "epoch": 0.7, "learning_rate": 1.1066001915530419e-06, "loss": 0.9026, "step": 36972 }, { "epoch": 0.7, "learning_rate": 1.1064733573635194e-06, "loss": 0.9091, "step": 36973 }, { "epoch": 0.7, "learning_rate": 1.106346528377383e-06, "loss": 0.8992, "step": 36974 }, { "epoch": 0.7, "learning_rate": 1.1062197045951067e-06, "loss": 1.1501, "step": 36975 }, { "epoch": 0.7, "learning_rate": 1.1060928860171612e-06, "loss": 0.8141, "step": 36976 }, { "epoch": 0.7, "learning_rate": 1.1059660726440244e-06, "loss": 0.9075, "step": 36977 }, { "epoch": 0.7, "learning_rate": 1.1058392644761665e-06, "loss": 0.9397, "step": 36978 }, { "epoch": 0.7, "learning_rate": 1.1057124615140607e-06, "loss": 0.9138, "step": 36979 }, { "epoch": 0.7, "learning_rate": 1.105585663758184e-06, "loss": 0.9342, "step": 36980 }, { "epoch": 0.7, "learning_rate": 1.105458871209007e-06, "loss": 1.1884, "step": 36981 }, { "epoch": 0.7, "learning_rate": 1.1053320838670035e-06, "loss": 0.9788, "step": 36982 }, { "epoch": 0.7, "learning_rate": 1.1052053017326472e-06, "loss": 0.787, "step": 36983 }, { "epoch": 0.7, "learning_rate": 1.1050785248064116e-06, "loss": 0.9271, "step": 36984 }, { "epoch": 0.7, "learning_rate": 1.1049517530887701e-06, "loss": 0.6635, "step": 36985 }, { "epoch": 0.7, "learning_rate": 1.1048249865801958e-06, "loss": 0.8845, "step": 36986 }, { "epoch": 0.7, "learning_rate": 1.1046982252811633e-06, "loss": 0.804, "step": 36987 }, { "epoch": 0.7, "learning_rate": 1.104571469192143e-06, "loss": 1.2248, "step": 36988 }, { "epoch": 0.7, "learning_rate": 1.104444718313612e-06, "loss": 0.9023, "step": 36989 }, { "epoch": 0.7, "learning_rate": 1.1043179726460404e-06, "loss": 0.7457, "step": 36990 }, { "epoch": 0.7, "learning_rate": 1.1041912321899028e-06, "loss": 0.8734, "step": 36991 }, { "epoch": 0.7, "learning_rate": 1.1040644969456726e-06, "loss": 0.8212, "step": 36992 }, { "epoch": 0.7, "learning_rate": 1.1039377669138227e-06, "loss": 0.9409, "step": 36993 }, { "epoch": 0.7, "learning_rate": 1.1038110420948261e-06, "loss": 0.9849, "step": 36994 }, { "epoch": 0.7, "learning_rate": 1.1036843224891564e-06, "loss": 0.9653, "step": 36995 }, { "epoch": 0.7, "learning_rate": 1.1035576080972875e-06, "loss": 0.7678, "step": 36996 }, { "epoch": 0.7, "learning_rate": 1.103430898919691e-06, "loss": 0.8157, "step": 36997 }, { "epoch": 0.7, "learning_rate": 1.1033041949568405e-06, "loss": 0.7846, "step": 36998 }, { "epoch": 0.7, "learning_rate": 1.1031774962092093e-06, "loss": 0.9588, "step": 36999 }, { "epoch": 0.7, "learning_rate": 1.1030508026772705e-06, "loss": 1.0419, "step": 37000 }, { "epoch": 0.7, "learning_rate": 1.1029241143614972e-06, "loss": 0.9266, "step": 37001 }, { "epoch": 0.7, "learning_rate": 1.1027974312623625e-06, "loss": 0.987, "step": 37002 }, { "epoch": 0.7, "learning_rate": 1.1026707533803402e-06, "loss": 0.9948, "step": 37003 }, { "epoch": 0.7, "learning_rate": 1.1025440807159007e-06, "loss": 0.8271, "step": 37004 }, { "epoch": 0.7, "learning_rate": 1.1024174132695195e-06, "loss": 1.1865, "step": 37005 }, { "epoch": 0.7, "learning_rate": 1.10229075104167e-06, "loss": 1.0306, "step": 37006 }, { "epoch": 0.7, "learning_rate": 1.1021640940328219e-06, "loss": 0.9202, "step": 37007 }, { "epoch": 0.7, "learning_rate": 1.1020374422434522e-06, "loss": 0.7278, "step": 37008 }, { "epoch": 0.7, "learning_rate": 1.1019107956740308e-06, "loss": 0.8864, "step": 37009 }, { "epoch": 0.7, "learning_rate": 1.1017841543250318e-06, "loss": 0.9349, "step": 37010 }, { "epoch": 0.7, "learning_rate": 1.1016575181969278e-06, "loss": 0.9342, "step": 37011 }, { "epoch": 0.7, "learning_rate": 1.1015308872901917e-06, "loss": 0.933, "step": 37012 }, { "epoch": 0.7, "learning_rate": 1.1014042616052964e-06, "loss": 0.9127, "step": 37013 }, { "epoch": 0.7, "learning_rate": 1.1012776411427147e-06, "loss": 0.8918, "step": 37014 }, { "epoch": 0.7, "learning_rate": 1.1011510259029204e-06, "loss": 0.8813, "step": 37015 }, { "epoch": 0.7, "learning_rate": 1.1010244158863834e-06, "loss": 0.9059, "step": 37016 }, { "epoch": 0.7, "learning_rate": 1.1008978110935801e-06, "loss": 0.9539, "step": 37017 }, { "epoch": 0.7, "learning_rate": 1.1007712115249804e-06, "loss": 1.0652, "step": 37018 }, { "epoch": 0.7, "learning_rate": 1.1006446171810586e-06, "loss": 1.2748, "step": 37019 }, { "epoch": 0.7, "learning_rate": 1.1005180280622866e-06, "loss": 0.7662, "step": 37020 }, { "epoch": 0.7, "learning_rate": 1.1003914441691374e-06, "loss": 0.9778, "step": 37021 }, { "epoch": 0.7, "learning_rate": 1.1002648655020834e-06, "loss": 0.7356, "step": 37022 }, { "epoch": 0.7, "learning_rate": 1.1001382920615978e-06, "loss": 1.0123, "step": 37023 }, { "epoch": 0.7, "learning_rate": 1.1000117238481537e-06, "loss": 1.0945, "step": 37024 }, { "epoch": 0.7, "learning_rate": 1.099885160862221e-06, "loss": 1.0919, "step": 37025 }, { "epoch": 0.7, "learning_rate": 1.0997586031042754e-06, "loss": 0.8973, "step": 37026 }, { "epoch": 0.7, "learning_rate": 1.0996320505747888e-06, "loss": 0.7687, "step": 37027 }, { "epoch": 0.7, "learning_rate": 1.0995055032742315e-06, "loss": 0.9412, "step": 37028 }, { "epoch": 0.7, "learning_rate": 1.0993789612030796e-06, "loss": 0.8683, "step": 37029 }, { "epoch": 0.7, "learning_rate": 1.0992524243618027e-06, "loss": 0.8278, "step": 37030 }, { "epoch": 0.7, "learning_rate": 1.0991258927508745e-06, "loss": 1.0486, "step": 37031 }, { "epoch": 0.7, "learning_rate": 1.0989993663707669e-06, "loss": 0.894, "step": 37032 }, { "epoch": 0.7, "learning_rate": 1.098872845221953e-06, "loss": 0.8709, "step": 37033 }, { "epoch": 0.7, "learning_rate": 1.0987463293049047e-06, "loss": 0.9949, "step": 37034 }, { "epoch": 0.7, "learning_rate": 1.0986198186200947e-06, "loss": 0.9208, "step": 37035 }, { "epoch": 0.7, "learning_rate": 1.0984933131679964e-06, "loss": 1.0661, "step": 37036 }, { "epoch": 0.7, "learning_rate": 1.0983668129490793e-06, "loss": 1.1526, "step": 37037 }, { "epoch": 0.7, "learning_rate": 1.0982403179638193e-06, "loss": 1.1331, "step": 37038 }, { "epoch": 0.7, "learning_rate": 1.098113828212686e-06, "loss": 0.8286, "step": 37039 }, { "epoch": 0.7, "learning_rate": 1.0979873436961527e-06, "loss": 0.8052, "step": 37040 }, { "epoch": 0.7, "learning_rate": 1.0978608644146915e-06, "loss": 0.9244, "step": 37041 }, { "epoch": 0.7, "learning_rate": 1.0977343903687752e-06, "loss": 0.9141, "step": 37042 }, { "epoch": 0.7, "learning_rate": 1.0976079215588756e-06, "loss": 0.9752, "step": 37043 }, { "epoch": 0.7, "learning_rate": 1.0974814579854649e-06, "loss": 0.9991, "step": 37044 }, { "epoch": 0.7, "learning_rate": 1.0973549996490163e-06, "loss": 0.8707, "step": 37045 }, { "epoch": 0.7, "learning_rate": 1.0972285465499993e-06, "loss": 0.746, "step": 37046 }, { "epoch": 0.7, "learning_rate": 1.097102098688889e-06, "loss": 0.8821, "step": 37047 }, { "epoch": 0.7, "learning_rate": 1.0969756560661571e-06, "loss": 0.9707, "step": 37048 }, { "epoch": 0.7, "learning_rate": 1.0968492186822734e-06, "loss": 1.0499, "step": 37049 }, { "epoch": 0.7, "learning_rate": 1.0967227865377135e-06, "loss": 0.9536, "step": 37050 }, { "epoch": 0.7, "learning_rate": 1.096596359632947e-06, "loss": 0.8053, "step": 37051 }, { "epoch": 0.7, "learning_rate": 1.0964699379684466e-06, "loss": 0.9483, "step": 37052 }, { "epoch": 0.7, "learning_rate": 1.0963435215446841e-06, "loss": 0.9626, "step": 37053 }, { "epoch": 0.7, "learning_rate": 1.0962171103621322e-06, "loss": 0.7563, "step": 37054 }, { "epoch": 0.7, "learning_rate": 1.0960907044212624e-06, "loss": 1.0237, "step": 37055 }, { "epoch": 0.7, "learning_rate": 1.0959643037225468e-06, "loss": 1.1406, "step": 37056 }, { "epoch": 0.7, "learning_rate": 1.0958379082664586e-06, "loss": 0.9817, "step": 37057 }, { "epoch": 0.7, "learning_rate": 1.0957115180534664e-06, "loss": 0.7317, "step": 37058 }, { "epoch": 0.7, "learning_rate": 1.0955851330840463e-06, "loss": 0.7354, "step": 37059 }, { "epoch": 0.7, "learning_rate": 1.0954587533586675e-06, "loss": 0.9324, "step": 37060 }, { "epoch": 0.7, "learning_rate": 1.0953323788778025e-06, "loss": 0.9471, "step": 37061 }, { "epoch": 0.7, "learning_rate": 1.0952060096419235e-06, "loss": 1.1973, "step": 37062 }, { "epoch": 0.7, "learning_rate": 1.095079645651502e-06, "loss": 1.0787, "step": 37063 }, { "epoch": 0.7, "learning_rate": 1.0949532869070101e-06, "loss": 0.7264, "step": 37064 }, { "epoch": 0.7, "learning_rate": 1.0948269334089196e-06, "loss": 0.8427, "step": 37065 }, { "epoch": 0.7, "learning_rate": 1.0947005851577031e-06, "loss": 0.9264, "step": 37066 }, { "epoch": 0.7, "learning_rate": 1.0945742421538297e-06, "loss": 0.7274, "step": 37067 }, { "epoch": 0.7, "learning_rate": 1.094447904397774e-06, "loss": 0.856, "step": 37068 }, { "epoch": 0.7, "learning_rate": 1.0943215718900074e-06, "loss": 0.9663, "step": 37069 }, { "epoch": 0.7, "learning_rate": 1.0941952446309995e-06, "loss": 0.8808, "step": 37070 }, { "epoch": 0.7, "learning_rate": 1.0940689226212251e-06, "loss": 0.7972, "step": 37071 }, { "epoch": 0.7, "learning_rate": 1.0939426058611533e-06, "loss": 0.7543, "step": 37072 }, { "epoch": 0.7, "learning_rate": 1.0938162943512566e-06, "loss": 1.0433, "step": 37073 }, { "epoch": 0.7, "learning_rate": 1.0936899880920067e-06, "loss": 1.3141, "step": 37074 }, { "epoch": 0.7, "learning_rate": 1.0935636870838756e-06, "loss": 1.0114, "step": 37075 }, { "epoch": 0.7, "learning_rate": 1.0934373913273342e-06, "loss": 0.8968, "step": 37076 }, { "epoch": 0.7, "learning_rate": 1.0933111008228548e-06, "loss": 0.9433, "step": 37077 }, { "epoch": 0.7, "learning_rate": 1.0931848155709094e-06, "loss": 0.7602, "step": 37078 }, { "epoch": 0.7, "learning_rate": 1.0930585355719666e-06, "loss": 0.7823, "step": 37079 }, { "epoch": 0.7, "learning_rate": 1.0929322608265022e-06, "loss": 0.9746, "step": 37080 }, { "epoch": 0.7, "learning_rate": 1.0928059913349848e-06, "loss": 1.0582, "step": 37081 }, { "epoch": 0.7, "learning_rate": 1.0926797270978867e-06, "loss": 1.0184, "step": 37082 }, { "epoch": 0.7, "learning_rate": 1.092553468115679e-06, "loss": 0.7388, "step": 37083 }, { "epoch": 0.7, "learning_rate": 1.0924272143888336e-06, "loss": 1.0425, "step": 37084 }, { "epoch": 0.7, "learning_rate": 1.0923009659178222e-06, "loss": 0.95, "step": 37085 }, { "epoch": 0.7, "learning_rate": 1.0921747227031154e-06, "loss": 0.8167, "step": 37086 }, { "epoch": 0.7, "learning_rate": 1.0920484847451861e-06, "loss": 0.993, "step": 37087 }, { "epoch": 0.7, "learning_rate": 1.091922252044503e-06, "loss": 1.1498, "step": 37088 }, { "epoch": 0.7, "learning_rate": 1.0917960246015396e-06, "loss": 0.9227, "step": 37089 }, { "epoch": 0.7, "learning_rate": 1.0916698024167677e-06, "loss": 0.8347, "step": 37090 }, { "epoch": 0.7, "learning_rate": 1.0915435854906558e-06, "loss": 0.7928, "step": 37091 }, { "epoch": 0.7, "learning_rate": 1.0914173738236788e-06, "loss": 0.8869, "step": 37092 }, { "epoch": 0.7, "learning_rate": 1.0912911674163051e-06, "loss": 0.8994, "step": 37093 }, { "epoch": 0.7, "learning_rate": 1.091164966269007e-06, "loss": 1.0234, "step": 37094 }, { "epoch": 0.7, "learning_rate": 1.0910387703822559e-06, "loss": 0.8381, "step": 37095 }, { "epoch": 0.7, "learning_rate": 1.0909125797565226e-06, "loss": 0.9279, "step": 37096 }, { "epoch": 0.7, "learning_rate": 1.090786394392279e-06, "loss": 0.9608, "step": 37097 }, { "epoch": 0.7, "learning_rate": 1.0906602142899952e-06, "loss": 0.9482, "step": 37098 }, { "epoch": 0.7, "learning_rate": 1.0905340394501441e-06, "loss": 1.0494, "step": 37099 }, { "epoch": 0.7, "learning_rate": 1.0904078698731938e-06, "loss": 0.9587, "step": 37100 }, { "epoch": 0.7, "learning_rate": 1.0902817055596194e-06, "loss": 0.7185, "step": 37101 }, { "epoch": 0.7, "learning_rate": 1.0901555465098887e-06, "loss": 0.9146, "step": 37102 }, { "epoch": 0.7, "learning_rate": 1.0900293927244728e-06, "loss": 0.8647, "step": 37103 }, { "epoch": 0.7, "learning_rate": 1.0899032442038462e-06, "loss": 0.7985, "step": 37104 }, { "epoch": 0.7, "learning_rate": 1.0897771009484767e-06, "loss": 0.832, "step": 37105 }, { "epoch": 0.7, "learning_rate": 1.0896509629588361e-06, "loss": 1.0605, "step": 37106 }, { "epoch": 0.7, "learning_rate": 1.0895248302353955e-06, "loss": 1.1627, "step": 37107 }, { "epoch": 0.7, "learning_rate": 1.089398702778626e-06, "loss": 0.726, "step": 37108 }, { "epoch": 0.7, "learning_rate": 1.0892725805889987e-06, "loss": 0.8439, "step": 37109 }, { "epoch": 0.7, "learning_rate": 1.089146463666984e-06, "loss": 1.0344, "step": 37110 }, { "epoch": 0.7, "learning_rate": 1.0890203520130543e-06, "loss": 0.8541, "step": 37111 }, { "epoch": 0.7, "learning_rate": 1.0888942456276775e-06, "loss": 0.9801, "step": 37112 }, { "epoch": 0.7, "learning_rate": 1.0887681445113283e-06, "loss": 1.063, "step": 37113 }, { "epoch": 0.7, "learning_rate": 1.0886420486644742e-06, "loss": 0.9745, "step": 37114 }, { "epoch": 0.7, "learning_rate": 1.0885159580875878e-06, "loss": 0.8223, "step": 37115 }, { "epoch": 0.7, "learning_rate": 1.0883898727811392e-06, "loss": 0.8935, "step": 37116 }, { "epoch": 0.7, "learning_rate": 1.0882637927455999e-06, "loss": 0.8543, "step": 37117 }, { "epoch": 0.7, "learning_rate": 1.08813771798144e-06, "loss": 0.8616, "step": 37118 }, { "epoch": 0.7, "learning_rate": 1.088011648489131e-06, "loss": 1.0509, "step": 37119 }, { "epoch": 0.7, "learning_rate": 1.0878855842691439e-06, "loss": 0.925, "step": 37120 }, { "epoch": 0.7, "learning_rate": 1.0877595253219467e-06, "loss": 0.9292, "step": 37121 }, { "epoch": 0.7, "learning_rate": 1.0876334716480142e-06, "loss": 0.7883, "step": 37122 }, { "epoch": 0.7, "learning_rate": 1.087507423247814e-06, "loss": 0.8533, "step": 37123 }, { "epoch": 0.7, "learning_rate": 1.0873813801218169e-06, "loss": 1.003, "step": 37124 }, { "epoch": 0.7, "learning_rate": 1.0872553422704963e-06, "loss": 1.0833, "step": 37125 }, { "epoch": 0.7, "learning_rate": 1.0871293096943197e-06, "loss": 0.9129, "step": 37126 }, { "epoch": 0.7, "learning_rate": 1.0870032823937593e-06, "loss": 0.8798, "step": 37127 }, { "epoch": 0.7, "learning_rate": 1.0868772603692854e-06, "loss": 0.918, "step": 37128 }, { "epoch": 0.7, "learning_rate": 1.086751243621368e-06, "loss": 0.7761, "step": 37129 }, { "epoch": 0.7, "learning_rate": 1.0866252321504785e-06, "loss": 1.0017, "step": 37130 }, { "epoch": 0.7, "learning_rate": 1.086499225957087e-06, "loss": 1.0139, "step": 37131 }, { "epoch": 0.7, "learning_rate": 1.086373225041665e-06, "loss": 0.8045, "step": 37132 }, { "epoch": 0.7, "learning_rate": 1.08624722940468e-06, "loss": 0.8351, "step": 37133 }, { "epoch": 0.7, "learning_rate": 1.0861212390466066e-06, "loss": 0.9068, "step": 37134 }, { "epoch": 0.7, "learning_rate": 1.0859952539679119e-06, "loss": 1.1323, "step": 37135 }, { "epoch": 0.7, "learning_rate": 1.085869274169068e-06, "loss": 0.6717, "step": 37136 }, { "epoch": 0.7, "learning_rate": 1.0857432996505447e-06, "loss": 0.9888, "step": 37137 }, { "epoch": 0.7, "learning_rate": 1.0856173304128123e-06, "loss": 0.9946, "step": 37138 }, { "epoch": 0.7, "learning_rate": 1.0854913664563416e-06, "loss": 0.8503, "step": 37139 }, { "epoch": 0.7, "learning_rate": 1.0853654077816028e-06, "loss": 1.0643, "step": 37140 }, { "epoch": 0.7, "learning_rate": 1.085239454389067e-06, "loss": 0.8845, "step": 37141 }, { "epoch": 0.7, "learning_rate": 1.085113506279202e-06, "loss": 0.8678, "step": 37142 }, { "epoch": 0.7, "learning_rate": 1.0849875634524815e-06, "loss": 1.2675, "step": 37143 }, { "epoch": 0.7, "learning_rate": 1.0848616259093733e-06, "loss": 1.2244, "step": 37144 }, { "epoch": 0.7, "learning_rate": 1.0847356936503476e-06, "loss": 0.8738, "step": 37145 }, { "epoch": 0.7, "learning_rate": 1.0846097666758768e-06, "loss": 0.9685, "step": 37146 }, { "epoch": 0.7, "learning_rate": 1.0844838449864292e-06, "loss": 0.8773, "step": 37147 }, { "epoch": 0.7, "learning_rate": 1.0843579285824753e-06, "loss": 0.9441, "step": 37148 }, { "epoch": 0.7, "learning_rate": 1.0842320174644855e-06, "loss": 0.9286, "step": 37149 }, { "epoch": 0.7, "learning_rate": 1.08410611163293e-06, "loss": 1.0442, "step": 37150 }, { "epoch": 0.7, "learning_rate": 1.083980211088279e-06, "loss": 0.8093, "step": 37151 }, { "epoch": 0.7, "learning_rate": 1.0838543158310025e-06, "loss": 0.8676, "step": 37152 }, { "epoch": 0.7, "learning_rate": 1.0837284258615712e-06, "loss": 0.9066, "step": 37153 }, { "epoch": 0.7, "learning_rate": 1.0836025411804528e-06, "loss": 0.9205, "step": 37154 }, { "epoch": 0.7, "learning_rate": 1.083476661788121e-06, "loss": 0.9478, "step": 37155 }, { "epoch": 0.7, "learning_rate": 1.083350787685043e-06, "loss": 1.1624, "step": 37156 }, { "epoch": 0.7, "learning_rate": 1.0832249188716897e-06, "loss": 0.7838, "step": 37157 }, { "epoch": 0.7, "learning_rate": 1.0830990553485309e-06, "loss": 0.7788, "step": 37158 }, { "epoch": 0.7, "learning_rate": 1.082973197116037e-06, "loss": 0.8961, "step": 37159 }, { "epoch": 0.7, "learning_rate": 1.082847344174678e-06, "loss": 0.7652, "step": 37160 }, { "epoch": 0.7, "learning_rate": 1.0827214965249231e-06, "loss": 0.9704, "step": 37161 }, { "epoch": 0.7, "learning_rate": 1.0825956541672438e-06, "loss": 1.0709, "step": 37162 }, { "epoch": 0.7, "learning_rate": 1.082469817102107e-06, "loss": 0.888, "step": 37163 }, { "epoch": 0.7, "learning_rate": 1.0823439853299865e-06, "loss": 0.8232, "step": 37164 }, { "epoch": 0.7, "learning_rate": 1.082218158851349e-06, "loss": 0.6522, "step": 37165 }, { "epoch": 0.7, "learning_rate": 1.0820923376666643e-06, "loss": 0.855, "step": 37166 }, { "epoch": 0.7, "learning_rate": 1.0819665217764052e-06, "loss": 0.8071, "step": 37167 }, { "epoch": 0.7, "learning_rate": 1.0818407111810388e-06, "loss": 0.774, "step": 37168 }, { "epoch": 0.7, "learning_rate": 1.081714905881036e-06, "loss": 0.9031, "step": 37169 }, { "epoch": 0.7, "learning_rate": 1.081589105876866e-06, "loss": 0.8705, "step": 37170 }, { "epoch": 0.7, "learning_rate": 1.0814633111689987e-06, "loss": 0.8252, "step": 37171 }, { "epoch": 0.7, "learning_rate": 1.0813375217579039e-06, "loss": 1.0788, "step": 37172 }, { "epoch": 0.7, "learning_rate": 1.0812117376440515e-06, "loss": 0.752, "step": 37173 }, { "epoch": 0.7, "learning_rate": 1.0810859588279118e-06, "loss": 0.9084, "step": 37174 }, { "epoch": 0.7, "learning_rate": 1.0809601853099518e-06, "loss": 1.0321, "step": 37175 }, { "epoch": 0.7, "learning_rate": 1.080834417090645e-06, "loss": 1.061, "step": 37176 }, { "epoch": 0.7, "learning_rate": 1.0807086541704575e-06, "loss": 0.972, "step": 37177 }, { "epoch": 0.7, "learning_rate": 1.0805828965498608e-06, "loss": 0.6948, "step": 37178 }, { "epoch": 0.7, "learning_rate": 1.0804571442293238e-06, "loss": 1.004, "step": 37179 }, { "epoch": 0.7, "learning_rate": 1.0803313972093166e-06, "loss": 0.9659, "step": 37180 }, { "epoch": 0.7, "learning_rate": 1.0802056554903081e-06, "loss": 0.8871, "step": 37181 }, { "epoch": 0.7, "learning_rate": 1.0800799190727685e-06, "loss": 0.7965, "step": 37182 }, { "epoch": 0.7, "learning_rate": 1.0799541879571675e-06, "loss": 0.9037, "step": 37183 }, { "epoch": 0.7, "learning_rate": 1.0798284621439724e-06, "loss": 0.9907, "step": 37184 }, { "epoch": 0.7, "learning_rate": 1.0797027416336561e-06, "loss": 0.9462, "step": 37185 }, { "epoch": 0.7, "learning_rate": 1.0795770264266855e-06, "loss": 0.9332, "step": 37186 }, { "epoch": 0.7, "learning_rate": 1.0794513165235297e-06, "loss": 1.3843, "step": 37187 }, { "epoch": 0.7, "learning_rate": 1.0793256119246606e-06, "loss": 0.9224, "step": 37188 }, { "epoch": 0.7, "learning_rate": 1.0791999126305456e-06, "loss": 0.9597, "step": 37189 }, { "epoch": 0.7, "learning_rate": 1.0790742186416544e-06, "loss": 0.8705, "step": 37190 }, { "epoch": 0.7, "learning_rate": 1.0789485299584564e-06, "loss": 0.8436, "step": 37191 }, { "epoch": 0.7, "learning_rate": 1.0788228465814212e-06, "loss": 0.745, "step": 37192 }, { "epoch": 0.7, "learning_rate": 1.0786971685110178e-06, "loss": 0.9715, "step": 37193 }, { "epoch": 0.7, "learning_rate": 1.0785714957477158e-06, "loss": 1.1278, "step": 37194 }, { "epoch": 0.7, "learning_rate": 1.0784458282919849e-06, "loss": 0.8655, "step": 37195 }, { "epoch": 0.7, "learning_rate": 1.078320166144292e-06, "loss": 0.8334, "step": 37196 }, { "epoch": 0.7, "learning_rate": 1.07819450930511e-06, "loss": 1.0067, "step": 37197 }, { "epoch": 0.7, "learning_rate": 1.0780688577749048e-06, "loss": 1.0011, "step": 37198 }, { "epoch": 0.7, "learning_rate": 1.0779432115541472e-06, "loss": 0.978, "step": 37199 }, { "epoch": 0.7, "learning_rate": 1.077817570643306e-06, "loss": 1.1458, "step": 37200 }, { "epoch": 0.7, "learning_rate": 1.0776919350428503e-06, "loss": 0.9982, "step": 37201 }, { "epoch": 0.7, "learning_rate": 1.0775663047532495e-06, "loss": 0.9877, "step": 37202 }, { "epoch": 0.7, "learning_rate": 1.0774406797749724e-06, "loss": 1.0041, "step": 37203 }, { "epoch": 0.7, "learning_rate": 1.0773150601084889e-06, "loss": 0.8159, "step": 37204 }, { "epoch": 0.7, "learning_rate": 1.0771894457542657e-06, "loss": 0.9199, "step": 37205 }, { "epoch": 0.7, "learning_rate": 1.077063836712775e-06, "loss": 1.134, "step": 37206 }, { "epoch": 0.7, "learning_rate": 1.0769382329844837e-06, "loss": 0.9134, "step": 37207 }, { "epoch": 0.7, "learning_rate": 1.0768126345698608e-06, "loss": 0.8514, "step": 37208 }, { "epoch": 0.7, "learning_rate": 1.0766870414693773e-06, "loss": 0.856, "step": 37209 }, { "epoch": 0.7, "learning_rate": 1.0765614536834997e-06, "loss": 0.7925, "step": 37210 }, { "epoch": 0.7, "learning_rate": 1.0764358712126982e-06, "loss": 0.8137, "step": 37211 }, { "epoch": 0.7, "learning_rate": 1.0763102940574416e-06, "loss": 1.0366, "step": 37212 }, { "epoch": 0.7, "learning_rate": 1.0761847222181987e-06, "loss": 0.95, "step": 37213 }, { "epoch": 0.7, "learning_rate": 1.0760591556954383e-06, "loss": 0.9185, "step": 37214 }, { "epoch": 0.7, "learning_rate": 1.0759335944896293e-06, "loss": 0.8796, "step": 37215 }, { "epoch": 0.7, "learning_rate": 1.0758080386012414e-06, "loss": 0.8082, "step": 37216 }, { "epoch": 0.7, "learning_rate": 1.0756824880307413e-06, "loss": 0.782, "step": 37217 }, { "epoch": 0.7, "learning_rate": 1.0755569427786003e-06, "loss": 0.8933, "step": 37218 }, { "epoch": 0.7, "learning_rate": 1.0754314028452856e-06, "loss": 1.0527, "step": 37219 }, { "epoch": 0.7, "learning_rate": 1.075305868231266e-06, "loss": 0.9554, "step": 37220 }, { "epoch": 0.7, "learning_rate": 1.0751803389370109e-06, "loss": 0.9506, "step": 37221 }, { "epoch": 0.7, "learning_rate": 1.0750548149629887e-06, "loss": 0.9047, "step": 37222 }, { "epoch": 0.7, "learning_rate": 1.0749292963096677e-06, "loss": 1.0383, "step": 37223 }, { "epoch": 0.7, "learning_rate": 1.0748037829775175e-06, "loss": 1.0373, "step": 37224 }, { "epoch": 0.7, "learning_rate": 1.0746782749670071e-06, "loss": 0.9738, "step": 37225 }, { "epoch": 0.7, "learning_rate": 1.0745527722786023e-06, "loss": 1.0003, "step": 37226 }, { "epoch": 0.7, "learning_rate": 1.0744272749127757e-06, "loss": 0.6468, "step": 37227 }, { "epoch": 0.7, "learning_rate": 1.0743017828699932e-06, "loss": 1.0297, "step": 37228 }, { "epoch": 0.7, "learning_rate": 1.0741762961507238e-06, "loss": 0.9239, "step": 37229 }, { "epoch": 0.7, "learning_rate": 1.0740508147554366e-06, "loss": 1.0548, "step": 37230 }, { "epoch": 0.7, "learning_rate": 1.0739253386846e-06, "loss": 0.9815, "step": 37231 }, { "epoch": 0.7, "learning_rate": 1.0737998679386832e-06, "loss": 1.0743, "step": 37232 }, { "epoch": 0.7, "learning_rate": 1.0736744025181522e-06, "loss": 0.8684, "step": 37233 }, { "epoch": 0.7, "learning_rate": 1.073548942423478e-06, "loss": 0.81, "step": 37234 }, { "epoch": 0.7, "learning_rate": 1.0734234876551295e-06, "loss": 0.8551, "step": 37235 }, { "epoch": 0.7, "learning_rate": 1.0732980382135718e-06, "loss": 0.7218, "step": 37236 }, { "epoch": 0.7, "learning_rate": 1.0731725940992776e-06, "loss": 1.0638, "step": 37237 }, { "epoch": 0.7, "learning_rate": 1.0730471553127123e-06, "loss": 1.0063, "step": 37238 }, { "epoch": 0.7, "learning_rate": 1.072921721854345e-06, "loss": 0.8722, "step": 37239 }, { "epoch": 0.7, "learning_rate": 1.0727962937246444e-06, "loss": 0.8515, "step": 37240 }, { "epoch": 0.7, "learning_rate": 1.0726708709240785e-06, "loss": 0.8876, "step": 37241 }, { "epoch": 0.7, "learning_rate": 1.072545453453116e-06, "loss": 0.8024, "step": 37242 }, { "epoch": 0.7, "learning_rate": 1.0724200413122249e-06, "loss": 0.9156, "step": 37243 }, { "epoch": 0.7, "learning_rate": 1.0722946345018745e-06, "loss": 0.8859, "step": 37244 }, { "epoch": 0.7, "learning_rate": 1.0721692330225302e-06, "loss": 0.8129, "step": 37245 }, { "epoch": 0.7, "learning_rate": 1.0720438368746645e-06, "loss": 0.8017, "step": 37246 }, { "epoch": 0.7, "learning_rate": 1.071918446058742e-06, "loss": 0.758, "step": 37247 }, { "epoch": 0.7, "learning_rate": 1.0717930605752322e-06, "loss": 0.794, "step": 37248 }, { "epoch": 0.7, "learning_rate": 1.0716676804246035e-06, "loss": 0.9258, "step": 37249 }, { "epoch": 0.7, "learning_rate": 1.0715423056073238e-06, "loss": 1.0323, "step": 37250 }, { "epoch": 0.7, "learning_rate": 1.0714169361238613e-06, "loss": 0.6724, "step": 37251 }, { "epoch": 0.7, "learning_rate": 1.0712915719746845e-06, "loss": 0.7538, "step": 37252 }, { "epoch": 0.7, "learning_rate": 1.0711662131602615e-06, "loss": 0.8105, "step": 37253 }, { "epoch": 0.7, "learning_rate": 1.0710408596810586e-06, "loss": 0.8347, "step": 37254 }, { "epoch": 0.7, "learning_rate": 1.0709155115375464e-06, "loss": 0.8496, "step": 37255 }, { "epoch": 0.7, "learning_rate": 1.0707901687301925e-06, "loss": 1.0144, "step": 37256 }, { "epoch": 0.7, "learning_rate": 1.0706648312594623e-06, "loss": 0.8284, "step": 37257 }, { "epoch": 0.7, "learning_rate": 1.0705394991258278e-06, "loss": 1.0551, "step": 37258 }, { "epoch": 0.7, "learning_rate": 1.0704141723297543e-06, "loss": 0.6781, "step": 37259 }, { "epoch": 0.7, "learning_rate": 1.0702888508717101e-06, "loss": 0.9845, "step": 37260 }, { "epoch": 0.7, "learning_rate": 1.0701635347521636e-06, "loss": 0.8613, "step": 37261 }, { "epoch": 0.7, "learning_rate": 1.0700382239715828e-06, "loss": 1.0375, "step": 37262 }, { "epoch": 0.7, "learning_rate": 1.0699129185304353e-06, "loss": 0.9274, "step": 37263 }, { "epoch": 0.7, "learning_rate": 1.0697876184291891e-06, "loss": 0.8466, "step": 37264 }, { "epoch": 0.7, "learning_rate": 1.069662323668313e-06, "loss": 0.827, "step": 37265 }, { "epoch": 0.7, "learning_rate": 1.0695370342482719e-06, "loss": 0.8763, "step": 37266 }, { "epoch": 0.7, "learning_rate": 1.0694117501695378e-06, "loss": 0.805, "step": 37267 }, { "epoch": 0.7, "learning_rate": 1.0692864714325755e-06, "loss": 1.1771, "step": 37268 }, { "epoch": 0.7, "learning_rate": 1.0691611980378532e-06, "loss": 1.0046, "step": 37269 }, { "epoch": 0.7, "learning_rate": 1.0690359299858395e-06, "loss": 0.8554, "step": 37270 }, { "epoch": 0.7, "learning_rate": 1.0689106672770017e-06, "loss": 0.8564, "step": 37271 }, { "epoch": 0.7, "learning_rate": 1.0687854099118074e-06, "loss": 0.9099, "step": 37272 }, { "epoch": 0.7, "learning_rate": 1.0686601578907246e-06, "loss": 0.9031, "step": 37273 }, { "epoch": 0.7, "learning_rate": 1.0685349112142222e-06, "loss": 0.9922, "step": 37274 }, { "epoch": 0.7, "learning_rate": 1.0684096698827642e-06, "loss": 1.0662, "step": 37275 }, { "epoch": 0.7, "learning_rate": 1.0682844338968217e-06, "loss": 0.7049, "step": 37276 }, { "epoch": 0.7, "learning_rate": 1.0681592032568622e-06, "loss": 0.7209, "step": 37277 }, { "epoch": 0.7, "learning_rate": 1.0680339779633504e-06, "loss": 0.9323, "step": 37278 }, { "epoch": 0.7, "learning_rate": 1.0679087580167577e-06, "loss": 0.6933, "step": 37279 }, { "epoch": 0.7, "learning_rate": 1.0677835434175488e-06, "loss": 1.0198, "step": 37280 }, { "epoch": 0.7, "learning_rate": 1.0676583341661923e-06, "loss": 1.1633, "step": 37281 }, { "epoch": 0.7, "learning_rate": 1.0675331302631556e-06, "loss": 0.9688, "step": 37282 }, { "epoch": 0.7, "learning_rate": 1.0674079317089065e-06, "loss": 0.7993, "step": 37283 }, { "epoch": 0.7, "learning_rate": 1.067282738503912e-06, "loss": 0.7585, "step": 37284 }, { "epoch": 0.7, "learning_rate": 1.0671575506486397e-06, "loss": 0.8456, "step": 37285 }, { "epoch": 0.7, "learning_rate": 1.0670323681435585e-06, "loss": 0.7755, "step": 37286 }, { "epoch": 0.7, "learning_rate": 1.0669071909891324e-06, "loss": 0.9109, "step": 37287 }, { "epoch": 0.7, "learning_rate": 1.0667820191858327e-06, "loss": 1.0053, "step": 37288 }, { "epoch": 0.7, "learning_rate": 1.0666568527341242e-06, "loss": 0.9487, "step": 37289 }, { "epoch": 0.7, "learning_rate": 1.066531691634475e-06, "loss": 0.8748, "step": 37290 }, { "epoch": 0.7, "learning_rate": 1.0664065358873527e-06, "loss": 0.9044, "step": 37291 }, { "epoch": 0.7, "learning_rate": 1.0662813854932243e-06, "loss": 1.027, "step": 37292 }, { "epoch": 0.7, "learning_rate": 1.0661562404525571e-06, "loss": 0.9813, "step": 37293 }, { "epoch": 0.7, "learning_rate": 1.066031100765819e-06, "loss": 1.126, "step": 37294 }, { "epoch": 0.7, "learning_rate": 1.0659059664334772e-06, "loss": 0.891, "step": 37295 }, { "epoch": 0.7, "learning_rate": 1.0657808374559969e-06, "loss": 0.8807, "step": 37296 }, { "epoch": 0.7, "learning_rate": 1.065655713833848e-06, "loss": 0.8397, "step": 37297 }, { "epoch": 0.7, "learning_rate": 1.0655305955674974e-06, "loss": 0.823, "step": 37298 }, { "epoch": 0.7, "learning_rate": 1.06540548265741e-06, "loss": 1.1362, "step": 37299 }, { "epoch": 0.7, "learning_rate": 1.0652803751040564e-06, "loss": 1.1669, "step": 37300 }, { "epoch": 0.7, "learning_rate": 1.0651552729079007e-06, "loss": 0.829, "step": 37301 }, { "epoch": 0.7, "learning_rate": 1.0650301760694111e-06, "loss": 0.8296, "step": 37302 }, { "epoch": 0.7, "learning_rate": 1.064905084589055e-06, "loss": 1.0059, "step": 37303 }, { "epoch": 0.7, "learning_rate": 1.0647799984672996e-06, "loss": 0.7837, "step": 37304 }, { "epoch": 0.7, "learning_rate": 1.0646549177046113e-06, "loss": 1.0281, "step": 37305 }, { "epoch": 0.7, "learning_rate": 1.0645298423014577e-06, "loss": 0.8887, "step": 37306 }, { "epoch": 0.7, "learning_rate": 1.0644047722583068e-06, "loss": 0.9159, "step": 37307 }, { "epoch": 0.7, "learning_rate": 1.0642797075756223e-06, "loss": 1.0355, "step": 37308 }, { "epoch": 0.7, "learning_rate": 1.0641546482538754e-06, "loss": 0.7573, "step": 37309 }, { "epoch": 0.7, "learning_rate": 1.06402959429353e-06, "loss": 0.8329, "step": 37310 }, { "epoch": 0.7, "learning_rate": 1.0639045456950538e-06, "loss": 0.7833, "step": 37311 }, { "epoch": 0.7, "learning_rate": 1.0637795024589143e-06, "loss": 0.9923, "step": 37312 }, { "epoch": 0.7, "learning_rate": 1.063654464585578e-06, "loss": 1.0887, "step": 37313 }, { "epoch": 0.7, "learning_rate": 1.063529432075512e-06, "loss": 0.7636, "step": 37314 }, { "epoch": 0.7, "learning_rate": 1.063404404929183e-06, "loss": 0.9091, "step": 37315 }, { "epoch": 0.7, "learning_rate": 1.0632793831470586e-06, "loss": 0.8498, "step": 37316 }, { "epoch": 0.7, "learning_rate": 1.0631543667296036e-06, "loss": 0.8564, "step": 37317 }, { "epoch": 0.7, "learning_rate": 1.0630293556772866e-06, "loss": 0.9867, "step": 37318 }, { "epoch": 0.7, "learning_rate": 1.062904349990575e-06, "loss": 1.132, "step": 37319 }, { "epoch": 0.7, "learning_rate": 1.0627793496699327e-06, "loss": 0.7128, "step": 37320 }, { "epoch": 0.7, "learning_rate": 1.0626543547158299e-06, "loss": 0.9418, "step": 37321 }, { "epoch": 0.7, "learning_rate": 1.0625293651287311e-06, "loss": 0.7053, "step": 37322 }, { "epoch": 0.7, "learning_rate": 1.0624043809091033e-06, "loss": 0.8791, "step": 37323 }, { "epoch": 0.7, "learning_rate": 1.0622794020574136e-06, "loss": 1.1953, "step": 37324 }, { "epoch": 0.7, "learning_rate": 1.0621544285741283e-06, "loss": 1.1398, "step": 37325 }, { "epoch": 0.7, "learning_rate": 1.0620294604597145e-06, "loss": 0.9714, "step": 37326 }, { "epoch": 0.7, "learning_rate": 1.0619044977146386e-06, "loss": 0.826, "step": 37327 }, { "epoch": 0.7, "learning_rate": 1.0617795403393682e-06, "loss": 0.9631, "step": 37328 }, { "epoch": 0.7, "learning_rate": 1.0616545883343668e-06, "loss": 0.8146, "step": 37329 }, { "epoch": 0.7, "learning_rate": 1.061529641700105e-06, "loss": 1.0629, "step": 37330 }, { "epoch": 0.7, "learning_rate": 1.0614047004370468e-06, "loss": 1.0332, "step": 37331 }, { "epoch": 0.7, "learning_rate": 1.061279764545659e-06, "loss": 1.1271, "step": 37332 }, { "epoch": 0.7, "learning_rate": 1.0611548340264085e-06, "loss": 0.9454, "step": 37333 }, { "epoch": 0.7, "learning_rate": 1.0610299088797618e-06, "loss": 1.0052, "step": 37334 }, { "epoch": 0.7, "learning_rate": 1.0609049891061852e-06, "loss": 0.858, "step": 37335 }, { "epoch": 0.7, "learning_rate": 1.0607800747061453e-06, "loss": 0.8164, "step": 37336 }, { "epoch": 0.7, "learning_rate": 1.0606551656801096e-06, "loss": 0.9053, "step": 37337 }, { "epoch": 0.7, "learning_rate": 1.0605302620285413e-06, "loss": 1.0693, "step": 37338 }, { "epoch": 0.7, "learning_rate": 1.0604053637519096e-06, "loss": 0.8056, "step": 37339 }, { "epoch": 0.7, "learning_rate": 1.0602804708506815e-06, "loss": 1.0442, "step": 37340 }, { "epoch": 0.7, "learning_rate": 1.06015558332532e-06, "loss": 0.6798, "step": 37341 }, { "epoch": 0.7, "learning_rate": 1.060030701176295e-06, "loss": 0.9897, "step": 37342 }, { "epoch": 0.7, "learning_rate": 1.0599058244040705e-06, "loss": 0.866, "step": 37343 }, { "epoch": 0.7, "learning_rate": 1.0597809530091135e-06, "loss": 0.8361, "step": 37344 }, { "epoch": 0.7, "learning_rate": 1.0596560869918901e-06, "loss": 0.8306, "step": 37345 }, { "epoch": 0.7, "learning_rate": 1.0595312263528667e-06, "loss": 0.9196, "step": 37346 }, { "epoch": 0.7, "learning_rate": 1.0594063710925099e-06, "loss": 0.5832, "step": 37347 }, { "epoch": 0.7, "learning_rate": 1.0592815212112853e-06, "loss": 0.6046, "step": 37348 }, { "epoch": 0.7, "learning_rate": 1.0591566767096604e-06, "loss": 1.129, "step": 37349 }, { "epoch": 0.7, "learning_rate": 1.059031837588098e-06, "loss": 1.1948, "step": 37350 }, { "epoch": 0.7, "learning_rate": 1.058907003847069e-06, "loss": 0.9339, "step": 37351 }, { "epoch": 0.7, "learning_rate": 1.0587821754870356e-06, "loss": 0.8992, "step": 37352 }, { "epoch": 0.7, "learning_rate": 1.0586573525084656e-06, "loss": 1.0253, "step": 37353 }, { "epoch": 0.7, "learning_rate": 1.058532534911825e-06, "loss": 0.8442, "step": 37354 }, { "epoch": 0.7, "learning_rate": 1.0584077226975794e-06, "loss": 0.85, "step": 37355 }, { "epoch": 0.7, "learning_rate": 1.0582829158661952e-06, "loss": 1.0043, "step": 37356 }, { "epoch": 0.7, "learning_rate": 1.0581581144181389e-06, "loss": 1.0078, "step": 37357 }, { "epoch": 0.7, "learning_rate": 1.0580333183538762e-06, "loss": 0.9574, "step": 37358 }, { "epoch": 0.7, "learning_rate": 1.0579085276738714e-06, "loss": 0.7676, "step": 37359 }, { "epoch": 0.7, "learning_rate": 1.057783742378593e-06, "loss": 0.7742, "step": 37360 }, { "epoch": 0.7, "learning_rate": 1.0576589624685065e-06, "loss": 0.8766, "step": 37361 }, { "epoch": 0.7, "learning_rate": 1.0575341879440757e-06, "loss": 0.7323, "step": 37362 }, { "epoch": 0.7, "learning_rate": 1.0574094188057696e-06, "loss": 1.1353, "step": 37363 }, { "epoch": 0.7, "learning_rate": 1.0572846550540517e-06, "loss": 1.0153, "step": 37364 }, { "epoch": 0.7, "learning_rate": 1.0571598966893885e-06, "loss": 0.8771, "step": 37365 }, { "epoch": 0.7, "learning_rate": 1.0570351437122462e-06, "loss": 0.8203, "step": 37366 }, { "epoch": 0.7, "learning_rate": 1.0569103961230904e-06, "loss": 0.9508, "step": 37367 }, { "epoch": 0.71, "learning_rate": 1.0567856539223866e-06, "loss": 0.9372, "step": 37368 }, { "epoch": 0.71, "learning_rate": 1.0566609171106013e-06, "loss": 1.0003, "step": 37369 }, { "epoch": 0.71, "learning_rate": 1.0565361856882005e-06, "loss": 0.8701, "step": 37370 }, { "epoch": 0.71, "learning_rate": 1.0564114596556479e-06, "loss": 0.8032, "step": 37371 }, { "epoch": 0.71, "learning_rate": 1.0562867390134124e-06, "loss": 0.7892, "step": 37372 }, { "epoch": 0.71, "learning_rate": 1.0561620237619569e-06, "loss": 0.9253, "step": 37373 }, { "epoch": 0.71, "learning_rate": 1.056037313901748e-06, "loss": 1.1345, "step": 37374 }, { "epoch": 0.71, "learning_rate": 1.0559126094332517e-06, "loss": 1.1095, "step": 37375 }, { "epoch": 0.71, "learning_rate": 1.0557879103569332e-06, "loss": 0.7409, "step": 37376 }, { "epoch": 0.71, "learning_rate": 1.0556632166732585e-06, "loss": 0.8229, "step": 37377 }, { "epoch": 0.71, "learning_rate": 1.0555385283826932e-06, "loss": 0.7751, "step": 37378 }, { "epoch": 0.71, "learning_rate": 1.0554138454857035e-06, "loss": 0.7472, "step": 37379 }, { "epoch": 0.71, "learning_rate": 1.0552891679827527e-06, "loss": 0.9276, "step": 37380 }, { "epoch": 0.71, "learning_rate": 1.0551644958743084e-06, "loss": 0.9737, "step": 37381 }, { "epoch": 0.71, "learning_rate": 1.0550398291608365e-06, "loss": 0.9899, "step": 37382 }, { "epoch": 0.71, "learning_rate": 1.0549151678427998e-06, "loss": 0.882, "step": 37383 }, { "epoch": 0.71, "learning_rate": 1.0547905119206675e-06, "loss": 0.954, "step": 37384 }, { "epoch": 0.71, "learning_rate": 1.054665861394902e-06, "loss": 0.946, "step": 37385 }, { "epoch": 0.71, "learning_rate": 1.05454121626597e-06, "loss": 0.7966, "step": 37386 }, { "epoch": 0.71, "learning_rate": 1.054416576534337e-06, "loss": 1.2449, "step": 37387 }, { "epoch": 0.71, "learning_rate": 1.054291942200468e-06, "loss": 1.0282, "step": 37388 }, { "epoch": 0.71, "learning_rate": 1.0541673132648284e-06, "loss": 1.0825, "step": 37389 }, { "epoch": 0.71, "learning_rate": 1.0540426897278837e-06, "loss": 0.801, "step": 37390 }, { "epoch": 0.71, "learning_rate": 1.0539180715901003e-06, "loss": 0.8304, "step": 37391 }, { "epoch": 0.71, "learning_rate": 1.0537934588519408e-06, "loss": 0.6265, "step": 37392 }, { "epoch": 0.71, "learning_rate": 1.0536688515138739e-06, "loss": 1.0252, "step": 37393 }, { "epoch": 0.71, "learning_rate": 1.0535442495763624e-06, "loss": 1.1142, "step": 37394 }, { "epoch": 0.71, "learning_rate": 1.053419653039872e-06, "loss": 0.9572, "step": 37395 }, { "epoch": 0.71, "learning_rate": 1.0532950619048685e-06, "loss": 0.9489, "step": 37396 }, { "epoch": 0.71, "learning_rate": 1.0531704761718168e-06, "loss": 0.8198, "step": 37397 }, { "epoch": 0.71, "learning_rate": 1.0530458958411821e-06, "loss": 0.8375, "step": 37398 }, { "epoch": 0.71, "learning_rate": 1.0529213209134295e-06, "loss": 0.9233, "step": 37399 }, { "epoch": 0.71, "learning_rate": 1.0527967513890256e-06, "loss": 1.0098, "step": 37400 }, { "epoch": 0.71, "learning_rate": 1.0526721872684323e-06, "loss": 0.9313, "step": 37401 }, { "epoch": 0.71, "learning_rate": 1.0525476285521177e-06, "loss": 0.8927, "step": 37402 }, { "epoch": 0.71, "learning_rate": 1.0524230752405466e-06, "loss": 0.8692, "step": 37403 }, { "epoch": 0.71, "learning_rate": 1.0522985273341815e-06, "loss": 0.8424, "step": 37404 }, { "epoch": 0.71, "learning_rate": 1.0521739848334914e-06, "loss": 1.0425, "step": 37405 }, { "epoch": 0.71, "learning_rate": 1.0520494477389382e-06, "loss": 1.1866, "step": 37406 }, { "epoch": 0.71, "learning_rate": 1.0519249160509878e-06, "loss": 1.033, "step": 37407 }, { "epoch": 0.71, "learning_rate": 1.0518003897701057e-06, "loss": 0.8116, "step": 37408 }, { "epoch": 0.71, "learning_rate": 1.0516758688967563e-06, "loss": 0.9622, "step": 37409 }, { "epoch": 0.71, "learning_rate": 1.0515513534314047e-06, "loss": 0.969, "step": 37410 }, { "epoch": 0.71, "learning_rate": 1.0514268433745161e-06, "loss": 0.799, "step": 37411 }, { "epoch": 0.71, "learning_rate": 1.051302338726556e-06, "loss": 1.0158, "step": 37412 }, { "epoch": 0.71, "learning_rate": 1.051177839487987e-06, "loss": 1.0282, "step": 37413 }, { "epoch": 0.71, "learning_rate": 1.0510533456592773e-06, "loss": 0.8735, "step": 37414 }, { "epoch": 0.71, "learning_rate": 1.0509288572408891e-06, "loss": 0.957, "step": 37415 }, { "epoch": 0.71, "learning_rate": 1.050804374233288e-06, "loss": 0.7479, "step": 37416 }, { "epoch": 0.71, "learning_rate": 1.0506798966369388e-06, "loss": 0.8586, "step": 37417 }, { "epoch": 0.71, "learning_rate": 1.0505554244523067e-06, "loss": 0.7814, "step": 37418 }, { "epoch": 0.71, "learning_rate": 1.050430957679856e-06, "loss": 1.0217, "step": 37419 }, { "epoch": 0.71, "learning_rate": 1.0503064963200518e-06, "loss": 0.8538, "step": 37420 }, { "epoch": 0.71, "learning_rate": 1.0501820403733596e-06, "loss": 0.653, "step": 37421 }, { "epoch": 0.71, "learning_rate": 1.0500575898402413e-06, "loss": 0.7754, "step": 37422 }, { "epoch": 0.71, "learning_rate": 1.0499331447211643e-06, "loss": 0.7817, "step": 37423 }, { "epoch": 0.71, "learning_rate": 1.0498087050165936e-06, "loss": 1.1065, "step": 37424 }, { "epoch": 0.71, "learning_rate": 1.0496842707269908e-06, "loss": 0.8774, "step": 37425 }, { "epoch": 0.71, "learning_rate": 1.0495598418528243e-06, "loss": 0.8059, "step": 37426 }, { "epoch": 0.71, "learning_rate": 1.049435418394556e-06, "loss": 0.8736, "step": 37427 }, { "epoch": 0.71, "learning_rate": 1.0493110003526513e-06, "loss": 0.7658, "step": 37428 }, { "epoch": 0.71, "learning_rate": 1.049186587727575e-06, "loss": 0.9164, "step": 37429 }, { "epoch": 0.71, "learning_rate": 1.0490621805197914e-06, "loss": 0.9155, "step": 37430 }, { "epoch": 0.71, "learning_rate": 1.0489377787297653e-06, "loss": 0.7826, "step": 37431 }, { "epoch": 0.71, "learning_rate": 1.0488133823579609e-06, "loss": 0.8466, "step": 37432 }, { "epoch": 0.71, "learning_rate": 1.0486889914048436e-06, "loss": 0.7444, "step": 37433 }, { "epoch": 0.71, "learning_rate": 1.0485646058708755e-06, "loss": 0.8408, "step": 37434 }, { "epoch": 0.71, "learning_rate": 1.0484402257565244e-06, "loss": 0.848, "step": 37435 }, { "epoch": 0.71, "learning_rate": 1.048315851062252e-06, "loss": 0.9684, "step": 37436 }, { "epoch": 0.71, "learning_rate": 1.0481914817885238e-06, "loss": 1.0803, "step": 37437 }, { "epoch": 0.71, "learning_rate": 1.048067117935804e-06, "loss": 1.0263, "step": 37438 }, { "epoch": 0.71, "learning_rate": 1.0479427595045571e-06, "loss": 0.9605, "step": 37439 }, { "epoch": 0.71, "learning_rate": 1.0478184064952477e-06, "loss": 0.7937, "step": 37440 }, { "epoch": 0.71, "learning_rate": 1.0476940589083395e-06, "loss": 0.8918, "step": 37441 }, { "epoch": 0.71, "learning_rate": 1.047569716744298e-06, "loss": 0.8429, "step": 37442 }, { "epoch": 0.71, "learning_rate": 1.0474453800035853e-06, "loss": 1.0777, "step": 37443 }, { "epoch": 0.71, "learning_rate": 1.0473210486866674e-06, "loss": 0.938, "step": 37444 }, { "epoch": 0.71, "learning_rate": 1.0471967227940094e-06, "loss": 0.7823, "step": 37445 }, { "epoch": 0.71, "learning_rate": 1.0470724023260723e-06, "loss": 0.8981, "step": 37446 }, { "epoch": 0.71, "learning_rate": 1.0469480872833244e-06, "loss": 1.0356, "step": 37447 }, { "epoch": 0.71, "learning_rate": 1.0468237776662266e-06, "loss": 0.7163, "step": 37448 }, { "epoch": 0.71, "learning_rate": 1.046699473475244e-06, "loss": 0.8512, "step": 37449 }, { "epoch": 0.71, "learning_rate": 1.0465751747108415e-06, "loss": 1.291, "step": 37450 }, { "epoch": 0.71, "learning_rate": 1.0464508813734825e-06, "loss": 0.9847, "step": 37451 }, { "epoch": 0.71, "learning_rate": 1.0463265934636316e-06, "loss": 0.9736, "step": 37452 }, { "epoch": 0.71, "learning_rate": 1.0462023109817524e-06, "loss": 0.9076, "step": 37453 }, { "epoch": 0.71, "learning_rate": 1.04607803392831e-06, "loss": 0.852, "step": 37454 }, { "epoch": 0.71, "learning_rate": 1.0459537623037661e-06, "loss": 0.9092, "step": 37455 }, { "epoch": 0.71, "learning_rate": 1.045829496108588e-06, "loss": 1.077, "step": 37456 }, { "epoch": 0.71, "learning_rate": 1.045705235343237e-06, "loss": 0.7804, "step": 37457 }, { "epoch": 0.71, "learning_rate": 1.0455809800081781e-06, "loss": 0.9891, "step": 37458 }, { "epoch": 0.71, "learning_rate": 1.0454567301038752e-06, "loss": 0.8428, "step": 37459 }, { "epoch": 0.71, "learning_rate": 1.0453324856307922e-06, "loss": 0.8123, "step": 37460 }, { "epoch": 0.71, "learning_rate": 1.045208246589393e-06, "loss": 0.8841, "step": 37461 }, { "epoch": 0.71, "learning_rate": 1.045084012980142e-06, "loss": 0.8277, "step": 37462 }, { "epoch": 0.71, "learning_rate": 1.0449597848035035e-06, "loss": 0.9473, "step": 37463 }, { "epoch": 0.71, "learning_rate": 1.0448355620599392e-06, "loss": 0.8189, "step": 37464 }, { "epoch": 0.71, "learning_rate": 1.044711344749914e-06, "loss": 0.9621, "step": 37465 }, { "epoch": 0.71, "learning_rate": 1.0445871328738935e-06, "loss": 0.9171, "step": 37466 }, { "epoch": 0.71, "learning_rate": 1.044462926432339e-06, "loss": 0.9949, "step": 37467 }, { "epoch": 0.71, "learning_rate": 1.0443387254257157e-06, "loss": 0.8509, "step": 37468 }, { "epoch": 0.71, "learning_rate": 1.0442145298544868e-06, "loss": 1.1286, "step": 37469 }, { "epoch": 0.71, "learning_rate": 1.044090339719116e-06, "loss": 0.9022, "step": 37470 }, { "epoch": 0.71, "learning_rate": 1.0439661550200675e-06, "loss": 1.0239, "step": 37471 }, { "epoch": 0.71, "learning_rate": 1.0438419757578044e-06, "loss": 0.968, "step": 37472 }, { "epoch": 0.71, "learning_rate": 1.043717801932792e-06, "loss": 0.6398, "step": 37473 }, { "epoch": 0.71, "learning_rate": 1.0435936335454904e-06, "loss": 1.0053, "step": 37474 }, { "epoch": 0.71, "learning_rate": 1.0434694705963678e-06, "loss": 0.9575, "step": 37475 }, { "epoch": 0.71, "learning_rate": 1.0433453130858845e-06, "loss": 0.8757, "step": 37476 }, { "epoch": 0.71, "learning_rate": 1.0432211610145053e-06, "loss": 0.9493, "step": 37477 }, { "epoch": 0.71, "learning_rate": 1.0430970143826933e-06, "loss": 0.8866, "step": 37478 }, { "epoch": 0.71, "learning_rate": 1.0429728731909125e-06, "loss": 0.6998, "step": 37479 }, { "epoch": 0.71, "learning_rate": 1.0428487374396263e-06, "loss": 0.8355, "step": 37480 }, { "epoch": 0.71, "learning_rate": 1.042724607129298e-06, "loss": 1.1508, "step": 37481 }, { "epoch": 0.71, "learning_rate": 1.0426004822603928e-06, "loss": 0.9822, "step": 37482 }, { "epoch": 0.71, "learning_rate": 1.0424763628333703e-06, "loss": 1.0517, "step": 37483 }, { "epoch": 0.71, "learning_rate": 1.0423522488486986e-06, "loss": 1.0092, "step": 37484 }, { "epoch": 0.71, "learning_rate": 1.0422281403068379e-06, "loss": 0.9161, "step": 37485 }, { "epoch": 0.71, "learning_rate": 1.0421040372082516e-06, "loss": 1.0527, "step": 37486 }, { "epoch": 0.71, "learning_rate": 1.0419799395534061e-06, "loss": 0.9956, "step": 37487 }, { "epoch": 0.71, "learning_rate": 1.041855847342762e-06, "loss": 0.9436, "step": 37488 }, { "epoch": 0.71, "learning_rate": 1.0417317605767832e-06, "loss": 0.8919, "step": 37489 }, { "epoch": 0.71, "learning_rate": 1.0416076792559335e-06, "loss": 0.805, "step": 37490 }, { "epoch": 0.71, "learning_rate": 1.0414836033806757e-06, "loss": 0.7522, "step": 37491 }, { "epoch": 0.71, "learning_rate": 1.0413595329514736e-06, "loss": 0.9415, "step": 37492 }, { "epoch": 0.71, "learning_rate": 1.0412354679687906e-06, "loss": 1.0026, "step": 37493 }, { "epoch": 0.71, "learning_rate": 1.04111140843309e-06, "loss": 1.1387, "step": 37494 }, { "epoch": 0.71, "learning_rate": 1.0409873543448332e-06, "loss": 0.8489, "step": 37495 }, { "epoch": 0.71, "learning_rate": 1.0408633057044864e-06, "loss": 0.9196, "step": 37496 }, { "epoch": 0.71, "learning_rate": 1.0407392625125106e-06, "loss": 1.0104, "step": 37497 }, { "epoch": 0.71, "learning_rate": 1.0406152247693696e-06, "loss": 0.9682, "step": 37498 }, { "epoch": 0.71, "learning_rate": 1.0404911924755267e-06, "loss": 0.9775, "step": 37499 }, { "epoch": 0.71, "learning_rate": 1.0403671656314449e-06, "loss": 1.1133, "step": 37500 }, { "epoch": 0.71, "learning_rate": 1.0402431442375875e-06, "loss": 0.9141, "step": 37501 }, { "epoch": 0.71, "learning_rate": 1.040119128294417e-06, "loss": 1.012, "step": 37502 }, { "epoch": 0.71, "learning_rate": 1.039995117802398e-06, "loss": 0.9132, "step": 37503 }, { "epoch": 0.71, "learning_rate": 1.0398711127619909e-06, "loss": 0.7748, "step": 37504 }, { "epoch": 0.71, "learning_rate": 1.039747113173662e-06, "loss": 1.0583, "step": 37505 }, { "epoch": 0.71, "learning_rate": 1.0396231190378713e-06, "loss": 1.113, "step": 37506 }, { "epoch": 0.71, "learning_rate": 1.0394991303550828e-06, "loss": 0.9988, "step": 37507 }, { "epoch": 0.71, "learning_rate": 1.0393751471257612e-06, "loss": 0.6991, "step": 37508 }, { "epoch": 0.71, "learning_rate": 1.039251169350367e-06, "loss": 1.1041, "step": 37509 }, { "epoch": 0.71, "learning_rate": 1.0391271970293645e-06, "loss": 0.9852, "step": 37510 }, { "epoch": 0.71, "learning_rate": 1.039003230163216e-06, "loss": 0.9631, "step": 37511 }, { "epoch": 0.71, "learning_rate": 1.038879268752385e-06, "loss": 1.1403, "step": 37512 }, { "epoch": 0.71, "learning_rate": 1.0387553127973337e-06, "loss": 1.0826, "step": 37513 }, { "epoch": 0.71, "learning_rate": 1.0386313622985253e-06, "loss": 0.8323, "step": 37514 }, { "epoch": 0.71, "learning_rate": 1.0385074172564236e-06, "loss": 0.9473, "step": 37515 }, { "epoch": 0.71, "learning_rate": 1.0383834776714885e-06, "loss": 0.8566, "step": 37516 }, { "epoch": 0.71, "learning_rate": 1.0382595435441864e-06, "loss": 0.9839, "step": 37517 }, { "epoch": 0.71, "learning_rate": 1.0381356148749775e-06, "loss": 1.1187, "step": 37518 }, { "epoch": 0.71, "learning_rate": 1.0380116916643254e-06, "loss": 1.1404, "step": 37519 }, { "epoch": 0.71, "learning_rate": 1.037887773912693e-06, "loss": 1.0074, "step": 37520 }, { "epoch": 0.71, "learning_rate": 1.0377638616205426e-06, "loss": 0.7793, "step": 37521 }, { "epoch": 0.71, "learning_rate": 1.0376399547883373e-06, "loss": 0.7691, "step": 37522 }, { "epoch": 0.71, "learning_rate": 1.0375160534165394e-06, "loss": 0.7883, "step": 37523 }, { "epoch": 0.71, "learning_rate": 1.0373921575056126e-06, "loss": 0.9422, "step": 37524 }, { "epoch": 0.71, "learning_rate": 1.0372682670560168e-06, "loss": 1.0268, "step": 37525 }, { "epoch": 0.71, "learning_rate": 1.0371443820682184e-06, "loss": 1.1557, "step": 37526 }, { "epoch": 0.71, "learning_rate": 1.037020502542677e-06, "loss": 0.9784, "step": 37527 }, { "epoch": 0.71, "learning_rate": 1.0368966284798554e-06, "loss": 1.0739, "step": 37528 }, { "epoch": 0.71, "learning_rate": 1.0367727598802188e-06, "loss": 0.7445, "step": 37529 }, { "epoch": 0.71, "learning_rate": 1.0366488967442267e-06, "loss": 0.65, "step": 37530 }, { "epoch": 0.71, "learning_rate": 1.036525039072343e-06, "loss": 0.9097, "step": 37531 }, { "epoch": 0.71, "learning_rate": 1.0364011868650299e-06, "loss": 0.9286, "step": 37532 }, { "epoch": 0.71, "learning_rate": 1.0362773401227496e-06, "loss": 0.7383, "step": 37533 }, { "epoch": 0.71, "learning_rate": 1.036153498845965e-06, "loss": 0.7224, "step": 37534 }, { "epoch": 0.71, "learning_rate": 1.0360296630351386e-06, "loss": 0.8166, "step": 37535 }, { "epoch": 0.71, "learning_rate": 1.0359058326907332e-06, "loss": 1.1417, "step": 37536 }, { "epoch": 0.71, "learning_rate": 1.035782007813209e-06, "loss": 1.1254, "step": 37537 }, { "epoch": 0.71, "learning_rate": 1.0356581884030312e-06, "loss": 1.0176, "step": 37538 }, { "epoch": 0.71, "learning_rate": 1.0355343744606602e-06, "loss": 0.9091, "step": 37539 }, { "epoch": 0.71, "learning_rate": 1.035410565986559e-06, "loss": 0.7901, "step": 37540 }, { "epoch": 0.71, "learning_rate": 1.0352867629811897e-06, "loss": 0.686, "step": 37541 }, { "epoch": 0.71, "learning_rate": 1.0351629654450149e-06, "loss": 0.9388, "step": 37542 }, { "epoch": 0.71, "learning_rate": 1.0350391733784964e-06, "loss": 0.838, "step": 37543 }, { "epoch": 0.71, "learning_rate": 1.0349153867820972e-06, "loss": 0.786, "step": 37544 }, { "epoch": 0.71, "learning_rate": 1.0347916056562796e-06, "loss": 1.0572, "step": 37545 }, { "epoch": 0.71, "learning_rate": 1.0346678300015035e-06, "loss": 0.8997, "step": 37546 }, { "epoch": 0.71, "learning_rate": 1.0345440598182343e-06, "loss": 0.9063, "step": 37547 }, { "epoch": 0.71, "learning_rate": 1.034420295106932e-06, "loss": 0.7274, "step": 37548 }, { "epoch": 0.71, "learning_rate": 1.0342965358680584e-06, "loss": 1.0528, "step": 37549 }, { "epoch": 0.71, "learning_rate": 1.0341727821020786e-06, "loss": 1.109, "step": 37550 }, { "epoch": 0.71, "learning_rate": 1.0340490338094516e-06, "loss": 0.7916, "step": 37551 }, { "epoch": 0.71, "learning_rate": 1.0339252909906406e-06, "loss": 0.9113, "step": 37552 }, { "epoch": 0.71, "learning_rate": 1.0338015536461076e-06, "loss": 0.9153, "step": 37553 }, { "epoch": 0.71, "learning_rate": 1.0336778217763147e-06, "loss": 0.9838, "step": 37554 }, { "epoch": 0.71, "learning_rate": 1.0335540953817238e-06, "loss": 1.3328, "step": 37555 }, { "epoch": 0.71, "learning_rate": 1.0334303744627968e-06, "loss": 0.979, "step": 37556 }, { "epoch": 0.71, "learning_rate": 1.033306659019997e-06, "loss": 0.8182, "step": 37557 }, { "epoch": 0.71, "learning_rate": 1.0331829490537832e-06, "loss": 0.7649, "step": 37558 }, { "epoch": 0.71, "learning_rate": 1.0330592445646212e-06, "loss": 0.9312, "step": 37559 }, { "epoch": 0.71, "learning_rate": 1.03293554555297e-06, "loss": 0.9709, "step": 37560 }, { "epoch": 0.71, "learning_rate": 1.0328118520192925e-06, "loss": 0.9935, "step": 37561 }, { "epoch": 0.71, "learning_rate": 1.0326881639640508e-06, "loss": 1.0619, "step": 37562 }, { "epoch": 0.71, "learning_rate": 1.0325644813877061e-06, "loss": 0.9709, "step": 37563 }, { "epoch": 0.71, "learning_rate": 1.0324408042907208e-06, "loss": 0.7661, "step": 37564 }, { "epoch": 0.71, "learning_rate": 1.0323171326735567e-06, "loss": 0.8429, "step": 37565 }, { "epoch": 0.71, "learning_rate": 1.0321934665366761e-06, "loss": 0.8898, "step": 37566 }, { "epoch": 0.71, "learning_rate": 1.0320698058805385e-06, "loss": 0.8941, "step": 37567 }, { "epoch": 0.71, "learning_rate": 1.0319461507056089e-06, "loss": 0.9861, "step": 37568 }, { "epoch": 0.71, "learning_rate": 1.0318225010123464e-06, "loss": 0.838, "step": 37569 }, { "epoch": 0.71, "learning_rate": 1.031698856801213e-06, "loss": 0.9648, "step": 37570 }, { "epoch": 0.71, "learning_rate": 1.0315752180726726e-06, "loss": 0.8474, "step": 37571 }, { "epoch": 0.71, "learning_rate": 1.0314515848271843e-06, "loss": 0.864, "step": 37572 }, { "epoch": 0.71, "learning_rate": 1.0313279570652112e-06, "loss": 0.9522, "step": 37573 }, { "epoch": 0.71, "learning_rate": 1.0312043347872142e-06, "loss": 1.036, "step": 37574 }, { "epoch": 0.71, "learning_rate": 1.0310807179936552e-06, "loss": 0.9817, "step": 37575 }, { "epoch": 0.71, "learning_rate": 1.0309571066849958e-06, "loss": 0.8747, "step": 37576 }, { "epoch": 0.71, "learning_rate": 1.0308335008616975e-06, "loss": 0.7955, "step": 37577 }, { "epoch": 0.71, "learning_rate": 1.030709900524223e-06, "loss": 0.9762, "step": 37578 }, { "epoch": 0.71, "learning_rate": 1.0305863056730307e-06, "loss": 0.6916, "step": 37579 }, { "epoch": 0.71, "learning_rate": 1.0304627163085857e-06, "loss": 1.0986, "step": 37580 }, { "epoch": 0.71, "learning_rate": 1.0303391324313473e-06, "loss": 1.1575, "step": 37581 }, { "epoch": 0.71, "learning_rate": 1.0302155540417771e-06, "loss": 1.0802, "step": 37582 }, { "epoch": 0.71, "learning_rate": 1.030091981140337e-06, "loss": 1.1211, "step": 37583 }, { "epoch": 0.71, "learning_rate": 1.0299684137274888e-06, "loss": 0.7787, "step": 37584 }, { "epoch": 0.71, "learning_rate": 1.0298448518036933e-06, "loss": 1.0652, "step": 37585 }, { "epoch": 0.71, "learning_rate": 1.029721295369412e-06, "loss": 0.8231, "step": 37586 }, { "epoch": 0.71, "learning_rate": 1.0295977444251071e-06, "loss": 1.1409, "step": 37587 }, { "epoch": 0.71, "learning_rate": 1.0294741989712373e-06, "loss": 0.8846, "step": 37588 }, { "epoch": 0.71, "learning_rate": 1.0293506590082678e-06, "loss": 0.9379, "step": 37589 }, { "epoch": 0.71, "learning_rate": 1.0292271245366567e-06, "loss": 0.8571, "step": 37590 }, { "epoch": 0.71, "learning_rate": 1.0291035955568658e-06, "loss": 0.8351, "step": 37591 }, { "epoch": 0.71, "learning_rate": 1.0289800720693586e-06, "loss": 0.8433, "step": 37592 }, { "epoch": 0.71, "learning_rate": 1.0288565540745937e-06, "loss": 1.026, "step": 37593 }, { "epoch": 0.71, "learning_rate": 1.0287330415730333e-06, "loss": 0.9326, "step": 37594 }, { "epoch": 0.71, "learning_rate": 1.0286095345651387e-06, "loss": 1.0209, "step": 37595 }, { "epoch": 0.71, "learning_rate": 1.0284860330513713e-06, "loss": 0.8049, "step": 37596 }, { "epoch": 0.71, "learning_rate": 1.0283625370321914e-06, "loss": 0.8365, "step": 37597 }, { "epoch": 0.71, "learning_rate": 1.028239046508061e-06, "loss": 0.807, "step": 37598 }, { "epoch": 0.71, "learning_rate": 1.0281155614794416e-06, "loss": 0.8829, "step": 37599 }, { "epoch": 0.71, "learning_rate": 1.027992081946792e-06, "loss": 0.8514, "step": 37600 }, { "epoch": 0.71, "learning_rate": 1.0278686079105766e-06, "loss": 0.8601, "step": 37601 }, { "epoch": 0.71, "learning_rate": 1.0277451393712538e-06, "loss": 1.0114, "step": 37602 }, { "epoch": 0.71, "learning_rate": 1.027621676329285e-06, "loss": 0.8902, "step": 37603 }, { "epoch": 0.71, "learning_rate": 1.0274982187851324e-06, "loss": 0.8713, "step": 37604 }, { "epoch": 0.71, "learning_rate": 1.027374766739256e-06, "loss": 0.8936, "step": 37605 }, { "epoch": 0.71, "learning_rate": 1.0272513201921171e-06, "loss": 1.279, "step": 37606 }, { "epoch": 0.71, "learning_rate": 1.0271278791441765e-06, "loss": 0.8772, "step": 37607 }, { "epoch": 0.71, "learning_rate": 1.0270044435958964e-06, "loss": 0.8377, "step": 37608 }, { "epoch": 0.71, "learning_rate": 1.0268810135477344e-06, "loss": 0.9378, "step": 37609 }, { "epoch": 0.71, "learning_rate": 1.0267575890001557e-06, "loss": 0.8879, "step": 37610 }, { "epoch": 0.71, "learning_rate": 1.0266341699536179e-06, "loss": 0.9878, "step": 37611 }, { "epoch": 0.71, "learning_rate": 1.0265107564085819e-06, "loss": 0.9341, "step": 37612 }, { "epoch": 0.71, "learning_rate": 1.0263873483655115e-06, "loss": 0.8961, "step": 37613 }, { "epoch": 0.71, "learning_rate": 1.0262639458248646e-06, "loss": 0.9577, "step": 37614 }, { "epoch": 0.71, "learning_rate": 1.0261405487871032e-06, "loss": 0.8859, "step": 37615 }, { "epoch": 0.71, "learning_rate": 1.0260171572526876e-06, "loss": 0.844, "step": 37616 }, { "epoch": 0.71, "learning_rate": 1.0258937712220786e-06, "loss": 0.9104, "step": 37617 }, { "epoch": 0.71, "learning_rate": 1.0257703906957373e-06, "loss": 0.8636, "step": 37618 }, { "epoch": 0.71, "learning_rate": 1.025647015674124e-06, "loss": 1.136, "step": 37619 }, { "epoch": 0.71, "learning_rate": 1.0255236461577006e-06, "loss": 0.9758, "step": 37620 }, { "epoch": 0.71, "learning_rate": 1.0254002821469248e-06, "loss": 0.9158, "step": 37621 }, { "epoch": 0.71, "learning_rate": 1.0252769236422608e-06, "loss": 0.8317, "step": 37622 }, { "epoch": 0.71, "learning_rate": 1.0251535706441667e-06, "loss": 0.6709, "step": 37623 }, { "epoch": 0.71, "learning_rate": 1.0250302231531041e-06, "loss": 1.0361, "step": 37624 }, { "epoch": 0.71, "learning_rate": 1.0249068811695334e-06, "loss": 1.118, "step": 37625 }, { "epoch": 0.71, "learning_rate": 1.0247835446939154e-06, "loss": 0.798, "step": 37626 }, { "epoch": 0.71, "learning_rate": 1.0246602137267101e-06, "loss": 0.9539, "step": 37627 }, { "epoch": 0.71, "learning_rate": 1.0245368882683782e-06, "loss": 0.8222, "step": 37628 }, { "epoch": 0.71, "learning_rate": 1.0244135683193816e-06, "loss": 0.846, "step": 37629 }, { "epoch": 0.71, "learning_rate": 1.0242902538801775e-06, "loss": 0.8752, "step": 37630 }, { "epoch": 0.71, "learning_rate": 1.02416694495123e-06, "loss": 1.2214, "step": 37631 }, { "epoch": 0.71, "learning_rate": 1.024043641532997e-06, "loss": 0.8942, "step": 37632 }, { "epoch": 0.71, "learning_rate": 1.023920343625939e-06, "loss": 0.6299, "step": 37633 }, { "epoch": 0.71, "learning_rate": 1.023797051230519e-06, "loss": 0.9371, "step": 37634 }, { "epoch": 0.71, "learning_rate": 1.0236737643471947e-06, "loss": 0.8946, "step": 37635 }, { "epoch": 0.71, "learning_rate": 1.0235504829764274e-06, "loss": 0.9836, "step": 37636 }, { "epoch": 0.71, "learning_rate": 1.023427207118677e-06, "loss": 1.1545, "step": 37637 }, { "epoch": 0.71, "learning_rate": 1.0233039367744044e-06, "loss": 1.0914, "step": 37638 }, { "epoch": 0.71, "learning_rate": 1.0231806719440693e-06, "loss": 0.7649, "step": 37639 }, { "epoch": 0.71, "learning_rate": 1.0230574126281326e-06, "loss": 0.9264, "step": 37640 }, { "epoch": 0.71, "learning_rate": 1.022934158827055e-06, "loss": 0.855, "step": 37641 }, { "epoch": 0.71, "learning_rate": 1.0228109105412942e-06, "loss": 0.8512, "step": 37642 }, { "epoch": 0.71, "learning_rate": 1.0226876677713141e-06, "loss": 0.9695, "step": 37643 }, { "epoch": 0.71, "learning_rate": 1.022564430517572e-06, "loss": 1.0148, "step": 37644 }, { "epoch": 0.71, "learning_rate": 1.0224411987805289e-06, "loss": 0.8252, "step": 37645 }, { "epoch": 0.71, "learning_rate": 1.0223179725606449e-06, "loss": 0.9059, "step": 37646 }, { "epoch": 0.71, "learning_rate": 1.0221947518583805e-06, "loss": 0.839, "step": 37647 }, { "epoch": 0.71, "learning_rate": 1.0220715366741957e-06, "loss": 0.8414, "step": 37648 }, { "epoch": 0.71, "learning_rate": 1.0219483270085504e-06, "loss": 0.7585, "step": 37649 }, { "epoch": 0.71, "learning_rate": 1.0218251228619055e-06, "loss": 0.9391, "step": 37650 }, { "epoch": 0.71, "learning_rate": 1.0217019242347184e-06, "loss": 1.0498, "step": 37651 }, { "epoch": 0.71, "learning_rate": 1.021578731127453e-06, "loss": 0.9734, "step": 37652 }, { "epoch": 0.71, "learning_rate": 1.0214555435405665e-06, "loss": 0.8326, "step": 37653 }, { "epoch": 0.71, "learning_rate": 1.0213323614745185e-06, "loss": 0.9781, "step": 37654 }, { "epoch": 0.71, "learning_rate": 1.0212091849297721e-06, "loss": 0.877, "step": 37655 }, { "epoch": 0.71, "learning_rate": 1.0210860139067842e-06, "loss": 1.1852, "step": 37656 }, { "epoch": 0.71, "learning_rate": 1.0209628484060159e-06, "loss": 0.9219, "step": 37657 }, { "epoch": 0.71, "learning_rate": 1.0208396884279268e-06, "loss": 0.7704, "step": 37658 }, { "epoch": 0.71, "learning_rate": 1.0207165339729772e-06, "loss": 0.8806, "step": 37659 }, { "epoch": 0.71, "learning_rate": 1.0205933850416266e-06, "loss": 0.8722, "step": 37660 }, { "epoch": 0.71, "learning_rate": 1.0204702416343349e-06, "loss": 0.995, "step": 37661 }, { "epoch": 0.71, "learning_rate": 1.0203471037515627e-06, "loss": 0.9453, "step": 37662 }, { "epoch": 0.71, "learning_rate": 1.0202239713937676e-06, "loss": 0.7724, "step": 37663 }, { "epoch": 0.71, "learning_rate": 1.0201008445614125e-06, "loss": 0.6974, "step": 37664 }, { "epoch": 0.71, "learning_rate": 1.0199777232549545e-06, "loss": 1.0444, "step": 37665 }, { "epoch": 0.71, "learning_rate": 1.0198546074748545e-06, "loss": 0.9261, "step": 37666 }, { "epoch": 0.71, "learning_rate": 1.0197314972215717e-06, "loss": 0.6841, "step": 37667 }, { "epoch": 0.71, "learning_rate": 1.0196083924955663e-06, "loss": 0.9624, "step": 37668 }, { "epoch": 0.71, "learning_rate": 1.0194852932972976e-06, "loss": 1.0189, "step": 37669 }, { "epoch": 0.71, "learning_rate": 1.0193621996272255e-06, "loss": 0.8827, "step": 37670 }, { "epoch": 0.71, "learning_rate": 1.0192391114858105e-06, "loss": 0.8615, "step": 37671 }, { "epoch": 0.71, "learning_rate": 1.0191160288735093e-06, "loss": 0.6498, "step": 37672 }, { "epoch": 0.71, "learning_rate": 1.0189929517907856e-06, "loss": 0.839, "step": 37673 }, { "epoch": 0.71, "learning_rate": 1.0188698802380956e-06, "loss": 0.9514, "step": 37674 }, { "epoch": 0.71, "learning_rate": 1.0187468142158992e-06, "loss": 1.0046, "step": 37675 }, { "epoch": 0.71, "learning_rate": 1.0186237537246589e-06, "loss": 1.095, "step": 37676 }, { "epoch": 0.71, "learning_rate": 1.0185006987648308e-06, "loss": 0.9697, "step": 37677 }, { "epoch": 0.71, "learning_rate": 1.0183776493368758e-06, "loss": 0.7731, "step": 37678 }, { "epoch": 0.71, "learning_rate": 1.0182546054412532e-06, "loss": 0.8149, "step": 37679 }, { "epoch": 0.71, "learning_rate": 1.0181315670784224e-06, "loss": 0.9876, "step": 37680 }, { "epoch": 0.71, "learning_rate": 1.018008534248843e-06, "loss": 1.1509, "step": 37681 }, { "epoch": 0.71, "learning_rate": 1.017885506952974e-06, "loss": 0.8907, "step": 37682 }, { "epoch": 0.71, "learning_rate": 1.0177624851912765e-06, "loss": 0.8064, "step": 37683 }, { "epoch": 0.71, "learning_rate": 1.0176394689642064e-06, "loss": 0.9344, "step": 37684 }, { "epoch": 0.71, "learning_rate": 1.0175164582722268e-06, "loss": 0.7337, "step": 37685 }, { "epoch": 0.71, "learning_rate": 1.0173934531157946e-06, "loss": 0.8373, "step": 37686 }, { "epoch": 0.71, "learning_rate": 1.0172704534953695e-06, "loss": 0.9554, "step": 37687 }, { "epoch": 0.71, "learning_rate": 1.0171474594114112e-06, "loss": 1.15, "step": 37688 }, { "epoch": 0.71, "learning_rate": 1.017024470864379e-06, "loss": 0.8776, "step": 37689 }, { "epoch": 0.71, "learning_rate": 1.0169014878547318e-06, "loss": 0.9509, "step": 37690 }, { "epoch": 0.71, "learning_rate": 1.0167785103829287e-06, "loss": 0.7914, "step": 37691 }, { "epoch": 0.71, "learning_rate": 1.0166555384494304e-06, "loss": 0.8372, "step": 37692 }, { "epoch": 0.71, "learning_rate": 1.0165325720546928e-06, "loss": 1.1469, "step": 37693 }, { "epoch": 0.71, "learning_rate": 1.0164096111991791e-06, "loss": 0.9215, "step": 37694 }, { "epoch": 0.71, "learning_rate": 1.0162866558833456e-06, "loss": 0.7783, "step": 37695 }, { "epoch": 0.71, "learning_rate": 1.0161637061076513e-06, "loss": 1.0056, "step": 37696 }, { "epoch": 0.71, "learning_rate": 1.0160407618725577e-06, "loss": 0.9769, "step": 37697 }, { "epoch": 0.71, "learning_rate": 1.015917823178522e-06, "loss": 0.821, "step": 37698 }, { "epoch": 0.71, "learning_rate": 1.0157948900260039e-06, "loss": 1.0718, "step": 37699 }, { "epoch": 0.71, "learning_rate": 1.015671962415461e-06, "loss": 0.8819, "step": 37700 }, { "epoch": 0.71, "learning_rate": 1.0155490403473539e-06, "loss": 0.7574, "step": 37701 }, { "epoch": 0.71, "learning_rate": 1.0154261238221425e-06, "loss": 0.8918, "step": 37702 }, { "epoch": 0.71, "learning_rate": 1.0153032128402824e-06, "loss": 0.8881, "step": 37703 }, { "epoch": 0.71, "learning_rate": 1.0151803074022363e-06, "loss": 0.7892, "step": 37704 }, { "epoch": 0.71, "learning_rate": 1.0150574075084608e-06, "loss": 0.7328, "step": 37705 }, { "epoch": 0.71, "learning_rate": 1.0149345131594152e-06, "loss": 1.1012, "step": 37706 }, { "epoch": 0.71, "learning_rate": 1.0148116243555586e-06, "loss": 0.9807, "step": 37707 }, { "epoch": 0.71, "learning_rate": 1.0146887410973498e-06, "loss": 0.8533, "step": 37708 }, { "epoch": 0.71, "learning_rate": 1.0145658633852479e-06, "loss": 0.8658, "step": 37709 }, { "epoch": 0.71, "learning_rate": 1.0144429912197112e-06, "loss": 0.8588, "step": 37710 }, { "epoch": 0.71, "learning_rate": 1.0143201246012e-06, "loss": 0.9233, "step": 37711 }, { "epoch": 0.71, "learning_rate": 1.01419726353017e-06, "loss": 0.8762, "step": 37712 }, { "epoch": 0.71, "learning_rate": 1.0140744080070838e-06, "loss": 0.9429, "step": 37713 }, { "epoch": 0.71, "learning_rate": 1.0139515580323973e-06, "loss": 0.9229, "step": 37714 }, { "epoch": 0.71, "learning_rate": 1.0138287136065688e-06, "loss": 0.8744, "step": 37715 }, { "epoch": 0.71, "learning_rate": 1.0137058747300605e-06, "loss": 1.1273, "step": 37716 }, { "epoch": 0.71, "learning_rate": 1.013583041403328e-06, "loss": 0.9063, "step": 37717 }, { "epoch": 0.71, "learning_rate": 1.0134602136268307e-06, "loss": 1.0224, "step": 37718 }, { "epoch": 0.71, "learning_rate": 1.0133373914010274e-06, "loss": 0.9898, "step": 37719 }, { "epoch": 0.71, "learning_rate": 1.013214574726377e-06, "loss": 1.1548, "step": 37720 }, { "epoch": 0.71, "learning_rate": 1.0130917636033375e-06, "loss": 0.9108, "step": 37721 }, { "epoch": 0.71, "learning_rate": 1.0129689580323676e-06, "loss": 0.8007, "step": 37722 }, { "epoch": 0.71, "learning_rate": 1.0128461580139273e-06, "loss": 0.7581, "step": 37723 }, { "epoch": 0.71, "learning_rate": 1.0127233635484718e-06, "loss": 1.1106, "step": 37724 }, { "epoch": 0.71, "learning_rate": 1.0126005746364638e-06, "loss": 0.9343, "step": 37725 }, { "epoch": 0.71, "learning_rate": 1.0124777912783582e-06, "loss": 0.8578, "step": 37726 }, { "epoch": 0.71, "learning_rate": 1.0123550134746152e-06, "loss": 0.8873, "step": 37727 }, { "epoch": 0.71, "learning_rate": 1.012232241225693e-06, "loss": 0.9901, "step": 37728 }, { "epoch": 0.71, "learning_rate": 1.01210947453205e-06, "loss": 0.9521, "step": 37729 }, { "epoch": 0.71, "learning_rate": 1.0119867133941443e-06, "loss": 0.9573, "step": 37730 }, { "epoch": 0.71, "learning_rate": 1.011863957812435e-06, "loss": 0.933, "step": 37731 }, { "epoch": 0.71, "learning_rate": 1.011741207787381e-06, "loss": 1.0498, "step": 37732 }, { "epoch": 0.71, "learning_rate": 1.0116184633194377e-06, "loss": 0.9868, "step": 37733 }, { "epoch": 0.71, "learning_rate": 1.011495724409067e-06, "loss": 0.8497, "step": 37734 }, { "epoch": 0.71, "learning_rate": 1.0113729910567253e-06, "loss": 0.8936, "step": 37735 }, { "epoch": 0.71, "learning_rate": 1.0112502632628697e-06, "loss": 0.8636, "step": 37736 }, { "epoch": 0.71, "learning_rate": 1.0111275410279623e-06, "loss": 1.024, "step": 37737 }, { "epoch": 0.71, "learning_rate": 1.0110048243524575e-06, "loss": 1.0992, "step": 37738 }, { "epoch": 0.71, "learning_rate": 1.0108821132368155e-06, "loss": 0.8866, "step": 37739 }, { "epoch": 0.71, "learning_rate": 1.0107594076814939e-06, "loss": 0.8453, "step": 37740 }, { "epoch": 0.71, "learning_rate": 1.010636707686951e-06, "loss": 0.7506, "step": 37741 }, { "epoch": 0.71, "learning_rate": 1.010514013253645e-06, "loss": 0.9564, "step": 37742 }, { "epoch": 0.71, "learning_rate": 1.010391324382034e-06, "loss": 0.8135, "step": 37743 }, { "epoch": 0.71, "learning_rate": 1.0102686410725771e-06, "loss": 1.1522, "step": 37744 }, { "epoch": 0.71, "learning_rate": 1.0101459633257295e-06, "loss": 0.8298, "step": 37745 }, { "epoch": 0.71, "learning_rate": 1.010023291141953e-06, "loss": 0.7354, "step": 37746 }, { "epoch": 0.71, "learning_rate": 1.009900624521703e-06, "loss": 0.8273, "step": 37747 }, { "epoch": 0.71, "learning_rate": 1.0097779634654383e-06, "loss": 0.5929, "step": 37748 }, { "epoch": 0.71, "learning_rate": 1.0096553079736172e-06, "loss": 0.9003, "step": 37749 }, { "epoch": 0.71, "learning_rate": 1.0095326580466975e-06, "loss": 1.2959, "step": 37750 }, { "epoch": 0.71, "learning_rate": 1.0094100136851368e-06, "loss": 0.8279, "step": 37751 }, { "epoch": 0.71, "learning_rate": 1.0092873748893937e-06, "loss": 0.642, "step": 37752 }, { "epoch": 0.71, "learning_rate": 1.0091647416599265e-06, "loss": 0.868, "step": 37753 }, { "epoch": 0.71, "learning_rate": 1.009042113997191e-06, "loss": 0.7531, "step": 37754 }, { "epoch": 0.71, "learning_rate": 1.0089194919016478e-06, "loss": 0.9268, "step": 37755 }, { "epoch": 0.71, "learning_rate": 1.008796875373753e-06, "loss": 0.9679, "step": 37756 }, { "epoch": 0.71, "learning_rate": 1.008674264413964e-06, "loss": 0.9877, "step": 37757 }, { "epoch": 0.71, "learning_rate": 1.0085516590227414e-06, "loss": 0.9534, "step": 37758 }, { "epoch": 0.71, "learning_rate": 1.0084290592005401e-06, "loss": 0.6273, "step": 37759 }, { "epoch": 0.71, "learning_rate": 1.0083064649478192e-06, "loss": 0.9872, "step": 37760 }, { "epoch": 0.71, "learning_rate": 1.008183876265036e-06, "loss": 1.0748, "step": 37761 }, { "epoch": 0.71, "learning_rate": 1.0080612931526487e-06, "loss": 0.8676, "step": 37762 }, { "epoch": 0.71, "learning_rate": 1.0079387156111144e-06, "loss": 1.1612, "step": 37763 }, { "epoch": 0.71, "learning_rate": 1.0078161436408915e-06, "loss": 0.7796, "step": 37764 }, { "epoch": 0.71, "learning_rate": 1.0076935772424384e-06, "loss": 0.8648, "step": 37765 }, { "epoch": 0.71, "learning_rate": 1.0075710164162098e-06, "loss": 0.8177, "step": 37766 }, { "epoch": 0.71, "learning_rate": 1.0074484611626668e-06, "loss": 0.8065, "step": 37767 }, { "epoch": 0.71, "learning_rate": 1.0073259114822647e-06, "loss": 0.9747, "step": 37768 }, { "epoch": 0.71, "learning_rate": 1.0072033673754623e-06, "loss": 1.1228, "step": 37769 }, { "epoch": 0.71, "learning_rate": 1.0070808288427162e-06, "loss": 0.8696, "step": 37770 }, { "epoch": 0.71, "learning_rate": 1.0069582958844848e-06, "loss": 0.8667, "step": 37771 }, { "epoch": 0.71, "learning_rate": 1.0068357685012254e-06, "loss": 0.8943, "step": 37772 }, { "epoch": 0.71, "learning_rate": 1.0067132466933952e-06, "loss": 1.0355, "step": 37773 }, { "epoch": 0.71, "learning_rate": 1.0065907304614528e-06, "loss": 0.9677, "step": 37774 }, { "epoch": 0.71, "learning_rate": 1.0064682198058534e-06, "loss": 0.9466, "step": 37775 }, { "epoch": 0.71, "learning_rate": 1.0063457147270575e-06, "loss": 0.9116, "step": 37776 }, { "epoch": 0.71, "learning_rate": 1.00622321522552e-06, "loss": 0.8115, "step": 37777 }, { "epoch": 0.71, "learning_rate": 1.0061007213016983e-06, "loss": 0.9215, "step": 37778 }, { "epoch": 0.71, "learning_rate": 1.0059782329560524e-06, "loss": 0.8335, "step": 37779 }, { "epoch": 0.71, "learning_rate": 1.0058557501890374e-06, "loss": 0.8091, "step": 37780 }, { "epoch": 0.71, "learning_rate": 1.0057332730011107e-06, "loss": 0.76, "step": 37781 }, { "epoch": 0.71, "learning_rate": 1.0056108013927305e-06, "loss": 0.9665, "step": 37782 }, { "epoch": 0.71, "learning_rate": 1.0054883353643539e-06, "loss": 0.89, "step": 37783 }, { "epoch": 0.71, "learning_rate": 1.0053658749164378e-06, "loss": 1.0594, "step": 37784 }, { "epoch": 0.71, "learning_rate": 1.0052434200494395e-06, "loss": 0.9504, "step": 37785 }, { "epoch": 0.71, "learning_rate": 1.0051209707638176e-06, "loss": 0.8491, "step": 37786 }, { "epoch": 0.71, "learning_rate": 1.0049985270600262e-06, "loss": 1.0347, "step": 37787 }, { "epoch": 0.71, "learning_rate": 1.0048760889385265e-06, "loss": 0.9293, "step": 37788 }, { "epoch": 0.71, "learning_rate": 1.0047536563997726e-06, "loss": 0.9431, "step": 37789 }, { "epoch": 0.71, "learning_rate": 1.0046312294442226e-06, "loss": 0.8478, "step": 37790 }, { "epoch": 0.71, "learning_rate": 1.004508808072334e-06, "loss": 0.8132, "step": 37791 }, { "epoch": 0.71, "learning_rate": 1.0043863922845635e-06, "loss": 0.7065, "step": 37792 }, { "epoch": 0.71, "learning_rate": 1.0042639820813686e-06, "loss": 0.8586, "step": 37793 }, { "epoch": 0.71, "learning_rate": 1.0041415774632057e-06, "loss": 1.0109, "step": 37794 }, { "epoch": 0.71, "learning_rate": 1.0040191784305334e-06, "loss": 0.8822, "step": 37795 }, { "epoch": 0.71, "learning_rate": 1.0038967849838057e-06, "loss": 0.8832, "step": 37796 }, { "epoch": 0.71, "learning_rate": 1.0037743971234834e-06, "loss": 0.8398, "step": 37797 }, { "epoch": 0.71, "learning_rate": 1.0036520148500209e-06, "loss": 0.8098, "step": 37798 }, { "epoch": 0.71, "learning_rate": 1.0035296381638748e-06, "loss": 0.9566, "step": 37799 }, { "epoch": 0.71, "learning_rate": 1.003407267065505e-06, "loss": 1.145, "step": 37800 }, { "epoch": 0.71, "learning_rate": 1.0032849015553658e-06, "loss": 0.9318, "step": 37801 }, { "epoch": 0.71, "learning_rate": 1.0031625416339147e-06, "loss": 0.8413, "step": 37802 }, { "epoch": 0.71, "learning_rate": 1.0030401873016087e-06, "loss": 0.8423, "step": 37803 }, { "epoch": 0.71, "learning_rate": 1.002917838558905e-06, "loss": 0.741, "step": 37804 }, { "epoch": 0.71, "learning_rate": 1.0027954954062601e-06, "loss": 0.8065, "step": 37805 }, { "epoch": 0.71, "learning_rate": 1.0026731578441309e-06, "loss": 1.252, "step": 37806 }, { "epoch": 0.71, "learning_rate": 1.0025508258729752e-06, "loss": 1.1794, "step": 37807 }, { "epoch": 0.71, "learning_rate": 1.002428499493247e-06, "loss": 1.0346, "step": 37808 }, { "epoch": 0.71, "learning_rate": 1.0023061787054064e-06, "loss": 0.7545, "step": 37809 }, { "epoch": 0.71, "learning_rate": 1.0021838635099078e-06, "loss": 0.8861, "step": 37810 }, { "epoch": 0.71, "learning_rate": 1.002061553907209e-06, "loss": 0.6762, "step": 37811 }, { "epoch": 0.71, "learning_rate": 1.0019392498977663e-06, "loss": 0.9143, "step": 37812 }, { "epoch": 0.71, "learning_rate": 1.0018169514820363e-06, "loss": 1.0482, "step": 37813 }, { "epoch": 0.71, "learning_rate": 1.0016946586604762e-06, "loss": 0.8809, "step": 37814 }, { "epoch": 0.71, "learning_rate": 1.001572371433542e-06, "loss": 1.0186, "step": 37815 }, { "epoch": 0.71, "learning_rate": 1.0014500898016919e-06, "loss": 0.9423, "step": 37816 }, { "epoch": 0.71, "learning_rate": 1.0013278137653792e-06, "loss": 0.915, "step": 37817 }, { "epoch": 0.71, "learning_rate": 1.0012055433250643e-06, "loss": 0.7449, "step": 37818 }, { "epoch": 0.71, "learning_rate": 1.0010832784812008e-06, "loss": 0.9124, "step": 37819 }, { "epoch": 0.71, "learning_rate": 1.0009610192342459e-06, "loss": 0.8465, "step": 37820 }, { "epoch": 0.71, "learning_rate": 1.000838765584658e-06, "loss": 0.8629, "step": 37821 }, { "epoch": 0.71, "learning_rate": 1.0007165175328918e-06, "loss": 0.9549, "step": 37822 }, { "epoch": 0.71, "learning_rate": 1.0005942750794037e-06, "loss": 0.853, "step": 37823 }, { "epoch": 0.71, "learning_rate": 1.0004720382246507e-06, "loss": 0.8932, "step": 37824 }, { "epoch": 0.71, "learning_rate": 1.0003498069690891e-06, "loss": 1.1472, "step": 37825 }, { "epoch": 0.71, "learning_rate": 1.0002275813131754e-06, "loss": 1.006, "step": 37826 }, { "epoch": 0.71, "learning_rate": 1.0001053612573661e-06, "loss": 0.8198, "step": 37827 }, { "epoch": 0.71, "learning_rate": 9.99983146802118e-07, "loss": 1.0031, "step": 37828 }, { "epoch": 0.71, "learning_rate": 9.998609379478852e-07, "loss": 0.8201, "step": 37829 }, { "epoch": 0.71, "learning_rate": 9.997387346951274e-07, "loss": 0.8348, "step": 37830 }, { "epoch": 0.71, "learning_rate": 9.996165370442984e-07, "loss": 0.9948, "step": 37831 }, { "epoch": 0.71, "learning_rate": 9.994943449958549e-07, "loss": 0.9417, "step": 37832 }, { "epoch": 0.71, "learning_rate": 9.99372158550254e-07, "loss": 0.9468, "step": 37833 }, { "epoch": 0.71, "learning_rate": 9.992499777079512e-07, "loss": 1.0292, "step": 37834 }, { "epoch": 0.71, "learning_rate": 9.99127802469403e-07, "loss": 0.7694, "step": 37835 }, { "epoch": 0.71, "learning_rate": 9.990056328350656e-07, "loss": 0.9742, "step": 37836 }, { "epoch": 0.71, "learning_rate": 9.988834688053958e-07, "loss": 1.2415, "step": 37837 }, { "epoch": 0.71, "learning_rate": 9.987613103808475e-07, "loss": 0.8554, "step": 37838 }, { "epoch": 0.71, "learning_rate": 9.986391575618803e-07, "loss": 0.7406, "step": 37839 }, { "epoch": 0.71, "learning_rate": 9.985170103489474e-07, "loss": 0.8558, "step": 37840 }, { "epoch": 0.71, "learning_rate": 9.983948687425051e-07, "loss": 1.063, "step": 37841 }, { "epoch": 0.71, "learning_rate": 9.982727327430122e-07, "loss": 0.8597, "step": 37842 }, { "epoch": 0.71, "learning_rate": 9.98150602350922e-07, "loss": 1.1827, "step": 37843 }, { "epoch": 0.71, "learning_rate": 9.980284775666912e-07, "loss": 0.8352, "step": 37844 }, { "epoch": 0.71, "learning_rate": 9.97906358390776e-07, "loss": 0.916, "step": 37845 }, { "epoch": 0.71, "learning_rate": 9.977842448236328e-07, "loss": 1.0258, "step": 37846 }, { "epoch": 0.71, "learning_rate": 9.976621368657169e-07, "loss": 1.1409, "step": 37847 }, { "epoch": 0.71, "learning_rate": 9.975400345174846e-07, "loss": 0.6868, "step": 37848 }, { "epoch": 0.71, "learning_rate": 9.974179377793924e-07, "loss": 0.9825, "step": 37849 }, { "epoch": 0.71, "learning_rate": 9.972958466518939e-07, "loss": 1.049, "step": 37850 }, { "epoch": 0.71, "learning_rate": 9.971737611354484e-07, "loss": 0.7734, "step": 37851 }, { "epoch": 0.71, "learning_rate": 9.970516812305091e-07, "loss": 0.7958, "step": 37852 }, { "epoch": 0.71, "learning_rate": 9.96929606937533e-07, "loss": 1.053, "step": 37853 }, { "epoch": 0.71, "learning_rate": 9.968075382569756e-07, "loss": 0.8688, "step": 37854 }, { "epoch": 0.71, "learning_rate": 9.966854751892924e-07, "loss": 0.8737, "step": 37855 }, { "epoch": 0.71, "learning_rate": 9.965634177349399e-07, "loss": 1.4174, "step": 37856 }, { "epoch": 0.71, "learning_rate": 9.964413658943733e-07, "loss": 1.1826, "step": 37857 }, { "epoch": 0.71, "learning_rate": 9.963193196680496e-07, "loss": 0.8877, "step": 37858 }, { "epoch": 0.71, "learning_rate": 9.961972790564214e-07, "loss": 0.7865, "step": 37859 }, { "epoch": 0.71, "learning_rate": 9.960752440599486e-07, "loss": 0.8828, "step": 37860 }, { "epoch": 0.71, "learning_rate": 9.959532146790834e-07, "loss": 0.8468, "step": 37861 }, { "epoch": 0.71, "learning_rate": 9.958311909142824e-07, "loss": 0.8635, "step": 37862 }, { "epoch": 0.71, "learning_rate": 9.95709172766003e-07, "loss": 1.0829, "step": 37863 }, { "epoch": 0.71, "learning_rate": 9.955871602346987e-07, "loss": 0.9185, "step": 37864 }, { "epoch": 0.71, "learning_rate": 9.954651533208257e-07, "loss": 0.7558, "step": 37865 }, { "epoch": 0.71, "learning_rate": 9.9534315202484e-07, "loss": 0.8317, "step": 37866 }, { "epoch": 0.71, "learning_rate": 9.952211563471964e-07, "loss": 0.9161, "step": 37867 }, { "epoch": 0.71, "learning_rate": 9.950991662883511e-07, "loss": 1.0466, "step": 37868 }, { "epoch": 0.71, "learning_rate": 9.949771818487593e-07, "loss": 1.0069, "step": 37869 }, { "epoch": 0.71, "learning_rate": 9.948552030288777e-07, "loss": 1.0988, "step": 37870 }, { "epoch": 0.71, "learning_rate": 9.947332298291584e-07, "loss": 0.9207, "step": 37871 }, { "epoch": 0.71, "learning_rate": 9.946112622500612e-07, "loss": 0.726, "step": 37872 }, { "epoch": 0.71, "learning_rate": 9.944893002920382e-07, "loss": 0.7792, "step": 37873 }, { "epoch": 0.71, "learning_rate": 9.943673439555463e-07, "loss": 0.9418, "step": 37874 }, { "epoch": 0.71, "learning_rate": 9.942453932410406e-07, "loss": 0.8728, "step": 37875 }, { "epoch": 0.71, "learning_rate": 9.941234481489762e-07, "loss": 0.835, "step": 37876 }, { "epoch": 0.71, "learning_rate": 9.940015086798088e-07, "loss": 0.9129, "step": 37877 }, { "epoch": 0.71, "learning_rate": 9.938795748339935e-07, "loss": 0.9005, "step": 37878 }, { "epoch": 0.71, "learning_rate": 9.937576466119866e-07, "loss": 0.898, "step": 37879 }, { "epoch": 0.71, "learning_rate": 9.936357240142408e-07, "loss": 1.033, "step": 37880 }, { "epoch": 0.71, "learning_rate": 9.935138070412148e-07, "loss": 0.8332, "step": 37881 }, { "epoch": 0.71, "learning_rate": 9.93391895693361e-07, "loss": 0.9808, "step": 37882 }, { "epoch": 0.71, "learning_rate": 9.932699899711349e-07, "loss": 0.715, "step": 37883 }, { "epoch": 0.71, "learning_rate": 9.93148089874994e-07, "loss": 0.8721, "step": 37884 }, { "epoch": 0.71, "learning_rate": 9.930261954053914e-07, "loss": 0.7457, "step": 37885 }, { "epoch": 0.71, "learning_rate": 9.929043065627825e-07, "loss": 1.1163, "step": 37886 }, { "epoch": 0.71, "learning_rate": 9.927824233476229e-07, "loss": 1.1791, "step": 37887 }, { "epoch": 0.71, "learning_rate": 9.926605457603675e-07, "loss": 0.9569, "step": 37888 }, { "epoch": 0.71, "learning_rate": 9.925386738014715e-07, "loss": 0.7538, "step": 37889 }, { "epoch": 0.71, "learning_rate": 9.924168074713894e-07, "loss": 0.811, "step": 37890 }, { "epoch": 0.71, "learning_rate": 9.922949467705782e-07, "loss": 0.7541, "step": 37891 }, { "epoch": 0.71, "learning_rate": 9.921730916994892e-07, "loss": 0.856, "step": 37892 }, { "epoch": 0.71, "learning_rate": 9.920512422585817e-07, "loss": 0.8224, "step": 37893 }, { "epoch": 0.71, "learning_rate": 9.919293984483078e-07, "loss": 0.9427, "step": 37894 }, { "epoch": 0.71, "learning_rate": 9.91807560269123e-07, "loss": 1.0396, "step": 37895 }, { "epoch": 0.71, "learning_rate": 9.916857277214827e-07, "loss": 0.9018, "step": 37896 }, { "epoch": 0.71, "learning_rate": 9.915639008058416e-07, "loss": 0.762, "step": 37897 }, { "epoch": 0.72, "learning_rate": 9.914420795226545e-07, "loss": 0.6978, "step": 37898 }, { "epoch": 0.72, "learning_rate": 9.913202638723769e-07, "loss": 0.8963, "step": 37899 }, { "epoch": 0.72, "learning_rate": 9.911984538554636e-07, "loss": 0.8207, "step": 37900 }, { "epoch": 0.72, "learning_rate": 9.910766494723676e-07, "loss": 0.9645, "step": 37901 }, { "epoch": 0.72, "learning_rate": 9.909548507235464e-07, "loss": 0.9543, "step": 37902 }, { "epoch": 0.72, "learning_rate": 9.90833057609453e-07, "loss": 1.0431, "step": 37903 }, { "epoch": 0.72, "learning_rate": 9.907112701305419e-07, "loss": 0.9355, "step": 37904 }, { "epoch": 0.72, "learning_rate": 9.905894882872702e-07, "loss": 0.9191, "step": 37905 }, { "epoch": 0.72, "learning_rate": 9.904677120800902e-07, "loss": 1.2542, "step": 37906 }, { "epoch": 0.72, "learning_rate": 9.903459415094575e-07, "loss": 1.0069, "step": 37907 }, { "epoch": 0.72, "learning_rate": 9.902241765758266e-07, "loss": 0.9358, "step": 37908 }, { "epoch": 0.72, "learning_rate": 9.901024172796524e-07, "loss": 0.925, "step": 37909 }, { "epoch": 0.72, "learning_rate": 9.899806636213898e-07, "loss": 0.876, "step": 37910 }, { "epoch": 0.72, "learning_rate": 9.89858915601493e-07, "loss": 0.7675, "step": 37911 }, { "epoch": 0.72, "learning_rate": 9.897371732204173e-07, "loss": 0.8954, "step": 37912 }, { "epoch": 0.72, "learning_rate": 9.89615436478615e-07, "loss": 0.9952, "step": 37913 }, { "epoch": 0.72, "learning_rate": 9.894937053765444e-07, "loss": 0.8515, "step": 37914 }, { "epoch": 0.72, "learning_rate": 9.89371979914657e-07, "loss": 0.7834, "step": 37915 }, { "epoch": 0.72, "learning_rate": 9.892502600934082e-07, "loss": 0.8787, "step": 37916 }, { "epoch": 0.72, "learning_rate": 9.891285459132526e-07, "loss": 0.6463, "step": 37917 }, { "epoch": 0.72, "learning_rate": 9.890068373746447e-07, "loss": 0.7511, "step": 37918 }, { "epoch": 0.72, "learning_rate": 9.88885134478039e-07, "loss": 1.0809, "step": 37919 }, { "epoch": 0.72, "learning_rate": 9.887634372238899e-07, "loss": 0.7575, "step": 37920 }, { "epoch": 0.72, "learning_rate": 9.886417456126527e-07, "loss": 0.8285, "step": 37921 }, { "epoch": 0.72, "learning_rate": 9.885200596447788e-07, "loss": 0.8621, "step": 37922 }, { "epoch": 0.72, "learning_rate": 9.88398379320727e-07, "loss": 0.7612, "step": 37923 }, { "epoch": 0.72, "learning_rate": 9.882767046409478e-07, "loss": 1.0399, "step": 37924 }, { "epoch": 0.72, "learning_rate": 9.881550356058964e-07, "loss": 0.9184, "step": 37925 }, { "epoch": 0.72, "learning_rate": 9.880333722160297e-07, "loss": 0.9475, "step": 37926 }, { "epoch": 0.72, "learning_rate": 9.879117144717989e-07, "loss": 0.8835, "step": 37927 }, { "epoch": 0.72, "learning_rate": 9.877900623736595e-07, "loss": 0.8407, "step": 37928 }, { "epoch": 0.72, "learning_rate": 9.876684159220656e-07, "loss": 0.791, "step": 37929 }, { "epoch": 0.72, "learning_rate": 9.875467751174716e-07, "loss": 0.9118, "step": 37930 }, { "epoch": 0.72, "learning_rate": 9.874251399603324e-07, "loss": 1.1039, "step": 37931 }, { "epoch": 0.72, "learning_rate": 9.873035104510996e-07, "loss": 0.846, "step": 37932 }, { "epoch": 0.72, "learning_rate": 9.871818865902305e-07, "loss": 1.1392, "step": 37933 }, { "epoch": 0.72, "learning_rate": 9.870602683781775e-07, "loss": 0.8902, "step": 37934 }, { "epoch": 0.72, "learning_rate": 9.869386558153947e-07, "loss": 0.7957, "step": 37935 }, { "epoch": 0.72, "learning_rate": 9.868170489023368e-07, "loss": 1.0234, "step": 37936 }, { "epoch": 0.72, "learning_rate": 9.866954476394575e-07, "loss": 1.2191, "step": 37937 }, { "epoch": 0.72, "learning_rate": 9.865738520272112e-07, "loss": 0.9025, "step": 37938 }, { "epoch": 0.72, "learning_rate": 9.864522620660517e-07, "loss": 0.8643, "step": 37939 }, { "epoch": 0.72, "learning_rate": 9.863306777564334e-07, "loss": 0.9647, "step": 37940 }, { "epoch": 0.72, "learning_rate": 9.862090990988088e-07, "loss": 0.9788, "step": 37941 }, { "epoch": 0.72, "learning_rate": 9.860875260936344e-07, "loss": 0.8741, "step": 37942 }, { "epoch": 0.72, "learning_rate": 9.859659587413623e-07, "loss": 1.0405, "step": 37943 }, { "epoch": 0.72, "learning_rate": 9.858443970424467e-07, "loss": 0.9301, "step": 37944 }, { "epoch": 0.72, "learning_rate": 9.857228409973415e-07, "loss": 0.9215, "step": 37945 }, { "epoch": 0.72, "learning_rate": 9.85601290606501e-07, "loss": 0.8964, "step": 37946 }, { "epoch": 0.72, "learning_rate": 9.85479745870379e-07, "loss": 0.7249, "step": 37947 }, { "epoch": 0.72, "learning_rate": 9.853582067894287e-07, "loss": 0.7589, "step": 37948 }, { "epoch": 0.72, "learning_rate": 9.852366733641056e-07, "loss": 1.0521, "step": 37949 }, { "epoch": 0.72, "learning_rate": 9.851151455948605e-07, "loss": 0.9932, "step": 37950 }, { "epoch": 0.72, "learning_rate": 9.849936234821497e-07, "loss": 1.0848, "step": 37951 }, { "epoch": 0.72, "learning_rate": 9.848721070264275e-07, "loss": 0.7765, "step": 37952 }, { "epoch": 0.72, "learning_rate": 9.847505962281445e-07, "loss": 0.8694, "step": 37953 }, { "epoch": 0.72, "learning_rate": 9.84629091087758e-07, "loss": 0.8391, "step": 37954 }, { "epoch": 0.72, "learning_rate": 9.845075916057192e-07, "loss": 1.053, "step": 37955 }, { "epoch": 0.72, "learning_rate": 9.843860977824826e-07, "loss": 1.1362, "step": 37956 }, { "epoch": 0.72, "learning_rate": 9.842646096185016e-07, "loss": 0.7711, "step": 37957 }, { "epoch": 0.72, "learning_rate": 9.841431271142305e-07, "loss": 0.8892, "step": 37958 }, { "epoch": 0.72, "learning_rate": 9.840216502701222e-07, "loss": 0.9531, "step": 37959 }, { "epoch": 0.72, "learning_rate": 9.839001790866306e-07, "loss": 0.7463, "step": 37960 }, { "epoch": 0.72, "learning_rate": 9.8377871356421e-07, "loss": 0.9272, "step": 37961 }, { "epoch": 0.72, "learning_rate": 9.836572537033118e-07, "loss": 1.1407, "step": 37962 }, { "epoch": 0.72, "learning_rate": 9.835357995043924e-07, "loss": 0.9185, "step": 37963 }, { "epoch": 0.72, "learning_rate": 9.83414350967903e-07, "loss": 0.8705, "step": 37964 }, { "epoch": 0.72, "learning_rate": 9.83292908094298e-07, "loss": 0.7321, "step": 37965 }, { "epoch": 0.72, "learning_rate": 9.831714708840307e-07, "loss": 0.6167, "step": 37966 }, { "epoch": 0.72, "learning_rate": 9.830500393375548e-07, "loss": 0.6328, "step": 37967 }, { "epoch": 0.72, "learning_rate": 9.82928613455323e-07, "loss": 0.9027, "step": 37968 }, { "epoch": 0.72, "learning_rate": 9.8280719323779e-07, "loss": 1.1005, "step": 37969 }, { "epoch": 0.72, "learning_rate": 9.82685778685409e-07, "loss": 0.9835, "step": 37970 }, { "epoch": 0.72, "learning_rate": 9.825643697986309e-07, "loss": 0.8703, "step": 37971 }, { "epoch": 0.72, "learning_rate": 9.824429665779116e-07, "loss": 0.9678, "step": 37972 }, { "epoch": 0.72, "learning_rate": 9.823215690237052e-07, "loss": 0.7504, "step": 37973 }, { "epoch": 0.72, "learning_rate": 9.822001771364612e-07, "loss": 0.8362, "step": 37974 }, { "epoch": 0.72, "learning_rate": 9.82078790916637e-07, "loss": 0.8818, "step": 37975 }, { "epoch": 0.72, "learning_rate": 9.819574103646836e-07, "loss": 0.9673, "step": 37976 }, { "epoch": 0.72, "learning_rate": 9.818360354810544e-07, "loss": 0.7905, "step": 37977 }, { "epoch": 0.72, "learning_rate": 9.81714666266203e-07, "loss": 0.8443, "step": 37978 }, { "epoch": 0.72, "learning_rate": 9.815933027205823e-07, "loss": 0.8112, "step": 37979 }, { "epoch": 0.72, "learning_rate": 9.814719448446457e-07, "loss": 0.8056, "step": 37980 }, { "epoch": 0.72, "learning_rate": 9.813505926388466e-07, "loss": 0.9886, "step": 37981 }, { "epoch": 0.72, "learning_rate": 9.812292461036385e-07, "loss": 0.9672, "step": 37982 }, { "epoch": 0.72, "learning_rate": 9.81107905239472e-07, "loss": 0.789, "step": 37983 }, { "epoch": 0.72, "learning_rate": 9.809865700468039e-07, "loss": 0.879, "step": 37984 }, { "epoch": 0.72, "learning_rate": 9.808652405260842e-07, "loss": 0.879, "step": 37985 }, { "epoch": 0.72, "learning_rate": 9.807439166777677e-07, "loss": 0.946, "step": 37986 }, { "epoch": 0.72, "learning_rate": 9.806225985023062e-07, "loss": 0.9698, "step": 37987 }, { "epoch": 0.72, "learning_rate": 9.805012860001537e-07, "loss": 0.8784, "step": 37988 }, { "epoch": 0.72, "learning_rate": 9.803799791717627e-07, "loss": 0.8241, "step": 37989 }, { "epoch": 0.72, "learning_rate": 9.802586780175863e-07, "loss": 0.7903, "step": 37990 }, { "epoch": 0.72, "learning_rate": 9.801373825380783e-07, "loss": 0.7679, "step": 37991 }, { "epoch": 0.72, "learning_rate": 9.800160927336888e-07, "loss": 0.8549, "step": 37992 }, { "epoch": 0.72, "learning_rate": 9.798948086048738e-07, "loss": 0.909, "step": 37993 }, { "epoch": 0.72, "learning_rate": 9.797735301520854e-07, "loss": 1.049, "step": 37994 }, { "epoch": 0.72, "learning_rate": 9.796522573757748e-07, "loss": 0.881, "step": 37995 }, { "epoch": 0.72, "learning_rate": 9.795309902763975e-07, "loss": 0.8017, "step": 37996 }, { "epoch": 0.72, "learning_rate": 9.794097288544039e-07, "loss": 0.9767, "step": 37997 }, { "epoch": 0.72, "learning_rate": 9.792884731102478e-07, "loss": 0.7712, "step": 37998 }, { "epoch": 0.72, "learning_rate": 9.79167223044382e-07, "loss": 0.7064, "step": 37999 }, { "epoch": 0.72, "learning_rate": 9.790459786572592e-07, "loss": 0.9686, "step": 38000 }, { "epoch": 0.72, "learning_rate": 9.78924739949332e-07, "loss": 0.6617, "step": 38001 }, { "epoch": 0.72, "learning_rate": 9.788035069210533e-07, "loss": 0.8914, "step": 38002 }, { "epoch": 0.72, "learning_rate": 9.786822795728766e-07, "loss": 0.7847, "step": 38003 }, { "epoch": 0.72, "learning_rate": 9.785610579052516e-07, "loss": 0.7277, "step": 38004 }, { "epoch": 0.72, "learning_rate": 9.784398419186348e-07, "loss": 0.8316, "step": 38005 }, { "epoch": 0.72, "learning_rate": 9.783186316134763e-07, "loss": 1.0073, "step": 38006 }, { "epoch": 0.72, "learning_rate": 9.781974269902292e-07, "loss": 0.7194, "step": 38007 }, { "epoch": 0.72, "learning_rate": 9.780762280493462e-07, "loss": 0.8058, "step": 38008 }, { "epoch": 0.72, "learning_rate": 9.779550347912801e-07, "loss": 0.8028, "step": 38009 }, { "epoch": 0.72, "learning_rate": 9.778338472164828e-07, "loss": 0.7928, "step": 38010 }, { "epoch": 0.72, "learning_rate": 9.777126653254077e-07, "loss": 0.8693, "step": 38011 }, { "epoch": 0.72, "learning_rate": 9.775914891185076e-07, "loss": 1.0933, "step": 38012 }, { "epoch": 0.72, "learning_rate": 9.774703185962323e-07, "loss": 0.9644, "step": 38013 }, { "epoch": 0.72, "learning_rate": 9.77349153759037e-07, "loss": 0.815, "step": 38014 }, { "epoch": 0.72, "learning_rate": 9.772279946073743e-07, "loss": 0.9191, "step": 38015 }, { "epoch": 0.72, "learning_rate": 9.771068411416939e-07, "loss": 0.7312, "step": 38016 }, { "epoch": 0.72, "learning_rate": 9.769856933624515e-07, "loss": 0.7684, "step": 38017 }, { "epoch": 0.72, "learning_rate": 9.76864551270097e-07, "loss": 0.9932, "step": 38018 }, { "epoch": 0.72, "learning_rate": 9.767434148650835e-07, "loss": 1.0434, "step": 38019 }, { "epoch": 0.72, "learning_rate": 9.766222841478634e-07, "loss": 0.7531, "step": 38020 }, { "epoch": 0.72, "learning_rate": 9.76501159118889e-07, "loss": 0.8132, "step": 38021 }, { "epoch": 0.72, "learning_rate": 9.763800397786124e-07, "loss": 0.9073, "step": 38022 }, { "epoch": 0.72, "learning_rate": 9.762589261274862e-07, "loss": 0.6649, "step": 38023 }, { "epoch": 0.72, "learning_rate": 9.761378181659634e-07, "loss": 1.1179, "step": 38024 }, { "epoch": 0.72, "learning_rate": 9.760167158944935e-07, "loss": 1.0783, "step": 38025 }, { "epoch": 0.72, "learning_rate": 9.758956193135321e-07, "loss": 0.8927, "step": 38026 }, { "epoch": 0.72, "learning_rate": 9.75774528423529e-07, "loss": 0.718, "step": 38027 }, { "epoch": 0.72, "learning_rate": 9.756534432249368e-07, "loss": 0.6185, "step": 38028 }, { "epoch": 0.72, "learning_rate": 9.755323637182081e-07, "loss": 0.8738, "step": 38029 }, { "epoch": 0.72, "learning_rate": 9.75411289903795e-07, "loss": 0.9074, "step": 38030 }, { "epoch": 0.72, "learning_rate": 9.75290221782149e-07, "loss": 1.1622, "step": 38031 }, { "epoch": 0.72, "learning_rate": 9.751691593537227e-07, "loss": 1.0842, "step": 38032 }, { "epoch": 0.72, "learning_rate": 9.750481026189689e-07, "loss": 0.9358, "step": 38033 }, { "epoch": 0.72, "learning_rate": 9.74927051578337e-07, "loss": 0.8498, "step": 38034 }, { "epoch": 0.72, "learning_rate": 9.748060062322814e-07, "loss": 0.9057, "step": 38035 }, { "epoch": 0.72, "learning_rate": 9.746849665812546e-07, "loss": 0.7336, "step": 38036 }, { "epoch": 0.72, "learning_rate": 9.745639326257055e-07, "loss": 0.8806, "step": 38037 }, { "epoch": 0.72, "learning_rate": 9.744429043660897e-07, "loss": 0.7867, "step": 38038 }, { "epoch": 0.72, "learning_rate": 9.743218818028564e-07, "loss": 1.0443, "step": 38039 }, { "epoch": 0.72, "learning_rate": 9.742008649364583e-07, "loss": 0.964, "step": 38040 }, { "epoch": 0.72, "learning_rate": 9.740798537673477e-07, "loss": 1.0048, "step": 38041 }, { "epoch": 0.72, "learning_rate": 9.739588482959759e-07, "loss": 0.7885, "step": 38042 }, { "epoch": 0.72, "learning_rate": 9.73837848522795e-07, "loss": 0.7737, "step": 38043 }, { "epoch": 0.72, "learning_rate": 9.737168544482566e-07, "loss": 0.9825, "step": 38044 }, { "epoch": 0.72, "learning_rate": 9.73595866072814e-07, "loss": 1.0161, "step": 38045 }, { "epoch": 0.72, "learning_rate": 9.734748833969153e-07, "loss": 0.973, "step": 38046 }, { "epoch": 0.72, "learning_rate": 9.733539064210168e-07, "loss": 0.9504, "step": 38047 }, { "epoch": 0.72, "learning_rate": 9.732329351455673e-07, "loss": 0.7537, "step": 38048 }, { "epoch": 0.72, "learning_rate": 9.731119695710187e-07, "loss": 0.8836, "step": 38049 }, { "epoch": 0.72, "learning_rate": 9.729910096978234e-07, "loss": 1.1333, "step": 38050 }, { "epoch": 0.72, "learning_rate": 9.728700555264328e-07, "loss": 0.9718, "step": 38051 }, { "epoch": 0.72, "learning_rate": 9.727491070572986e-07, "loss": 0.8035, "step": 38052 }, { "epoch": 0.72, "learning_rate": 9.726281642908725e-07, "loss": 0.9351, "step": 38053 }, { "epoch": 0.72, "learning_rate": 9.725072272276067e-07, "loss": 0.9733, "step": 38054 }, { "epoch": 0.72, "learning_rate": 9.723862958679506e-07, "loss": 1.0299, "step": 38055 }, { "epoch": 0.72, "learning_rate": 9.722653702123577e-07, "loss": 1.2368, "step": 38056 }, { "epoch": 0.72, "learning_rate": 9.721444502612803e-07, "loss": 0.8811, "step": 38057 }, { "epoch": 0.72, "learning_rate": 9.720235360151668e-07, "loss": 0.8768, "step": 38058 }, { "epoch": 0.72, "learning_rate": 9.719026274744721e-07, "loss": 0.7237, "step": 38059 }, { "epoch": 0.72, "learning_rate": 9.717817246396458e-07, "loss": 0.7327, "step": 38060 }, { "epoch": 0.72, "learning_rate": 9.716608275111395e-07, "loss": 0.9635, "step": 38061 }, { "epoch": 0.72, "learning_rate": 9.715399360894045e-07, "loss": 0.989, "step": 38062 }, { "epoch": 0.72, "learning_rate": 9.714190503748928e-07, "loss": 1.0717, "step": 38063 }, { "epoch": 0.72, "learning_rate": 9.712981703680556e-07, "loss": 0.8911, "step": 38064 }, { "epoch": 0.72, "learning_rate": 9.711772960693435e-07, "loss": 0.8471, "step": 38065 }, { "epoch": 0.72, "learning_rate": 9.7105642747921e-07, "loss": 0.8287, "step": 38066 }, { "epoch": 0.72, "learning_rate": 9.70935564598103e-07, "loss": 0.7892, "step": 38067 }, { "epoch": 0.72, "learning_rate": 9.708147074264777e-07, "loss": 0.818, "step": 38068 }, { "epoch": 0.72, "learning_rate": 9.70693855964782e-07, "loss": 1.0691, "step": 38069 }, { "epoch": 0.72, "learning_rate": 9.705730102134688e-07, "loss": 0.9138, "step": 38070 }, { "epoch": 0.72, "learning_rate": 9.704521701729893e-07, "loss": 0.7301, "step": 38071 }, { "epoch": 0.72, "learning_rate": 9.703313358437944e-07, "loss": 1.0207, "step": 38072 }, { "epoch": 0.72, "learning_rate": 9.702105072263354e-07, "loss": 0.7952, "step": 38073 }, { "epoch": 0.72, "learning_rate": 9.700896843210633e-07, "loss": 1.0171, "step": 38074 }, { "epoch": 0.72, "learning_rate": 9.699688671284304e-07, "loss": 0.9072, "step": 38075 }, { "epoch": 0.72, "learning_rate": 9.698480556488852e-07, "loss": 1.0696, "step": 38076 }, { "epoch": 0.72, "learning_rate": 9.697272498828811e-07, "loss": 0.9919, "step": 38077 }, { "epoch": 0.72, "learning_rate": 9.696064498308694e-07, "loss": 0.7759, "step": 38078 }, { "epoch": 0.72, "learning_rate": 9.694856554932988e-07, "loss": 0.8872, "step": 38079 }, { "epoch": 0.72, "learning_rate": 9.693648668706233e-07, "loss": 1.0255, "step": 38080 }, { "epoch": 0.72, "learning_rate": 9.692440839632917e-07, "loss": 1.0499, "step": 38081 }, { "epoch": 0.72, "learning_rate": 9.691233067717559e-07, "loss": 0.9606, "step": 38082 }, { "epoch": 0.72, "learning_rate": 9.690025352964666e-07, "loss": 0.8026, "step": 38083 }, { "epoch": 0.72, "learning_rate": 9.688817695378746e-07, "loss": 0.9449, "step": 38084 }, { "epoch": 0.72, "learning_rate": 9.687610094964317e-07, "loss": 0.8115, "step": 38085 }, { "epoch": 0.72, "learning_rate": 9.68640255172588e-07, "loss": 0.6354, "step": 38086 }, { "epoch": 0.72, "learning_rate": 9.685195065667954e-07, "loss": 1.1726, "step": 38087 }, { "epoch": 0.72, "learning_rate": 9.683987636795023e-07, "loss": 0.9924, "step": 38088 }, { "epoch": 0.72, "learning_rate": 9.68278026511163e-07, "loss": 1.0732, "step": 38089 }, { "epoch": 0.72, "learning_rate": 9.681572950622257e-07, "loss": 0.747, "step": 38090 }, { "epoch": 0.72, "learning_rate": 9.680365693331424e-07, "loss": 0.9568, "step": 38091 }, { "epoch": 0.72, "learning_rate": 9.67915849324363e-07, "loss": 1.0398, "step": 38092 }, { "epoch": 0.72, "learning_rate": 9.677951350363393e-07, "loss": 1.0836, "step": 38093 }, { "epoch": 0.72, "learning_rate": 9.676744264695214e-07, "loss": 0.8792, "step": 38094 }, { "epoch": 0.72, "learning_rate": 9.6755372362436e-07, "loss": 0.8775, "step": 38095 }, { "epoch": 0.72, "learning_rate": 9.674330265013073e-07, "loss": 0.7362, "step": 38096 }, { "epoch": 0.72, "learning_rate": 9.67312335100811e-07, "loss": 0.972, "step": 38097 }, { "epoch": 0.72, "learning_rate": 9.67191649423324e-07, "loss": 0.6933, "step": 38098 }, { "epoch": 0.72, "learning_rate": 9.670709694692974e-07, "loss": 1.0223, "step": 38099 }, { "epoch": 0.72, "learning_rate": 9.66950295239179e-07, "loss": 1.0291, "step": 38100 }, { "epoch": 0.72, "learning_rate": 9.668296267334229e-07, "loss": 0.9186, "step": 38101 }, { "epoch": 0.72, "learning_rate": 9.667089639524771e-07, "loss": 0.8403, "step": 38102 }, { "epoch": 0.72, "learning_rate": 9.665883068967929e-07, "loss": 0.8567, "step": 38103 }, { "epoch": 0.72, "learning_rate": 9.664676555668212e-07, "loss": 0.782, "step": 38104 }, { "epoch": 0.72, "learning_rate": 9.663470099630124e-07, "loss": 1.0278, "step": 38105 }, { "epoch": 0.72, "learning_rate": 9.662263700858166e-07, "loss": 0.888, "step": 38106 }, { "epoch": 0.72, "learning_rate": 9.661057359356844e-07, "loss": 0.7698, "step": 38107 }, { "epoch": 0.72, "learning_rate": 9.659851075130671e-07, "loss": 0.9265, "step": 38108 }, { "epoch": 0.72, "learning_rate": 9.658644848184132e-07, "loss": 0.903, "step": 38109 }, { "epoch": 0.72, "learning_rate": 9.657438678521754e-07, "loss": 0.8568, "step": 38110 }, { "epoch": 0.72, "learning_rate": 9.656232566148023e-07, "loss": 0.8992, "step": 38111 }, { "epoch": 0.72, "learning_rate": 9.655026511067453e-07, "loss": 1.1385, "step": 38112 }, { "epoch": 0.72, "learning_rate": 9.653820513284539e-07, "loss": 0.9437, "step": 38113 }, { "epoch": 0.72, "learning_rate": 9.652614572803789e-07, "loss": 0.9631, "step": 38114 }, { "epoch": 0.72, "learning_rate": 9.651408689629707e-07, "loss": 0.7827, "step": 38115 }, { "epoch": 0.72, "learning_rate": 9.650202863766793e-07, "loss": 0.9343, "step": 38116 }, { "epoch": 0.72, "learning_rate": 9.648997095219565e-07, "loss": 0.7987, "step": 38117 }, { "epoch": 0.72, "learning_rate": 9.64779138399249e-07, "loss": 1.105, "step": 38118 }, { "epoch": 0.72, "learning_rate": 9.646585730090097e-07, "loss": 0.963, "step": 38119 }, { "epoch": 0.72, "learning_rate": 9.645380133516893e-07, "loss": 0.8684, "step": 38120 }, { "epoch": 0.72, "learning_rate": 9.64417459427735e-07, "loss": 0.9066, "step": 38121 }, { "epoch": 0.72, "learning_rate": 9.642969112376007e-07, "loss": 0.9238, "step": 38122 }, { "epoch": 0.72, "learning_rate": 9.64176368781734e-07, "loss": 0.941, "step": 38123 }, { "epoch": 0.72, "learning_rate": 9.640558320605856e-07, "loss": 0.8759, "step": 38124 }, { "epoch": 0.72, "learning_rate": 9.639353010746052e-07, "loss": 0.9871, "step": 38125 }, { "epoch": 0.72, "learning_rate": 9.638147758242436e-07, "loss": 1.0382, "step": 38126 }, { "epoch": 0.72, "learning_rate": 9.636942563099504e-07, "loss": 0.7987, "step": 38127 }, { "epoch": 0.72, "learning_rate": 9.63573742532176e-07, "loss": 0.8584, "step": 38128 }, { "epoch": 0.72, "learning_rate": 9.634532344913707e-07, "loss": 0.6354, "step": 38129 }, { "epoch": 0.72, "learning_rate": 9.633327321879823e-07, "loss": 0.9315, "step": 38130 }, { "epoch": 0.72, "learning_rate": 9.632122356224644e-07, "loss": 1.1675, "step": 38131 }, { "epoch": 0.72, "learning_rate": 9.630917447952636e-07, "loss": 1.028, "step": 38132 }, { "epoch": 0.72, "learning_rate": 9.629712597068314e-07, "loss": 0.7463, "step": 38133 }, { "epoch": 0.72, "learning_rate": 9.62850780357617e-07, "loss": 0.8846, "step": 38134 }, { "epoch": 0.72, "learning_rate": 9.627303067480708e-07, "loss": 0.8257, "step": 38135 }, { "epoch": 0.72, "learning_rate": 9.626098388786427e-07, "loss": 1.0382, "step": 38136 }, { "epoch": 0.72, "learning_rate": 9.624893767497822e-07, "loss": 0.9417, "step": 38137 }, { "epoch": 0.72, "learning_rate": 9.623689203619402e-07, "loss": 0.9686, "step": 38138 }, { "epoch": 0.72, "learning_rate": 9.622484697155637e-07, "loss": 0.9321, "step": 38139 }, { "epoch": 0.72, "learning_rate": 9.62128024811105e-07, "loss": 0.8271, "step": 38140 }, { "epoch": 0.72, "learning_rate": 9.620075856490142e-07, "loss": 0.7785, "step": 38141 }, { "epoch": 0.72, "learning_rate": 9.61887152229738e-07, "loss": 0.7881, "step": 38142 }, { "epoch": 0.72, "learning_rate": 9.617667245537298e-07, "loss": 1.091, "step": 38143 }, { "epoch": 0.72, "learning_rate": 9.616463026214368e-07, "loss": 1.0707, "step": 38144 }, { "epoch": 0.72, "learning_rate": 9.615258864333091e-07, "loss": 0.9348, "step": 38145 }, { "epoch": 0.72, "learning_rate": 9.614054759897966e-07, "loss": 0.8666, "step": 38146 }, { "epoch": 0.72, "learning_rate": 9.61285071291349e-07, "loss": 0.899, "step": 38147 }, { "epoch": 0.72, "learning_rate": 9.611646723384157e-07, "loss": 0.8245, "step": 38148 }, { "epoch": 0.72, "learning_rate": 9.610442791314464e-07, "loss": 0.9797, "step": 38149 }, { "epoch": 0.72, "learning_rate": 9.609238916708913e-07, "loss": 1.0504, "step": 38150 }, { "epoch": 0.72, "learning_rate": 9.608035099571975e-07, "loss": 0.8981, "step": 38151 }, { "epoch": 0.72, "learning_rate": 9.60683133990818e-07, "loss": 0.9002, "step": 38152 }, { "epoch": 0.72, "learning_rate": 9.605627637721996e-07, "loss": 1.021, "step": 38153 }, { "epoch": 0.72, "learning_rate": 9.604423993017924e-07, "loss": 0.8016, "step": 38154 }, { "epoch": 0.72, "learning_rate": 9.603220405800465e-07, "loss": 1.0645, "step": 38155 }, { "epoch": 0.72, "learning_rate": 9.602016876074107e-07, "loss": 1.1852, "step": 38156 }, { "epoch": 0.72, "learning_rate": 9.600813403843346e-07, "loss": 0.9474, "step": 38157 }, { "epoch": 0.72, "learning_rate": 9.599609989112674e-07, "loss": 1.0037, "step": 38158 }, { "epoch": 0.72, "learning_rate": 9.598406631886598e-07, "loss": 0.8895, "step": 38159 }, { "epoch": 0.72, "learning_rate": 9.59720333216958e-07, "loss": 0.9307, "step": 38160 }, { "epoch": 0.72, "learning_rate": 9.59600008996614e-07, "loss": 0.8456, "step": 38161 }, { "epoch": 0.72, "learning_rate": 9.594796905280773e-07, "loss": 1.0208, "step": 38162 }, { "epoch": 0.72, "learning_rate": 9.593593778117947e-07, "loss": 0.9932, "step": 38163 }, { "epoch": 0.72, "learning_rate": 9.592390708482185e-07, "loss": 0.822, "step": 38164 }, { "epoch": 0.72, "learning_rate": 9.591187696377953e-07, "loss": 1.0903, "step": 38165 }, { "epoch": 0.72, "learning_rate": 9.589984741809758e-07, "loss": 0.9243, "step": 38166 }, { "epoch": 0.72, "learning_rate": 9.588781844782082e-07, "loss": 0.9773, "step": 38167 }, { "epoch": 0.72, "learning_rate": 9.587579005299428e-07, "loss": 0.9795, "step": 38168 }, { "epoch": 0.72, "learning_rate": 9.586376223366286e-07, "loss": 1.0365, "step": 38169 }, { "epoch": 0.72, "learning_rate": 9.585173498987127e-07, "loss": 0.9287, "step": 38170 }, { "epoch": 0.72, "learning_rate": 9.583970832166476e-07, "loss": 0.7355, "step": 38171 }, { "epoch": 0.72, "learning_rate": 9.582768222908796e-07, "loss": 0.8279, "step": 38172 }, { "epoch": 0.72, "learning_rate": 9.581565671218585e-07, "loss": 0.8755, "step": 38173 }, { "epoch": 0.72, "learning_rate": 9.580363177100335e-07, "loss": 0.8615, "step": 38174 }, { "epoch": 0.72, "learning_rate": 9.579160740558536e-07, "loss": 1.0536, "step": 38175 }, { "epoch": 0.72, "learning_rate": 9.577958361597679e-07, "loss": 1.0469, "step": 38176 }, { "epoch": 0.72, "learning_rate": 9.57675604022225e-07, "loss": 0.7587, "step": 38177 }, { "epoch": 0.72, "learning_rate": 9.575553776436755e-07, "loss": 0.7633, "step": 38178 }, { "epoch": 0.72, "learning_rate": 9.574351570245649e-07, "loss": 0.6319, "step": 38179 }, { "epoch": 0.72, "learning_rate": 9.573149421653458e-07, "loss": 1.1385, "step": 38180 }, { "epoch": 0.72, "learning_rate": 9.571947330664647e-07, "loss": 0.9506, "step": 38181 }, { "epoch": 0.72, "learning_rate": 9.570745297283701e-07, "loss": 0.8363, "step": 38182 }, { "epoch": 0.72, "learning_rate": 9.569543321515137e-07, "loss": 0.8355, "step": 38183 }, { "epoch": 0.72, "learning_rate": 9.568341403363418e-07, "loss": 0.852, "step": 38184 }, { "epoch": 0.72, "learning_rate": 9.56713954283304e-07, "loss": 0.8945, "step": 38185 }, { "epoch": 0.72, "learning_rate": 9.565937739928484e-07, "loss": 0.9931, "step": 38186 }, { "epoch": 0.72, "learning_rate": 9.56473599465425e-07, "loss": 1.1768, "step": 38187 }, { "epoch": 0.72, "learning_rate": 9.563534307014815e-07, "loss": 1.0495, "step": 38188 }, { "epoch": 0.72, "learning_rate": 9.56233267701467e-07, "loss": 0.9885, "step": 38189 }, { "epoch": 0.72, "learning_rate": 9.56113110465831e-07, "loss": 0.8897, "step": 38190 }, { "epoch": 0.72, "learning_rate": 9.559929589950195e-07, "loss": 0.8271, "step": 38191 }, { "epoch": 0.72, "learning_rate": 9.55872813289485e-07, "loss": 0.8988, "step": 38192 }, { "epoch": 0.72, "learning_rate": 9.55752673349673e-07, "loss": 1.0656, "step": 38193 }, { "epoch": 0.72, "learning_rate": 9.556325391760331e-07, "loss": 1.1088, "step": 38194 }, { "epoch": 0.72, "learning_rate": 9.55512410769014e-07, "loss": 0.7177, "step": 38195 }, { "epoch": 0.72, "learning_rate": 9.553922881290643e-07, "loss": 0.9753, "step": 38196 }, { "epoch": 0.72, "learning_rate": 9.552721712566323e-07, "loss": 0.8021, "step": 38197 }, { "epoch": 0.72, "learning_rate": 9.551520601521666e-07, "loss": 0.7711, "step": 38198 }, { "epoch": 0.72, "learning_rate": 9.55031954816117e-07, "loss": 1.0153, "step": 38199 }, { "epoch": 0.72, "learning_rate": 9.549118552489284e-07, "loss": 1.1627, "step": 38200 }, { "epoch": 0.72, "learning_rate": 9.547917614510538e-07, "loss": 0.769, "step": 38201 }, { "epoch": 0.72, "learning_rate": 9.546716734229384e-07, "loss": 0.9683, "step": 38202 }, { "epoch": 0.72, "learning_rate": 9.545515911650306e-07, "loss": 0.9415, "step": 38203 }, { "epoch": 0.72, "learning_rate": 9.544315146777812e-07, "loss": 0.8523, "step": 38204 }, { "epoch": 0.72, "learning_rate": 9.543114439616365e-07, "loss": 1.1816, "step": 38205 }, { "epoch": 0.72, "learning_rate": 9.54191379017046e-07, "loss": 1.0206, "step": 38206 }, { "epoch": 0.72, "learning_rate": 9.540713198444568e-07, "loss": 0.8384, "step": 38207 }, { "epoch": 0.72, "learning_rate": 9.539512664443183e-07, "loss": 0.8938, "step": 38208 }, { "epoch": 0.72, "learning_rate": 9.53831218817078e-07, "loss": 0.941, "step": 38209 }, { "epoch": 0.72, "learning_rate": 9.537111769631848e-07, "loss": 0.8596, "step": 38210 }, { "epoch": 0.72, "learning_rate": 9.535911408830876e-07, "loss": 0.8427, "step": 38211 }, { "epoch": 0.72, "learning_rate": 9.534711105772318e-07, "loss": 1.0421, "step": 38212 }, { "epoch": 0.72, "learning_rate": 9.533510860460693e-07, "loss": 0.8013, "step": 38213 }, { "epoch": 0.72, "learning_rate": 9.532310672900455e-07, "loss": 0.9707, "step": 38214 }, { "epoch": 0.72, "learning_rate": 9.531110543096092e-07, "loss": 0.6968, "step": 38215 }, { "epoch": 0.72, "learning_rate": 9.529910471052093e-07, "loss": 0.9567, "step": 38216 }, { "epoch": 0.72, "learning_rate": 9.52871045677293e-07, "loss": 0.9828, "step": 38217 }, { "epoch": 0.72, "learning_rate": 9.527510500263087e-07, "loss": 1.1216, "step": 38218 }, { "epoch": 0.72, "learning_rate": 9.52631060152705e-07, "loss": 0.729, "step": 38219 }, { "epoch": 0.72, "learning_rate": 9.525110760569301e-07, "loss": 0.9638, "step": 38220 }, { "epoch": 0.72, "learning_rate": 9.523910977394296e-07, "loss": 0.8831, "step": 38221 }, { "epoch": 0.72, "learning_rate": 9.522711252006551e-07, "loss": 0.8333, "step": 38222 }, { "epoch": 0.72, "learning_rate": 9.521511584410517e-07, "loss": 0.811, "step": 38223 }, { "epoch": 0.72, "learning_rate": 9.520311974610677e-07, "loss": 0.6208, "step": 38224 }, { "epoch": 0.72, "learning_rate": 9.519112422611535e-07, "loss": 1.1198, "step": 38225 }, { "epoch": 0.72, "learning_rate": 9.517912928417545e-07, "loss": 0.9742, "step": 38226 }, { "epoch": 0.72, "learning_rate": 9.516713492033191e-07, "loss": 0.8163, "step": 38227 }, { "epoch": 0.72, "learning_rate": 9.515514113462956e-07, "loss": 0.7819, "step": 38228 }, { "epoch": 0.72, "learning_rate": 9.514314792711316e-07, "loss": 0.75, "step": 38229 }, { "epoch": 0.72, "learning_rate": 9.513115529782749e-07, "loss": 0.7735, "step": 38230 }, { "epoch": 0.72, "learning_rate": 9.511916324681736e-07, "loss": 0.9794, "step": 38231 }, { "epoch": 0.72, "learning_rate": 9.510717177412759e-07, "loss": 1.0576, "step": 38232 }, { "epoch": 0.72, "learning_rate": 9.509518087980271e-07, "loss": 0.804, "step": 38233 }, { "epoch": 0.72, "learning_rate": 9.508319056388787e-07, "loss": 0.8849, "step": 38234 }, { "epoch": 0.72, "learning_rate": 9.507120082642757e-07, "loss": 0.7855, "step": 38235 }, { "epoch": 0.72, "learning_rate": 9.505921166746662e-07, "loss": 0.8049, "step": 38236 }, { "epoch": 0.72, "learning_rate": 9.504722308704986e-07, "loss": 0.9785, "step": 38237 }, { "epoch": 0.72, "learning_rate": 9.5035235085222e-07, "loss": 0.8854, "step": 38238 }, { "epoch": 0.72, "learning_rate": 9.502324766202781e-07, "loss": 0.8896, "step": 38239 }, { "epoch": 0.72, "learning_rate": 9.501126081751208e-07, "loss": 0.895, "step": 38240 }, { "epoch": 0.72, "learning_rate": 9.499927455171962e-07, "loss": 0.7344, "step": 38241 }, { "epoch": 0.72, "learning_rate": 9.498728886469497e-07, "loss": 0.8392, "step": 38242 }, { "epoch": 0.72, "learning_rate": 9.497530375648317e-07, "loss": 0.9153, "step": 38243 }, { "epoch": 0.72, "learning_rate": 9.496331922712876e-07, "loss": 1.1041, "step": 38244 }, { "epoch": 0.72, "learning_rate": 9.49513352766765e-07, "loss": 1.0153, "step": 38245 }, { "epoch": 0.72, "learning_rate": 9.493935190517134e-07, "loss": 0.7587, "step": 38246 }, { "epoch": 0.72, "learning_rate": 9.492736911265779e-07, "loss": 0.9966, "step": 38247 }, { "epoch": 0.72, "learning_rate": 9.491538689918073e-07, "loss": 0.7583, "step": 38248 }, { "epoch": 0.72, "learning_rate": 9.490340526478484e-07, "loss": 0.9638, "step": 38249 }, { "epoch": 0.72, "learning_rate": 9.489142420951488e-07, "loss": 1.2238, "step": 38250 }, { "epoch": 0.72, "learning_rate": 9.487944373341556e-07, "loss": 0.9471, "step": 38251 }, { "epoch": 0.72, "learning_rate": 9.48674638365317e-07, "loss": 0.874, "step": 38252 }, { "epoch": 0.72, "learning_rate": 9.485548451890802e-07, "loss": 0.8057, "step": 38253 }, { "epoch": 0.72, "learning_rate": 9.484350578058904e-07, "loss": 0.7842, "step": 38254 }, { "epoch": 0.72, "learning_rate": 9.483152762161982e-07, "loss": 0.9063, "step": 38255 }, { "epoch": 0.72, "learning_rate": 9.481955004204483e-07, "loss": 1.1959, "step": 38256 }, { "epoch": 0.72, "learning_rate": 9.480757304190887e-07, "loss": 0.9024, "step": 38257 }, { "epoch": 0.72, "learning_rate": 9.47955966212567e-07, "loss": 0.9543, "step": 38258 }, { "epoch": 0.72, "learning_rate": 9.4783620780133e-07, "loss": 0.808, "step": 38259 }, { "epoch": 0.72, "learning_rate": 9.477164551858251e-07, "loss": 0.7922, "step": 38260 }, { "epoch": 0.72, "learning_rate": 9.475967083664995e-07, "loss": 0.8631, "step": 38261 }, { "epoch": 0.72, "learning_rate": 9.474769673438008e-07, "loss": 1.0706, "step": 38262 }, { "epoch": 0.72, "learning_rate": 9.473572321181737e-07, "loss": 0.8799, "step": 38263 }, { "epoch": 0.72, "learning_rate": 9.472375026900691e-07, "loss": 0.8959, "step": 38264 }, { "epoch": 0.72, "learning_rate": 9.471177790599309e-07, "loss": 0.8658, "step": 38265 }, { "epoch": 0.72, "learning_rate": 9.469980612282067e-07, "loss": 0.8766, "step": 38266 }, { "epoch": 0.72, "learning_rate": 9.468783491953456e-07, "loss": 0.8469, "step": 38267 }, { "epoch": 0.72, "learning_rate": 9.467586429617926e-07, "loss": 1.1209, "step": 38268 }, { "epoch": 0.72, "learning_rate": 9.466389425279951e-07, "loss": 0.9366, "step": 38269 }, { "epoch": 0.72, "learning_rate": 9.465192478943999e-07, "loss": 0.8463, "step": 38270 }, { "epoch": 0.72, "learning_rate": 9.463995590614544e-07, "loss": 0.8115, "step": 38271 }, { "epoch": 0.72, "learning_rate": 9.462798760296052e-07, "loss": 0.7945, "step": 38272 }, { "epoch": 0.72, "learning_rate": 9.461601987992993e-07, "loss": 0.7841, "step": 38273 }, { "epoch": 0.72, "learning_rate": 9.460405273709846e-07, "loss": 0.8967, "step": 38274 }, { "epoch": 0.72, "learning_rate": 9.459208617451051e-07, "loss": 0.9907, "step": 38275 }, { "epoch": 0.72, "learning_rate": 9.458012019221113e-07, "loss": 0.7382, "step": 38276 }, { "epoch": 0.72, "learning_rate": 9.456815479024473e-07, "loss": 0.8621, "step": 38277 }, { "epoch": 0.72, "learning_rate": 9.455618996865606e-07, "loss": 1.0201, "step": 38278 }, { "epoch": 0.72, "learning_rate": 9.45442257274898e-07, "loss": 0.7289, "step": 38279 }, { "epoch": 0.72, "learning_rate": 9.453226206679067e-07, "loss": 0.8624, "step": 38280 }, { "epoch": 0.72, "learning_rate": 9.452029898660329e-07, "loss": 1.0027, "step": 38281 }, { "epoch": 0.72, "learning_rate": 9.450833648697233e-07, "loss": 0.8573, "step": 38282 }, { "epoch": 0.72, "learning_rate": 9.449637456794258e-07, "loss": 1.0297, "step": 38283 }, { "epoch": 0.72, "learning_rate": 9.448441322955843e-07, "loss": 0.9417, "step": 38284 }, { "epoch": 0.72, "learning_rate": 9.447245247186488e-07, "loss": 0.6952, "step": 38285 }, { "epoch": 0.72, "learning_rate": 9.446049229490631e-07, "loss": 0.998, "step": 38286 }, { "epoch": 0.72, "learning_rate": 9.444853269872744e-07, "loss": 1.1841, "step": 38287 }, { "epoch": 0.72, "learning_rate": 9.443657368337314e-07, "loss": 0.9558, "step": 38288 }, { "epoch": 0.72, "learning_rate": 9.442461524888782e-07, "loss": 0.7539, "step": 38289 }, { "epoch": 0.72, "learning_rate": 9.441265739531622e-07, "loss": 0.7444, "step": 38290 }, { "epoch": 0.72, "learning_rate": 9.440070012270297e-07, "loss": 0.7588, "step": 38291 }, { "epoch": 0.72, "learning_rate": 9.438874343109275e-07, "loss": 1.0244, "step": 38292 }, { "epoch": 0.72, "learning_rate": 9.437678732053022e-07, "loss": 0.9934, "step": 38293 }, { "epoch": 0.72, "learning_rate": 9.436483179105993e-07, "loss": 0.9426, "step": 38294 }, { "epoch": 0.72, "learning_rate": 9.435287684272674e-07, "loss": 0.8348, "step": 38295 }, { "epoch": 0.72, "learning_rate": 9.434092247557491e-07, "loss": 0.968, "step": 38296 }, { "epoch": 0.72, "learning_rate": 9.43289686896495e-07, "loss": 0.8392, "step": 38297 }, { "epoch": 0.72, "learning_rate": 9.431701548499486e-07, "loss": 1.0473, "step": 38298 }, { "epoch": 0.72, "learning_rate": 9.430506286165569e-07, "loss": 1.1445, "step": 38299 }, { "epoch": 0.72, "learning_rate": 9.429311081967666e-07, "loss": 0.8604, "step": 38300 }, { "epoch": 0.72, "learning_rate": 9.428115935910239e-07, "loss": 0.8596, "step": 38301 }, { "epoch": 0.72, "learning_rate": 9.426920847997747e-07, "loss": 0.7814, "step": 38302 }, { "epoch": 0.72, "learning_rate": 9.425725818234657e-07, "loss": 0.9395, "step": 38303 }, { "epoch": 0.72, "learning_rate": 9.424530846625437e-07, "loss": 0.885, "step": 38304 }, { "epoch": 0.72, "learning_rate": 9.423335933174527e-07, "loss": 0.8478, "step": 38305 }, { "epoch": 0.72, "learning_rate": 9.422141077886416e-07, "loss": 1.0223, "step": 38306 }, { "epoch": 0.72, "learning_rate": 9.420946280765547e-07, "loss": 1.1778, "step": 38307 }, { "epoch": 0.72, "learning_rate": 9.419751541816377e-07, "loss": 0.8174, "step": 38308 }, { "epoch": 0.72, "learning_rate": 9.418556861043393e-07, "loss": 0.9751, "step": 38309 }, { "epoch": 0.72, "learning_rate": 9.417362238451033e-07, "loss": 0.9519, "step": 38310 }, { "epoch": 0.72, "learning_rate": 9.416167674043767e-07, "loss": 1.0374, "step": 38311 }, { "epoch": 0.72, "learning_rate": 9.41497316782605e-07, "loss": 1.1063, "step": 38312 }, { "epoch": 0.72, "learning_rate": 9.413778719802344e-07, "loss": 0.925, "step": 38313 }, { "epoch": 0.72, "learning_rate": 9.412584329977112e-07, "loss": 0.8932, "step": 38314 }, { "epoch": 0.72, "learning_rate": 9.411389998354811e-07, "loss": 0.9679, "step": 38315 }, { "epoch": 0.72, "learning_rate": 9.410195724939913e-07, "loss": 0.869, "step": 38316 }, { "epoch": 0.72, "learning_rate": 9.409001509736848e-07, "loss": 0.7945, "step": 38317 }, { "epoch": 0.72, "learning_rate": 9.407807352750109e-07, "loss": 1.0287, "step": 38318 }, { "epoch": 0.72, "learning_rate": 9.406613253984134e-07, "loss": 0.8001, "step": 38319 }, { "epoch": 0.72, "learning_rate": 9.405419213443384e-07, "loss": 0.785, "step": 38320 }, { "epoch": 0.72, "learning_rate": 9.404225231132322e-07, "loss": 0.8966, "step": 38321 }, { "epoch": 0.72, "learning_rate": 9.403031307055405e-07, "loss": 0.8393, "step": 38322 }, { "epoch": 0.72, "learning_rate": 9.401837441217088e-07, "loss": 0.9444, "step": 38323 }, { "epoch": 0.72, "learning_rate": 9.400643633621834e-07, "loss": 0.9051, "step": 38324 }, { "epoch": 0.72, "learning_rate": 9.399449884274108e-07, "loss": 1.1747, "step": 38325 }, { "epoch": 0.72, "learning_rate": 9.39825619317834e-07, "loss": 0.8121, "step": 38326 }, { "epoch": 0.72, "learning_rate": 9.397062560339012e-07, "loss": 0.8392, "step": 38327 }, { "epoch": 0.72, "learning_rate": 9.395868985760584e-07, "loss": 0.8301, "step": 38328 }, { "epoch": 0.72, "learning_rate": 9.394675469447484e-07, "loss": 0.8542, "step": 38329 }, { "epoch": 0.72, "learning_rate": 9.393482011404206e-07, "loss": 0.9676, "step": 38330 }, { "epoch": 0.72, "learning_rate": 9.39228861163518e-07, "loss": 1.1381, "step": 38331 }, { "epoch": 0.72, "learning_rate": 9.391095270144868e-07, "loss": 0.8096, "step": 38332 }, { "epoch": 0.72, "learning_rate": 9.38990198693773e-07, "loss": 0.6875, "step": 38333 }, { "epoch": 0.72, "learning_rate": 9.388708762018217e-07, "loss": 0.8876, "step": 38334 }, { "epoch": 0.72, "learning_rate": 9.387515595390786e-07, "loss": 0.829, "step": 38335 }, { "epoch": 0.72, "learning_rate": 9.386322487059896e-07, "loss": 0.8912, "step": 38336 }, { "epoch": 0.72, "learning_rate": 9.385129437030005e-07, "loss": 1.0319, "step": 38337 }, { "epoch": 0.72, "learning_rate": 9.383936445305547e-07, "loss": 1.0981, "step": 38338 }, { "epoch": 0.72, "learning_rate": 9.382743511891007e-07, "loss": 0.7718, "step": 38339 }, { "epoch": 0.72, "learning_rate": 9.381550636790818e-07, "loss": 0.8578, "step": 38340 }, { "epoch": 0.72, "learning_rate": 9.380357820009436e-07, "loss": 0.8162, "step": 38341 }, { "epoch": 0.72, "learning_rate": 9.379165061551321e-07, "loss": 0.6696, "step": 38342 }, { "epoch": 0.72, "learning_rate": 9.377972361420926e-07, "loss": 0.9677, "step": 38343 }, { "epoch": 0.72, "learning_rate": 9.376779719622703e-07, "loss": 0.9623, "step": 38344 }, { "epoch": 0.72, "learning_rate": 9.375587136161101e-07, "loss": 0.8652, "step": 38345 }, { "epoch": 0.72, "learning_rate": 9.374394611040591e-07, "loss": 0.9368, "step": 38346 }, { "epoch": 0.72, "learning_rate": 9.373202144265595e-07, "loss": 0.7704, "step": 38347 }, { "epoch": 0.72, "learning_rate": 9.37200973584059e-07, "loss": 0.9067, "step": 38348 }, { "epoch": 0.72, "learning_rate": 9.370817385770031e-07, "loss": 0.9767, "step": 38349 }, { "epoch": 0.72, "learning_rate": 9.369625094058343e-07, "loss": 1.0038, "step": 38350 }, { "epoch": 0.72, "learning_rate": 9.368432860710013e-07, "loss": 1.0476, "step": 38351 }, { "epoch": 0.72, "learning_rate": 9.367240685729468e-07, "loss": 0.8258, "step": 38352 }, { "epoch": 0.72, "learning_rate": 9.366048569121164e-07, "loss": 0.7331, "step": 38353 }, { "epoch": 0.72, "learning_rate": 9.364856510889558e-07, "loss": 0.5688, "step": 38354 }, { "epoch": 0.72, "learning_rate": 9.363664511039098e-07, "loss": 1.1159, "step": 38355 }, { "epoch": 0.72, "learning_rate": 9.362472569574235e-07, "loss": 0.8761, "step": 38356 }, { "epoch": 0.72, "learning_rate": 9.361280686499419e-07, "loss": 0.7436, "step": 38357 }, { "epoch": 0.72, "learning_rate": 9.360088861819111e-07, "loss": 0.853, "step": 38358 }, { "epoch": 0.72, "learning_rate": 9.358897095537734e-07, "loss": 1.1596, "step": 38359 }, { "epoch": 0.72, "learning_rate": 9.357705387659774e-07, "loss": 0.8427, "step": 38360 }, { "epoch": 0.72, "learning_rate": 9.356513738189651e-07, "loss": 0.7988, "step": 38361 }, { "epoch": 0.72, "learning_rate": 9.355322147131829e-07, "loss": 0.8434, "step": 38362 }, { "epoch": 0.72, "learning_rate": 9.354130614490753e-07, "loss": 1.0237, "step": 38363 }, { "epoch": 0.72, "learning_rate": 9.352939140270875e-07, "loss": 0.627, "step": 38364 }, { "epoch": 0.72, "learning_rate": 9.351747724476639e-07, "loss": 0.7551, "step": 38365 }, { "epoch": 0.72, "learning_rate": 9.350556367112501e-07, "loss": 0.7332, "step": 38366 }, { "epoch": 0.72, "learning_rate": 9.349365068182914e-07, "loss": 0.7368, "step": 38367 }, { "epoch": 0.72, "learning_rate": 9.3481738276923e-07, "loss": 0.7547, "step": 38368 }, { "epoch": 0.72, "learning_rate": 9.346982645645133e-07, "loss": 0.9752, "step": 38369 }, { "epoch": 0.72, "learning_rate": 9.345791522045863e-07, "loss": 1.0616, "step": 38370 }, { "epoch": 0.72, "learning_rate": 9.344600456898909e-07, "loss": 1.0012, "step": 38371 }, { "epoch": 0.72, "learning_rate": 9.343409450208754e-07, "loss": 0.9244, "step": 38372 }, { "epoch": 0.72, "learning_rate": 9.342218501979819e-07, "loss": 0.7963, "step": 38373 }, { "epoch": 0.72, "learning_rate": 9.341027612216561e-07, "loss": 1.0768, "step": 38374 }, { "epoch": 0.72, "learning_rate": 9.339836780923425e-07, "loss": 0.9146, "step": 38375 }, { "epoch": 0.72, "learning_rate": 9.33864600810486e-07, "loss": 1.0296, "step": 38376 }, { "epoch": 0.72, "learning_rate": 9.33745529376531e-07, "loss": 0.8926, "step": 38377 }, { "epoch": 0.72, "learning_rate": 9.33626463790922e-07, "loss": 0.7884, "step": 38378 }, { "epoch": 0.72, "learning_rate": 9.335074040541048e-07, "loss": 0.7229, "step": 38379 }, { "epoch": 0.72, "learning_rate": 9.333883501665211e-07, "loss": 1.111, "step": 38380 }, { "epoch": 0.72, "learning_rate": 9.33269302128619e-07, "loss": 0.791, "step": 38381 }, { "epoch": 0.72, "learning_rate": 9.331502599408407e-07, "loss": 0.8114, "step": 38382 }, { "epoch": 0.72, "learning_rate": 9.33031223603631e-07, "loss": 0.9167, "step": 38383 }, { "epoch": 0.72, "learning_rate": 9.329121931174345e-07, "loss": 0.8613, "step": 38384 }, { "epoch": 0.72, "learning_rate": 9.327931684826963e-07, "loss": 0.9698, "step": 38385 }, { "epoch": 0.72, "learning_rate": 9.3267414969986e-07, "loss": 0.6354, "step": 38386 }, { "epoch": 0.72, "learning_rate": 9.325551367693706e-07, "loss": 1.0542, "step": 38387 }, { "epoch": 0.72, "learning_rate": 9.324361296916729e-07, "loss": 0.9434, "step": 38388 }, { "epoch": 0.72, "learning_rate": 9.323171284672089e-07, "loss": 0.8485, "step": 38389 }, { "epoch": 0.72, "learning_rate": 9.321981330964255e-07, "loss": 0.6197, "step": 38390 }, { "epoch": 0.72, "learning_rate": 9.320791435797675e-07, "loss": 0.8073, "step": 38391 }, { "epoch": 0.72, "learning_rate": 9.319601599176758e-07, "loss": 0.8574, "step": 38392 }, { "epoch": 0.72, "learning_rate": 9.318411821105986e-07, "loss": 1.1199, "step": 38393 }, { "epoch": 0.72, "learning_rate": 9.317222101589774e-07, "loss": 0.735, "step": 38394 }, { "epoch": 0.72, "learning_rate": 9.316032440632575e-07, "loss": 0.8404, "step": 38395 }, { "epoch": 0.72, "learning_rate": 9.314842838238831e-07, "loss": 0.8928, "step": 38396 }, { "epoch": 0.72, "learning_rate": 9.31365329441298e-07, "loss": 0.9572, "step": 38397 }, { "epoch": 0.72, "learning_rate": 9.312463809159475e-07, "loss": 0.7769, "step": 38398 }, { "epoch": 0.72, "learning_rate": 9.311274382482735e-07, "loss": 0.8749, "step": 38399 }, { "epoch": 0.72, "learning_rate": 9.310085014387232e-07, "loss": 1.1429, "step": 38400 }, { "epoch": 0.72, "learning_rate": 9.30889570487738e-07, "loss": 0.8356, "step": 38401 }, { "epoch": 0.72, "learning_rate": 9.307706453957632e-07, "loss": 0.806, "step": 38402 }, { "epoch": 0.72, "learning_rate": 9.306517261632425e-07, "loss": 0.6998, "step": 38403 }, { "epoch": 0.72, "learning_rate": 9.305328127906205e-07, "loss": 1.0039, "step": 38404 }, { "epoch": 0.72, "learning_rate": 9.304139052783406e-07, "loss": 1.0629, "step": 38405 }, { "epoch": 0.72, "learning_rate": 9.302950036268471e-07, "loss": 1.0814, "step": 38406 }, { "epoch": 0.72, "learning_rate": 9.301761078365848e-07, "loss": 0.9663, "step": 38407 }, { "epoch": 0.72, "learning_rate": 9.30057217907995e-07, "loss": 0.8737, "step": 38408 }, { "epoch": 0.72, "learning_rate": 9.299383338415252e-07, "loss": 0.7763, "step": 38409 }, { "epoch": 0.72, "learning_rate": 9.298194556376167e-07, "loss": 0.773, "step": 38410 }, { "epoch": 0.72, "learning_rate": 9.297005832967132e-07, "loss": 0.8339, "step": 38411 }, { "epoch": 0.72, "learning_rate": 9.295817168192614e-07, "loss": 1.3195, "step": 38412 }, { "epoch": 0.72, "learning_rate": 9.294628562057023e-07, "loss": 0.8919, "step": 38413 }, { "epoch": 0.72, "learning_rate": 9.293440014564809e-07, "loss": 0.8663, "step": 38414 }, { "epoch": 0.72, "learning_rate": 9.292251525720408e-07, "loss": 0.8931, "step": 38415 }, { "epoch": 0.72, "learning_rate": 9.29106309552826e-07, "loss": 0.9031, "step": 38416 }, { "epoch": 0.72, "learning_rate": 9.289874723992798e-07, "loss": 0.7421, "step": 38417 }, { "epoch": 0.72, "learning_rate": 9.288686411118463e-07, "loss": 0.807, "step": 38418 }, { "epoch": 0.72, "learning_rate": 9.287498156909703e-07, "loss": 1.1987, "step": 38419 }, { "epoch": 0.72, "learning_rate": 9.286309961370921e-07, "loss": 0.8249, "step": 38420 }, { "epoch": 0.72, "learning_rate": 9.285121824506596e-07, "loss": 1.0578, "step": 38421 }, { "epoch": 0.72, "learning_rate": 9.283933746321133e-07, "loss": 0.9385, "step": 38422 }, { "epoch": 0.72, "learning_rate": 9.282745726818981e-07, "loss": 1.0131, "step": 38423 }, { "epoch": 0.72, "learning_rate": 9.281557766004576e-07, "loss": 1.0624, "step": 38424 }, { "epoch": 0.72, "learning_rate": 9.280369863882352e-07, "loss": 1.083, "step": 38425 }, { "epoch": 0.72, "learning_rate": 9.279182020456742e-07, "loss": 1.0201, "step": 38426 }, { "epoch": 0.72, "learning_rate": 9.277994235732188e-07, "loss": 0.7589, "step": 38427 }, { "epoch": 0.73, "learning_rate": 9.276806509713129e-07, "loss": 0.7366, "step": 38428 }, { "epoch": 0.73, "learning_rate": 9.275618842403974e-07, "loss": 0.8282, "step": 38429 }, { "epoch": 0.73, "learning_rate": 9.274431233809194e-07, "loss": 0.9355, "step": 38430 }, { "epoch": 0.73, "learning_rate": 9.273243683933197e-07, "loss": 1.28, "step": 38431 }, { "epoch": 0.73, "learning_rate": 9.272056192780418e-07, "loss": 0.9716, "step": 38432 }, { "epoch": 0.73, "learning_rate": 9.270868760355315e-07, "loss": 0.9363, "step": 38433 }, { "epoch": 0.73, "learning_rate": 9.269681386662297e-07, "loss": 0.8481, "step": 38434 }, { "epoch": 0.73, "learning_rate": 9.268494071705808e-07, "loss": 0.8133, "step": 38435 }, { "epoch": 0.73, "learning_rate": 9.267306815490279e-07, "loss": 0.779, "step": 38436 }, { "epoch": 0.73, "learning_rate": 9.266119618020144e-07, "loss": 1.1247, "step": 38437 }, { "epoch": 0.73, "learning_rate": 9.264932479299834e-07, "loss": 0.9425, "step": 38438 }, { "epoch": 0.73, "learning_rate": 9.263745399333787e-07, "loss": 0.8575, "step": 38439 }, { "epoch": 0.73, "learning_rate": 9.262558378126441e-07, "loss": 0.9068, "step": 38440 }, { "epoch": 0.73, "learning_rate": 9.261371415682199e-07, "loss": 0.8229, "step": 38441 }, { "epoch": 0.73, "learning_rate": 9.260184512005532e-07, "loss": 0.9013, "step": 38442 }, { "epoch": 0.73, "learning_rate": 9.258997667100844e-07, "loss": 1.0086, "step": 38443 }, { "epoch": 0.73, "learning_rate": 9.257810880972579e-07, "loss": 1.0749, "step": 38444 }, { "epoch": 0.73, "learning_rate": 9.256624153625162e-07, "loss": 0.9542, "step": 38445 }, { "epoch": 0.73, "learning_rate": 9.255437485063032e-07, "loss": 0.6234, "step": 38446 }, { "epoch": 0.73, "learning_rate": 9.254250875290613e-07, "loss": 0.9415, "step": 38447 }, { "epoch": 0.73, "learning_rate": 9.253064324312339e-07, "loss": 0.9465, "step": 38448 }, { "epoch": 0.73, "learning_rate": 9.251877832132647e-07, "loss": 1.0782, "step": 38449 }, { "epoch": 0.73, "learning_rate": 9.250691398755946e-07, "loss": 0.9051, "step": 38450 }, { "epoch": 0.73, "learning_rate": 9.249505024186695e-07, "loss": 0.9453, "step": 38451 }, { "epoch": 0.73, "learning_rate": 9.248318708429301e-07, "loss": 0.6827, "step": 38452 }, { "epoch": 0.73, "learning_rate": 9.247132451488194e-07, "loss": 0.9852, "step": 38453 }, { "epoch": 0.73, "learning_rate": 9.245946253367829e-07, "loss": 0.7792, "step": 38454 }, { "epoch": 0.73, "learning_rate": 9.24476011407261e-07, "loss": 1.0301, "step": 38455 }, { "epoch": 0.73, "learning_rate": 9.243574033606973e-07, "loss": 1.0131, "step": 38456 }, { "epoch": 0.73, "learning_rate": 9.242388011975346e-07, "loss": 0.89, "step": 38457 }, { "epoch": 0.73, "learning_rate": 9.24120204918216e-07, "loss": 0.9005, "step": 38458 }, { "epoch": 0.73, "learning_rate": 9.240016145231842e-07, "loss": 0.9487, "step": 38459 }, { "epoch": 0.73, "learning_rate": 9.23883030012882e-07, "loss": 0.8856, "step": 38460 }, { "epoch": 0.73, "learning_rate": 9.237644513877531e-07, "loss": 0.6782, "step": 38461 }, { "epoch": 0.73, "learning_rate": 9.236458786482377e-07, "loss": 1.0373, "step": 38462 }, { "epoch": 0.73, "learning_rate": 9.235273117947821e-07, "loss": 0.7787, "step": 38463 }, { "epoch": 0.73, "learning_rate": 9.234087508278264e-07, "loss": 0.78, "step": 38464 }, { "epoch": 0.73, "learning_rate": 9.232901957478139e-07, "loss": 0.7629, "step": 38465 }, { "epoch": 0.73, "learning_rate": 9.231716465551876e-07, "loss": 0.9752, "step": 38466 }, { "epoch": 0.73, "learning_rate": 9.230531032503901e-07, "loss": 0.8199, "step": 38467 }, { "epoch": 0.73, "learning_rate": 9.229345658338637e-07, "loss": 1.1113, "step": 38468 }, { "epoch": 0.73, "learning_rate": 9.228160343060513e-07, "loss": 1.0241, "step": 38469 }, { "epoch": 0.73, "learning_rate": 9.226975086673965e-07, "loss": 0.9456, "step": 38470 }, { "epoch": 0.73, "learning_rate": 9.22578988918339e-07, "loss": 0.8181, "step": 38471 }, { "epoch": 0.73, "learning_rate": 9.22460475059325e-07, "loss": 0.8517, "step": 38472 }, { "epoch": 0.73, "learning_rate": 9.223419670907943e-07, "loss": 0.7751, "step": 38473 }, { "epoch": 0.73, "learning_rate": 9.222234650131895e-07, "loss": 0.9749, "step": 38474 }, { "epoch": 0.73, "learning_rate": 9.221049688269554e-07, "loss": 0.9634, "step": 38475 }, { "epoch": 0.73, "learning_rate": 9.219864785325325e-07, "loss": 1.0271, "step": 38476 }, { "epoch": 0.73, "learning_rate": 9.218679941303635e-07, "loss": 0.8743, "step": 38477 }, { "epoch": 0.73, "learning_rate": 9.217495156208909e-07, "loss": 0.7805, "step": 38478 }, { "epoch": 0.73, "learning_rate": 9.216310430045575e-07, "loss": 0.7314, "step": 38479 }, { "epoch": 0.73, "learning_rate": 9.21512576281805e-07, "loss": 0.7762, "step": 38480 }, { "epoch": 0.73, "learning_rate": 9.213941154530765e-07, "loss": 0.9423, "step": 38481 }, { "epoch": 0.73, "learning_rate": 9.212756605188148e-07, "loss": 0.9045, "step": 38482 }, { "epoch": 0.73, "learning_rate": 9.211572114794595e-07, "loss": 0.9951, "step": 38483 }, { "epoch": 0.73, "learning_rate": 9.210387683354566e-07, "loss": 0.9194, "step": 38484 }, { "epoch": 0.73, "learning_rate": 9.209203310872456e-07, "loss": 0.806, "step": 38485 }, { "epoch": 0.73, "learning_rate": 9.208018997352696e-07, "loss": 0.9115, "step": 38486 }, { "epoch": 0.73, "learning_rate": 9.206834742799711e-07, "loss": 0.8879, "step": 38487 }, { "epoch": 0.73, "learning_rate": 9.20565054721792e-07, "loss": 0.959, "step": 38488 }, { "epoch": 0.73, "learning_rate": 9.204466410611745e-07, "loss": 0.7974, "step": 38489 }, { "epoch": 0.73, "learning_rate": 9.203282332985608e-07, "loss": 0.7841, "step": 38490 }, { "epoch": 0.73, "learning_rate": 9.20209831434394e-07, "loss": 0.8646, "step": 38491 }, { "epoch": 0.73, "learning_rate": 9.200914354691135e-07, "loss": 0.7211, "step": 38492 }, { "epoch": 0.73, "learning_rate": 9.199730454031646e-07, "loss": 1.1948, "step": 38493 }, { "epoch": 0.73, "learning_rate": 9.198546612369874e-07, "loss": 1.147, "step": 38494 }, { "epoch": 0.73, "learning_rate": 9.197362829710235e-07, "loss": 1.0356, "step": 38495 }, { "epoch": 0.73, "learning_rate": 9.196179106057176e-07, "loss": 0.733, "step": 38496 }, { "epoch": 0.73, "learning_rate": 9.194995441415089e-07, "loss": 0.8845, "step": 38497 }, { "epoch": 0.73, "learning_rate": 9.193811835788408e-07, "loss": 0.8569, "step": 38498 }, { "epoch": 0.73, "learning_rate": 9.192628289181546e-07, "loss": 1.0905, "step": 38499 }, { "epoch": 0.73, "learning_rate": 9.191444801598925e-07, "loss": 0.9769, "step": 38500 }, { "epoch": 0.73, "learning_rate": 9.190261373044968e-07, "loss": 0.9645, "step": 38501 }, { "epoch": 0.73, "learning_rate": 9.189078003524088e-07, "loss": 0.7894, "step": 38502 }, { "epoch": 0.73, "learning_rate": 9.187894693040714e-07, "loss": 0.6929, "step": 38503 }, { "epoch": 0.73, "learning_rate": 9.186711441599239e-07, "loss": 0.7018, "step": 38504 }, { "epoch": 0.73, "learning_rate": 9.185528249204118e-07, "loss": 0.8735, "step": 38505 }, { "epoch": 0.73, "learning_rate": 9.184345115859739e-07, "loss": 0.7705, "step": 38506 }, { "epoch": 0.73, "learning_rate": 9.183162041570531e-07, "loss": 0.9905, "step": 38507 }, { "epoch": 0.73, "learning_rate": 9.181979026340912e-07, "loss": 0.6895, "step": 38508 }, { "epoch": 0.73, "learning_rate": 9.180796070175296e-07, "loss": 0.8917, "step": 38509 }, { "epoch": 0.73, "learning_rate": 9.179613173078103e-07, "loss": 0.6437, "step": 38510 }, { "epoch": 0.73, "learning_rate": 9.178430335053751e-07, "loss": 0.9799, "step": 38511 }, { "epoch": 0.73, "learning_rate": 9.177247556106664e-07, "loss": 1.0674, "step": 38512 }, { "epoch": 0.73, "learning_rate": 9.17606483624123e-07, "loss": 0.9056, "step": 38513 }, { "epoch": 0.73, "learning_rate": 9.174882175461902e-07, "loss": 0.7842, "step": 38514 }, { "epoch": 0.73, "learning_rate": 9.173699573773073e-07, "loss": 0.9019, "step": 38515 }, { "epoch": 0.73, "learning_rate": 9.172517031179154e-07, "loss": 0.7555, "step": 38516 }, { "epoch": 0.73, "learning_rate": 9.171334547684588e-07, "loss": 0.9156, "step": 38517 }, { "epoch": 0.73, "learning_rate": 9.170152123293766e-07, "loss": 0.956, "step": 38518 }, { "epoch": 0.73, "learning_rate": 9.168969758011109e-07, "loss": 0.9929, "step": 38519 }, { "epoch": 0.73, "learning_rate": 9.167787451841034e-07, "loss": 0.7938, "step": 38520 }, { "epoch": 0.73, "learning_rate": 9.166605204787956e-07, "loss": 0.9475, "step": 38521 }, { "epoch": 0.73, "learning_rate": 9.165423016856287e-07, "loss": 0.9224, "step": 38522 }, { "epoch": 0.73, "learning_rate": 9.164240888050446e-07, "loss": 0.7379, "step": 38523 }, { "epoch": 0.73, "learning_rate": 9.16305881837485e-07, "loss": 1.1934, "step": 38524 }, { "epoch": 0.73, "learning_rate": 9.161876807833891e-07, "loss": 1.0118, "step": 38525 }, { "epoch": 0.73, "learning_rate": 9.160694856432015e-07, "loss": 1.0902, "step": 38526 }, { "epoch": 0.73, "learning_rate": 9.159512964173611e-07, "loss": 0.8176, "step": 38527 }, { "epoch": 0.73, "learning_rate": 9.158331131063098e-07, "loss": 0.5043, "step": 38528 }, { "epoch": 0.73, "learning_rate": 9.157149357104892e-07, "loss": 1.0137, "step": 38529 }, { "epoch": 0.73, "learning_rate": 9.155967642303404e-07, "loss": 0.9478, "step": 38530 }, { "epoch": 0.73, "learning_rate": 9.154785986663047e-07, "loss": 1.0812, "step": 38531 }, { "epoch": 0.73, "learning_rate": 9.153604390188236e-07, "loss": 0.886, "step": 38532 }, { "epoch": 0.73, "learning_rate": 9.152422852883386e-07, "loss": 0.8536, "step": 38533 }, { "epoch": 0.73, "learning_rate": 9.151241374752886e-07, "loss": 1.0814, "step": 38534 }, { "epoch": 0.73, "learning_rate": 9.150059955801182e-07, "loss": 0.9681, "step": 38535 }, { "epoch": 0.73, "learning_rate": 9.148878596032662e-07, "loss": 0.9646, "step": 38536 }, { "epoch": 0.73, "learning_rate": 9.147697295451733e-07, "loss": 0.9972, "step": 38537 }, { "epoch": 0.73, "learning_rate": 9.146516054062835e-07, "loss": 0.8854, "step": 38538 }, { "epoch": 0.73, "learning_rate": 9.145334871870348e-07, "loss": 0.9411, "step": 38539 }, { "epoch": 0.73, "learning_rate": 9.144153748878698e-07, "loss": 0.8579, "step": 38540 }, { "epoch": 0.73, "learning_rate": 9.142972685092288e-07, "loss": 0.893, "step": 38541 }, { "epoch": 0.73, "learning_rate": 9.141791680515535e-07, "loss": 0.7592, "step": 38542 }, { "epoch": 0.73, "learning_rate": 9.140610735152844e-07, "loss": 0.9885, "step": 38543 }, { "epoch": 0.73, "learning_rate": 9.139429849008626e-07, "loss": 0.8848, "step": 38544 }, { "epoch": 0.73, "learning_rate": 9.1382490220873e-07, "loss": 0.8919, "step": 38545 }, { "epoch": 0.73, "learning_rate": 9.13706825439325e-07, "loss": 0.9366, "step": 38546 }, { "epoch": 0.73, "learning_rate": 9.135887545930916e-07, "loss": 0.7561, "step": 38547 }, { "epoch": 0.73, "learning_rate": 9.134706896704684e-07, "loss": 0.6363, "step": 38548 }, { "epoch": 0.73, "learning_rate": 9.13352630671897e-07, "loss": 1.0989, "step": 38549 }, { "epoch": 0.73, "learning_rate": 9.132345775978182e-07, "loss": 1.1154, "step": 38550 }, { "epoch": 0.73, "learning_rate": 9.131165304486727e-07, "loss": 1.0004, "step": 38551 }, { "epoch": 0.73, "learning_rate": 9.129984892249017e-07, "loss": 0.9651, "step": 38552 }, { "epoch": 0.73, "learning_rate": 9.128804539269456e-07, "loss": 1.0177, "step": 38553 }, { "epoch": 0.73, "learning_rate": 9.12762424555246e-07, "loss": 0.803, "step": 38554 }, { "epoch": 0.73, "learning_rate": 9.126444011102412e-07, "loss": 0.8694, "step": 38555 }, { "epoch": 0.73, "learning_rate": 9.125263835923751e-07, "loss": 1.0018, "step": 38556 }, { "epoch": 0.73, "learning_rate": 9.12408372002086e-07, "loss": 0.8855, "step": 38557 }, { "epoch": 0.73, "learning_rate": 9.122903663398144e-07, "loss": 0.6394, "step": 38558 }, { "epoch": 0.73, "learning_rate": 9.12172366606004e-07, "loss": 0.8118, "step": 38559 }, { "epoch": 0.73, "learning_rate": 9.120543728010919e-07, "loss": 0.7111, "step": 38560 }, { "epoch": 0.73, "learning_rate": 9.119363849255206e-07, "loss": 0.8912, "step": 38561 }, { "epoch": 0.73, "learning_rate": 9.118184029797297e-07, "loss": 1.1198, "step": 38562 }, { "epoch": 0.73, "learning_rate": 9.117004269641605e-07, "loss": 1.0221, "step": 38563 }, { "epoch": 0.73, "learning_rate": 9.115824568792531e-07, "loss": 0.7805, "step": 38564 }, { "epoch": 0.73, "learning_rate": 9.114644927254482e-07, "loss": 0.9052, "step": 38565 }, { "epoch": 0.73, "learning_rate": 9.113465345031869e-07, "loss": 0.7617, "step": 38566 }, { "epoch": 0.73, "learning_rate": 9.112285822129074e-07, "loss": 0.6709, "step": 38567 }, { "epoch": 0.73, "learning_rate": 9.111106358550531e-07, "loss": 1.1443, "step": 38568 }, { "epoch": 0.73, "learning_rate": 9.109926954300624e-07, "loss": 0.8624, "step": 38569 }, { "epoch": 0.73, "learning_rate": 9.108747609383761e-07, "loss": 0.9802, "step": 38570 }, { "epoch": 0.73, "learning_rate": 9.107568323804347e-07, "loss": 0.8337, "step": 38571 }, { "epoch": 0.73, "learning_rate": 9.106389097566787e-07, "loss": 0.8227, "step": 38572 }, { "epoch": 0.73, "learning_rate": 9.105209930675482e-07, "loss": 0.8138, "step": 38573 }, { "epoch": 0.73, "learning_rate": 9.104030823134835e-07, "loss": 1.1426, "step": 38574 }, { "epoch": 0.73, "learning_rate": 9.102851774949259e-07, "loss": 1.2231, "step": 38575 }, { "epoch": 0.73, "learning_rate": 9.101672786123128e-07, "loss": 0.9478, "step": 38576 }, { "epoch": 0.73, "learning_rate": 9.100493856660883e-07, "loss": 1.1151, "step": 38577 }, { "epoch": 0.73, "learning_rate": 9.099314986566896e-07, "loss": 0.7627, "step": 38578 }, { "epoch": 0.73, "learning_rate": 9.098136175845574e-07, "loss": 1.0406, "step": 38579 }, { "epoch": 0.73, "learning_rate": 9.096957424501338e-07, "loss": 1.0384, "step": 38580 }, { "epoch": 0.73, "learning_rate": 9.095778732538566e-07, "loss": 0.8482, "step": 38581 }, { "epoch": 0.73, "learning_rate": 9.09460009996167e-07, "loss": 0.9243, "step": 38582 }, { "epoch": 0.73, "learning_rate": 9.093421526775051e-07, "loss": 0.772, "step": 38583 }, { "epoch": 0.73, "learning_rate": 9.092243012983107e-07, "loss": 0.9525, "step": 38584 }, { "epoch": 0.73, "learning_rate": 9.09106455859024e-07, "loss": 0.8995, "step": 38585 }, { "epoch": 0.73, "learning_rate": 9.08988616360085e-07, "loss": 0.6747, "step": 38586 }, { "epoch": 0.73, "learning_rate": 9.088707828019347e-07, "loss": 0.9149, "step": 38587 }, { "epoch": 0.73, "learning_rate": 9.087529551850102e-07, "loss": 0.8931, "step": 38588 }, { "epoch": 0.73, "learning_rate": 9.086351335097552e-07, "loss": 0.8363, "step": 38589 }, { "epoch": 0.73, "learning_rate": 9.085173177766068e-07, "loss": 0.9155, "step": 38590 }, { "epoch": 0.73, "learning_rate": 9.083995079860061e-07, "loss": 0.803, "step": 38591 }, { "epoch": 0.73, "learning_rate": 9.082817041383929e-07, "loss": 0.6829, "step": 38592 }, { "epoch": 0.73, "learning_rate": 9.081639062342068e-07, "loss": 1.0104, "step": 38593 }, { "epoch": 0.73, "learning_rate": 9.08046114273888e-07, "loss": 0.9467, "step": 38594 }, { "epoch": 0.73, "learning_rate": 9.079283282578763e-07, "loss": 0.9715, "step": 38595 }, { "epoch": 0.73, "learning_rate": 9.07810548186612e-07, "loss": 0.7914, "step": 38596 }, { "epoch": 0.73, "learning_rate": 9.076927740605329e-07, "loss": 0.9875, "step": 38597 }, { "epoch": 0.73, "learning_rate": 9.075750058800817e-07, "loss": 0.9335, "step": 38598 }, { "epoch": 0.73, "learning_rate": 9.074572436456958e-07, "loss": 0.881, "step": 38599 }, { "epoch": 0.73, "learning_rate": 9.073394873578148e-07, "loss": 1.0607, "step": 38600 }, { "epoch": 0.73, "learning_rate": 9.072217370168809e-07, "loss": 0.8394, "step": 38601 }, { "epoch": 0.73, "learning_rate": 9.071039926233316e-07, "loss": 0.8652, "step": 38602 }, { "epoch": 0.73, "learning_rate": 9.06986254177607e-07, "loss": 0.8446, "step": 38603 }, { "epoch": 0.73, "learning_rate": 9.06868521680147e-07, "loss": 0.9221, "step": 38604 }, { "epoch": 0.73, "learning_rate": 9.067507951313912e-07, "loss": 0.87, "step": 38605 }, { "epoch": 0.73, "learning_rate": 9.066330745317789e-07, "loss": 0.8908, "step": 38606 }, { "epoch": 0.73, "learning_rate": 9.065153598817497e-07, "loss": 0.7361, "step": 38607 }, { "epoch": 0.73, "learning_rate": 9.063976511817443e-07, "loss": 0.9279, "step": 38608 }, { "epoch": 0.73, "learning_rate": 9.062799484321996e-07, "loss": 0.8369, "step": 38609 }, { "epoch": 0.73, "learning_rate": 9.061622516335583e-07, "loss": 0.9332, "step": 38610 }, { "epoch": 0.73, "learning_rate": 9.060445607862575e-07, "loss": 0.8687, "step": 38611 }, { "epoch": 0.73, "learning_rate": 9.059268758907375e-07, "loss": 0.9476, "step": 38612 }, { "epoch": 0.73, "learning_rate": 9.058091969474376e-07, "loss": 0.8694, "step": 38613 }, { "epoch": 0.73, "learning_rate": 9.05691523956797e-07, "loss": 0.9299, "step": 38614 }, { "epoch": 0.73, "learning_rate": 9.055738569192557e-07, "loss": 0.9617, "step": 38615 }, { "epoch": 0.73, "learning_rate": 9.054561958352526e-07, "loss": 0.827, "step": 38616 }, { "epoch": 0.73, "learning_rate": 9.053385407052282e-07, "loss": 0.7577, "step": 38617 }, { "epoch": 0.73, "learning_rate": 9.05220891529619e-07, "loss": 1.1041, "step": 38618 }, { "epoch": 0.73, "learning_rate": 9.051032483088675e-07, "loss": 0.9282, "step": 38619 }, { "epoch": 0.73, "learning_rate": 9.04985611043411e-07, "loss": 0.9354, "step": 38620 }, { "epoch": 0.73, "learning_rate": 9.048679797336884e-07, "loss": 0.8063, "step": 38621 }, { "epoch": 0.73, "learning_rate": 9.047503543801417e-07, "loss": 0.9652, "step": 38622 }, { "epoch": 0.73, "learning_rate": 9.046327349832074e-07, "loss": 0.9583, "step": 38623 }, { "epoch": 0.73, "learning_rate": 9.045151215433254e-07, "loss": 0.9644, "step": 38624 }, { "epoch": 0.73, "learning_rate": 9.043975140609351e-07, "loss": 1.2323, "step": 38625 }, { "epoch": 0.73, "learning_rate": 9.042799125364757e-07, "loss": 0.7904, "step": 38626 }, { "epoch": 0.73, "learning_rate": 9.041623169703859e-07, "loss": 0.7034, "step": 38627 }, { "epoch": 0.73, "learning_rate": 9.040447273631053e-07, "loss": 1.0463, "step": 38628 }, { "epoch": 0.73, "learning_rate": 9.039271437150734e-07, "loss": 0.8244, "step": 38629 }, { "epoch": 0.73, "learning_rate": 9.038095660267271e-07, "loss": 0.8004, "step": 38630 }, { "epoch": 0.73, "learning_rate": 9.036919942985087e-07, "loss": 1.1269, "step": 38631 }, { "epoch": 0.73, "learning_rate": 9.035744285308543e-07, "loss": 1.0257, "step": 38632 }, { "epoch": 0.73, "learning_rate": 9.034568687242043e-07, "loss": 0.9784, "step": 38633 }, { "epoch": 0.73, "learning_rate": 9.033393148789973e-07, "loss": 1.0491, "step": 38634 }, { "epoch": 0.73, "learning_rate": 9.032217669956723e-07, "loss": 0.9337, "step": 38635 }, { "epoch": 0.73, "learning_rate": 9.031042250746691e-07, "loss": 0.8323, "step": 38636 }, { "epoch": 0.73, "learning_rate": 9.02986689116424e-07, "loss": 1.107, "step": 38637 }, { "epoch": 0.73, "learning_rate": 9.028691591213795e-07, "loss": 0.999, "step": 38638 }, { "epoch": 0.73, "learning_rate": 9.027516350899718e-07, "loss": 0.7521, "step": 38639 }, { "epoch": 0.73, "learning_rate": 9.026341170226405e-07, "loss": 0.8911, "step": 38640 }, { "epoch": 0.73, "learning_rate": 9.025166049198244e-07, "loss": 0.9863, "step": 38641 }, { "epoch": 0.73, "learning_rate": 9.023990987819622e-07, "loss": 0.8164, "step": 38642 }, { "epoch": 0.73, "learning_rate": 9.022815986094929e-07, "loss": 0.9753, "step": 38643 }, { "epoch": 0.73, "learning_rate": 9.02164104402855e-07, "loss": 1.0693, "step": 38644 }, { "epoch": 0.73, "learning_rate": 9.020466161624883e-07, "loss": 0.9083, "step": 38645 }, { "epoch": 0.73, "learning_rate": 9.01929133888829e-07, "loss": 0.792, "step": 38646 }, { "epoch": 0.73, "learning_rate": 9.018116575823177e-07, "loss": 0.7681, "step": 38647 }, { "epoch": 0.73, "learning_rate": 9.016941872433937e-07, "loss": 0.8816, "step": 38648 }, { "epoch": 0.73, "learning_rate": 9.015767228724931e-07, "loss": 0.8769, "step": 38649 }, { "epoch": 0.73, "learning_rate": 9.014592644700577e-07, "loss": 1.1436, "step": 38650 }, { "epoch": 0.73, "learning_rate": 9.013418120365233e-07, "loss": 0.8933, "step": 38651 }, { "epoch": 0.73, "learning_rate": 9.012243655723299e-07, "loss": 0.8924, "step": 38652 }, { "epoch": 0.73, "learning_rate": 9.011069250779153e-07, "loss": 1.0478, "step": 38653 }, { "epoch": 0.73, "learning_rate": 9.009894905537187e-07, "loss": 0.8167, "step": 38654 }, { "epoch": 0.73, "learning_rate": 9.008720620001782e-07, "loss": 1.0147, "step": 38655 }, { "epoch": 0.73, "learning_rate": 9.007546394177324e-07, "loss": 0.9338, "step": 38656 }, { "epoch": 0.73, "learning_rate": 9.006372228068208e-07, "loss": 0.826, "step": 38657 }, { "epoch": 0.73, "learning_rate": 9.005198121678787e-07, "loss": 0.8952, "step": 38658 }, { "epoch": 0.73, "learning_rate": 9.004024075013487e-07, "loss": 0.9874, "step": 38659 }, { "epoch": 0.73, "learning_rate": 9.002850088076659e-07, "loss": 0.9648, "step": 38660 }, { "epoch": 0.73, "learning_rate": 9.001676160872699e-07, "loss": 0.745, "step": 38661 }, { "epoch": 0.73, "learning_rate": 9.000502293405991e-07, "loss": 1.1898, "step": 38662 }, { "epoch": 0.73, "learning_rate": 8.999328485680913e-07, "loss": 0.9262, "step": 38663 }, { "epoch": 0.73, "learning_rate": 8.998154737701856e-07, "loss": 0.7625, "step": 38664 }, { "epoch": 0.73, "learning_rate": 8.996981049473197e-07, "loss": 0.7971, "step": 38665 }, { "epoch": 0.73, "learning_rate": 8.995807420999331e-07, "loss": 0.9911, "step": 38666 }, { "epoch": 0.73, "learning_rate": 8.99463385228461e-07, "loss": 0.7272, "step": 38667 }, { "epoch": 0.73, "learning_rate": 8.993460343333443e-07, "loss": 0.8397, "step": 38668 }, { "epoch": 0.73, "learning_rate": 8.992286894150215e-07, "loss": 1.0025, "step": 38669 }, { "epoch": 0.73, "learning_rate": 8.991113504739276e-07, "loss": 0.8983, "step": 38670 }, { "epoch": 0.73, "learning_rate": 8.98994017510505e-07, "loss": 0.881, "step": 38671 }, { "epoch": 0.73, "learning_rate": 8.988766905251886e-07, "loss": 0.7945, "step": 38672 }, { "epoch": 0.73, "learning_rate": 8.987593695184177e-07, "loss": 0.7419, "step": 38673 }, { "epoch": 0.73, "learning_rate": 8.986420544906299e-07, "loss": 0.992, "step": 38674 }, { "epoch": 0.73, "learning_rate": 8.985247454422638e-07, "loss": 0.8944, "step": 38675 }, { "epoch": 0.73, "learning_rate": 8.984074423737571e-07, "loss": 0.9057, "step": 38676 }, { "epoch": 0.73, "learning_rate": 8.98290145285548e-07, "loss": 0.8767, "step": 38677 }, { "epoch": 0.73, "learning_rate": 8.981728541780752e-07, "loss": 0.9274, "step": 38678 }, { "epoch": 0.73, "learning_rate": 8.980555690517743e-07, "loss": 0.8499, "step": 38679 }, { "epoch": 0.73, "learning_rate": 8.979382899070863e-07, "loss": 0.9399, "step": 38680 }, { "epoch": 0.73, "learning_rate": 8.978210167444468e-07, "loss": 1.0211, "step": 38681 }, { "epoch": 0.73, "learning_rate": 8.977037495642942e-07, "loss": 0.9738, "step": 38682 }, { "epoch": 0.73, "learning_rate": 8.975864883670671e-07, "loss": 0.9177, "step": 38683 }, { "epoch": 0.73, "learning_rate": 8.974692331532028e-07, "loss": 0.8124, "step": 38684 }, { "epoch": 0.73, "learning_rate": 8.973519839231392e-07, "loss": 0.8274, "step": 38685 }, { "epoch": 0.73, "learning_rate": 8.972347406773143e-07, "loss": 0.8442, "step": 38686 }, { "epoch": 0.73, "learning_rate": 8.971175034161664e-07, "loss": 1.0871, "step": 38687 }, { "epoch": 0.73, "learning_rate": 8.970002721401311e-07, "loss": 0.947, "step": 38688 }, { "epoch": 0.73, "learning_rate": 8.968830468496484e-07, "loss": 0.8786, "step": 38689 }, { "epoch": 0.73, "learning_rate": 8.96765827545156e-07, "loss": 0.8584, "step": 38690 }, { "epoch": 0.73, "learning_rate": 8.966486142270892e-07, "loss": 1.0275, "step": 38691 }, { "epoch": 0.73, "learning_rate": 8.965314068958889e-07, "loss": 0.8943, "step": 38692 }, { "epoch": 0.73, "learning_rate": 8.964142055519903e-07, "loss": 1.2617, "step": 38693 }, { "epoch": 0.73, "learning_rate": 8.962970101958321e-07, "loss": 1.0137, "step": 38694 }, { "epoch": 0.73, "learning_rate": 8.961798208278516e-07, "loss": 0.9778, "step": 38695 }, { "epoch": 0.73, "learning_rate": 8.960626374484866e-07, "loss": 0.8661, "step": 38696 }, { "epoch": 0.73, "learning_rate": 8.959454600581743e-07, "loss": 0.6882, "step": 38697 }, { "epoch": 0.73, "learning_rate": 8.958282886573527e-07, "loss": 0.96, "step": 38698 }, { "epoch": 0.73, "learning_rate": 8.9571112324646e-07, "loss": 1.0456, "step": 38699 }, { "epoch": 0.73, "learning_rate": 8.955939638259306e-07, "loss": 0.9378, "step": 38700 }, { "epoch": 0.73, "learning_rate": 8.954768103962063e-07, "loss": 0.6781, "step": 38701 }, { "epoch": 0.73, "learning_rate": 8.953596629577213e-07, "loss": 0.8353, "step": 38702 }, { "epoch": 0.73, "learning_rate": 8.952425215109142e-07, "loss": 0.8627, "step": 38703 }, { "epoch": 0.73, "learning_rate": 8.951253860562223e-07, "loss": 0.9968, "step": 38704 }, { "epoch": 0.73, "learning_rate": 8.950082565940832e-07, "loss": 0.897, "step": 38705 }, { "epoch": 0.73, "learning_rate": 8.948911331249338e-07, "loss": 1.0132, "step": 38706 }, { "epoch": 0.73, "learning_rate": 8.947740156492119e-07, "loss": 1.0106, "step": 38707 }, { "epoch": 0.73, "learning_rate": 8.946569041673553e-07, "loss": 0.9547, "step": 38708 }, { "epoch": 0.73, "learning_rate": 8.945397986797988e-07, "loss": 0.8761, "step": 38709 }, { "epoch": 0.73, "learning_rate": 8.944226991869826e-07, "loss": 1.007, "step": 38710 }, { "epoch": 0.73, "learning_rate": 8.943056056893434e-07, "loss": 0.9047, "step": 38711 }, { "epoch": 0.73, "learning_rate": 8.941885181873164e-07, "loss": 1.0103, "step": 38712 }, { "epoch": 0.73, "learning_rate": 8.940714366813416e-07, "loss": 0.8907, "step": 38713 }, { "epoch": 0.73, "learning_rate": 8.939543611718543e-07, "loss": 0.8812, "step": 38714 }, { "epoch": 0.73, "learning_rate": 8.938372916592922e-07, "loss": 0.897, "step": 38715 }, { "epoch": 0.73, "learning_rate": 8.937202281440921e-07, "loss": 0.9663, "step": 38716 }, { "epoch": 0.73, "learning_rate": 8.936031706266915e-07, "loss": 0.8098, "step": 38717 }, { "epoch": 0.73, "learning_rate": 8.934861191075275e-07, "loss": 1.0018, "step": 38718 }, { "epoch": 0.73, "learning_rate": 8.933690735870371e-07, "loss": 0.8401, "step": 38719 }, { "epoch": 0.73, "learning_rate": 8.932520340656581e-07, "loss": 0.8141, "step": 38720 }, { "epoch": 0.73, "learning_rate": 8.93135000543825e-07, "loss": 0.8578, "step": 38721 }, { "epoch": 0.73, "learning_rate": 8.930179730219784e-07, "loss": 0.9153, "step": 38722 }, { "epoch": 0.73, "learning_rate": 8.929009515005524e-07, "loss": 0.9753, "step": 38723 }, { "epoch": 0.73, "learning_rate": 8.92783935979985e-07, "loss": 0.7818, "step": 38724 }, { "epoch": 0.73, "learning_rate": 8.926669264607132e-07, "loss": 1.0301, "step": 38725 }, { "epoch": 0.73, "learning_rate": 8.925499229431739e-07, "loss": 0.9288, "step": 38726 }, { "epoch": 0.73, "learning_rate": 8.924329254278035e-07, "loss": 0.8751, "step": 38727 }, { "epoch": 0.73, "learning_rate": 8.923159339150397e-07, "loss": 0.6842, "step": 38728 }, { "epoch": 0.73, "learning_rate": 8.921989484053195e-07, "loss": 0.932, "step": 38729 }, { "epoch": 0.73, "learning_rate": 8.920819688990775e-07, "loss": 1.1265, "step": 38730 }, { "epoch": 0.73, "learning_rate": 8.91964995396753e-07, "loss": 0.9455, "step": 38731 }, { "epoch": 0.73, "learning_rate": 8.918480278987829e-07, "loss": 0.92, "step": 38732 }, { "epoch": 0.73, "learning_rate": 8.917310664056011e-07, "loss": 0.8268, "step": 38733 }, { "epoch": 0.73, "learning_rate": 8.91614110917648e-07, "loss": 0.8915, "step": 38734 }, { "epoch": 0.73, "learning_rate": 8.914971614353574e-07, "loss": 1.085, "step": 38735 }, { "epoch": 0.73, "learning_rate": 8.913802179591672e-07, "loss": 0.8837, "step": 38736 }, { "epoch": 0.73, "learning_rate": 8.912632804895138e-07, "loss": 1.3263, "step": 38737 }, { "epoch": 0.73, "learning_rate": 8.911463490268343e-07, "loss": 1.1664, "step": 38738 }, { "epoch": 0.73, "learning_rate": 8.910294235715649e-07, "loss": 1.0019, "step": 38739 }, { "epoch": 0.73, "learning_rate": 8.909125041241423e-07, "loss": 0.7972, "step": 38740 }, { "epoch": 0.73, "learning_rate": 8.907955906850038e-07, "loss": 0.8882, "step": 38741 }, { "epoch": 0.73, "learning_rate": 8.906786832545836e-07, "loss": 0.9454, "step": 38742 }, { "epoch": 0.73, "learning_rate": 8.905617818333214e-07, "loss": 1.0779, "step": 38743 }, { "epoch": 0.73, "learning_rate": 8.904448864216517e-07, "loss": 1.0285, "step": 38744 }, { "epoch": 0.73, "learning_rate": 8.903279970200113e-07, "loss": 0.8424, "step": 38745 }, { "epoch": 0.73, "learning_rate": 8.902111136288366e-07, "loss": 0.8079, "step": 38746 }, { "epoch": 0.73, "learning_rate": 8.900942362485643e-07, "loss": 0.9647, "step": 38747 }, { "epoch": 0.73, "learning_rate": 8.899773648796309e-07, "loss": 0.7018, "step": 38748 }, { "epoch": 0.73, "learning_rate": 8.898604995224725e-07, "loss": 1.0117, "step": 38749 }, { "epoch": 0.73, "learning_rate": 8.897436401775267e-07, "loss": 1.0734, "step": 38750 }, { "epoch": 0.73, "learning_rate": 8.896267868452269e-07, "loss": 0.8872, "step": 38751 }, { "epoch": 0.73, "learning_rate": 8.895099395260121e-07, "loss": 0.8091, "step": 38752 }, { "epoch": 0.73, "learning_rate": 8.893930982203188e-07, "loss": 0.7868, "step": 38753 }, { "epoch": 0.73, "learning_rate": 8.892762629285806e-07, "loss": 0.7248, "step": 38754 }, { "epoch": 0.73, "learning_rate": 8.891594336512368e-07, "loss": 0.8498, "step": 38755 }, { "epoch": 0.73, "learning_rate": 8.890426103887217e-07, "loss": 1.1103, "step": 38756 }, { "epoch": 0.73, "learning_rate": 8.889257931414724e-07, "loss": 0.8785, "step": 38757 }, { "epoch": 0.73, "learning_rate": 8.888089819099243e-07, "loss": 0.8666, "step": 38758 }, { "epoch": 0.73, "learning_rate": 8.886921766945145e-07, "loss": 0.9935, "step": 38759 }, { "epoch": 0.73, "learning_rate": 8.885753774956785e-07, "loss": 0.6694, "step": 38760 }, { "epoch": 0.73, "learning_rate": 8.884585843138524e-07, "loss": 0.9688, "step": 38761 }, { "epoch": 0.73, "learning_rate": 8.883417971494737e-07, "loss": 1.0024, "step": 38762 }, { "epoch": 0.73, "learning_rate": 8.882250160029753e-07, "loss": 1.0001, "step": 38763 }, { "epoch": 0.73, "learning_rate": 8.881082408747974e-07, "loss": 0.9077, "step": 38764 }, { "epoch": 0.73, "learning_rate": 8.879914717653728e-07, "loss": 0.7965, "step": 38765 }, { "epoch": 0.73, "learning_rate": 8.878747086751386e-07, "loss": 0.8026, "step": 38766 }, { "epoch": 0.73, "learning_rate": 8.877579516045309e-07, "loss": 0.9707, "step": 38767 }, { "epoch": 0.73, "learning_rate": 8.876412005539855e-07, "loss": 1.0232, "step": 38768 }, { "epoch": 0.73, "learning_rate": 8.875244555239384e-07, "loss": 1.0605, "step": 38769 }, { "epoch": 0.73, "learning_rate": 8.874077165148257e-07, "loss": 0.7758, "step": 38770 }, { "epoch": 0.73, "learning_rate": 8.87290983527084e-07, "loss": 0.8039, "step": 38771 }, { "epoch": 0.73, "learning_rate": 8.871742565611466e-07, "loss": 0.8443, "step": 38772 }, { "epoch": 0.73, "learning_rate": 8.870575356174518e-07, "loss": 0.8831, "step": 38773 }, { "epoch": 0.73, "learning_rate": 8.869408206964356e-07, "loss": 1.0525, "step": 38774 }, { "epoch": 0.73, "learning_rate": 8.86824111798531e-07, "loss": 0.9995, "step": 38775 }, { "epoch": 0.73, "learning_rate": 8.867074089241778e-07, "loss": 0.7712, "step": 38776 }, { "epoch": 0.73, "learning_rate": 8.865907120738087e-07, "loss": 0.9249, "step": 38777 }, { "epoch": 0.73, "learning_rate": 8.864740212478604e-07, "loss": 0.7654, "step": 38778 }, { "epoch": 0.73, "learning_rate": 8.863573364467684e-07, "loss": 0.918, "step": 38779 }, { "epoch": 0.73, "learning_rate": 8.86240657670969e-07, "loss": 0.9709, "step": 38780 }, { "epoch": 0.73, "learning_rate": 8.861239849208972e-07, "loss": 1.0018, "step": 38781 }, { "epoch": 0.73, "learning_rate": 8.860073181969892e-07, "loss": 0.8917, "step": 38782 }, { "epoch": 0.73, "learning_rate": 8.858906574996812e-07, "loss": 0.7397, "step": 38783 }, { "epoch": 0.73, "learning_rate": 8.85774002829406e-07, "loss": 0.9545, "step": 38784 }, { "epoch": 0.73, "learning_rate": 8.856573541866032e-07, "loss": 0.8531, "step": 38785 }, { "epoch": 0.73, "learning_rate": 8.855407115717054e-07, "loss": 0.911, "step": 38786 }, { "epoch": 0.73, "learning_rate": 8.85424074985149e-07, "loss": 0.9258, "step": 38787 }, { "epoch": 0.73, "learning_rate": 8.853074444273696e-07, "loss": 0.9564, "step": 38788 }, { "epoch": 0.73, "learning_rate": 8.851908198988029e-07, "loss": 0.8928, "step": 38789 }, { "epoch": 0.73, "learning_rate": 8.85074201399884e-07, "loss": 1.1092, "step": 38790 }, { "epoch": 0.73, "learning_rate": 8.849575889310485e-07, "loss": 0.9045, "step": 38791 }, { "epoch": 0.73, "learning_rate": 8.848409824927328e-07, "loss": 0.7657, "step": 38792 }, { "epoch": 0.73, "learning_rate": 8.847243820853696e-07, "loss": 1.0167, "step": 38793 }, { "epoch": 0.73, "learning_rate": 8.84607787709397e-07, "loss": 0.9925, "step": 38794 }, { "epoch": 0.73, "learning_rate": 8.844911993652499e-07, "loss": 0.8151, "step": 38795 }, { "epoch": 0.73, "learning_rate": 8.843746170533618e-07, "loss": 0.7449, "step": 38796 }, { "epoch": 0.73, "learning_rate": 8.842580407741711e-07, "loss": 0.8687, "step": 38797 }, { "epoch": 0.73, "learning_rate": 8.841414705281101e-07, "loss": 0.8155, "step": 38798 }, { "epoch": 0.73, "learning_rate": 8.840249063156157e-07, "loss": 0.9915, "step": 38799 }, { "epoch": 0.73, "learning_rate": 8.839083481371225e-07, "loss": 1.0863, "step": 38800 }, { "epoch": 0.73, "learning_rate": 8.837917959930659e-07, "loss": 0.952, "step": 38801 }, { "epoch": 0.73, "learning_rate": 8.836752498838813e-07, "loss": 0.812, "step": 38802 }, { "epoch": 0.73, "learning_rate": 8.835587098100038e-07, "loss": 0.8424, "step": 38803 }, { "epoch": 0.73, "learning_rate": 8.834421757718692e-07, "loss": 0.8964, "step": 38804 }, { "epoch": 0.73, "learning_rate": 8.833256477699103e-07, "loss": 0.9367, "step": 38805 }, { "epoch": 0.73, "learning_rate": 8.832091258045658e-07, "loss": 0.9755, "step": 38806 }, { "epoch": 0.73, "learning_rate": 8.830926098762679e-07, "loss": 0.9868, "step": 38807 }, { "epoch": 0.73, "learning_rate": 8.829760999854525e-07, "loss": 0.7022, "step": 38808 }, { "epoch": 0.73, "learning_rate": 8.828595961325547e-07, "loss": 0.8841, "step": 38809 }, { "epoch": 0.73, "learning_rate": 8.827430983180099e-07, "loss": 0.7699, "step": 38810 }, { "epoch": 0.73, "learning_rate": 8.826266065422526e-07, "loss": 0.8147, "step": 38811 }, { "epoch": 0.73, "learning_rate": 8.82510120805718e-07, "loss": 1.053, "step": 38812 }, { "epoch": 0.73, "learning_rate": 8.823936411088415e-07, "loss": 0.9024, "step": 38813 }, { "epoch": 0.73, "learning_rate": 8.822771674520564e-07, "loss": 0.7834, "step": 38814 }, { "epoch": 0.73, "learning_rate": 8.821606998357992e-07, "loss": 0.813, "step": 38815 }, { "epoch": 0.73, "learning_rate": 8.820442382605055e-07, "loss": 0.8268, "step": 38816 }, { "epoch": 0.73, "learning_rate": 8.819277827266071e-07, "loss": 0.7635, "step": 38817 }, { "epoch": 0.73, "learning_rate": 8.818113332345427e-07, "loss": 0.8975, "step": 38818 }, { "epoch": 0.73, "learning_rate": 8.816948897847441e-07, "loss": 0.8284, "step": 38819 }, { "epoch": 0.73, "learning_rate": 8.815784523776471e-07, "loss": 0.8034, "step": 38820 }, { "epoch": 0.73, "learning_rate": 8.814620210136868e-07, "loss": 0.9198, "step": 38821 }, { "epoch": 0.73, "learning_rate": 8.813455956932973e-07, "loss": 0.7971, "step": 38822 }, { "epoch": 0.73, "learning_rate": 8.812291764169139e-07, "loss": 0.8572, "step": 38823 }, { "epoch": 0.73, "learning_rate": 8.811127631849714e-07, "loss": 0.7775, "step": 38824 }, { "epoch": 0.73, "learning_rate": 8.809963559979048e-07, "loss": 1.039, "step": 38825 }, { "epoch": 0.73, "learning_rate": 8.808799548561464e-07, "loss": 0.9734, "step": 38826 }, { "epoch": 0.73, "learning_rate": 8.807635597601344e-07, "loss": 1.0076, "step": 38827 }, { "epoch": 0.73, "learning_rate": 8.80647170710301e-07, "loss": 0.8955, "step": 38828 }, { "epoch": 0.73, "learning_rate": 8.805307877070809e-07, "loss": 1.0559, "step": 38829 }, { "epoch": 0.73, "learning_rate": 8.804144107509097e-07, "loss": 1.0512, "step": 38830 }, { "epoch": 0.73, "learning_rate": 8.802980398422212e-07, "loss": 0.9351, "step": 38831 }, { "epoch": 0.73, "learning_rate": 8.801816749814502e-07, "loss": 1.0511, "step": 38832 }, { "epoch": 0.73, "learning_rate": 8.80065316169031e-07, "loss": 0.9066, "step": 38833 }, { "epoch": 0.73, "learning_rate": 8.799489634053993e-07, "loss": 0.9402, "step": 38834 }, { "epoch": 0.73, "learning_rate": 8.798326166909865e-07, "loss": 0.8113, "step": 38835 }, { "epoch": 0.73, "learning_rate": 8.797162760262302e-07, "loss": 0.6928, "step": 38836 }, { "epoch": 0.73, "learning_rate": 8.795999414115644e-07, "loss": 1.0005, "step": 38837 }, { "epoch": 0.73, "learning_rate": 8.794836128474211e-07, "loss": 1.0989, "step": 38838 }, { "epoch": 0.73, "learning_rate": 8.793672903342379e-07, "loss": 0.7378, "step": 38839 }, { "epoch": 0.73, "learning_rate": 8.792509738724467e-07, "loss": 0.9531, "step": 38840 }, { "epoch": 0.73, "learning_rate": 8.791346634624826e-07, "loss": 1.0174, "step": 38841 }, { "epoch": 0.73, "learning_rate": 8.790183591047802e-07, "loss": 0.628, "step": 38842 }, { "epoch": 0.73, "learning_rate": 8.789020607997734e-07, "loss": 1.0014, "step": 38843 }, { "epoch": 0.73, "learning_rate": 8.787857685478965e-07, "loss": 1.0411, "step": 38844 }, { "epoch": 0.73, "learning_rate": 8.786694823495839e-07, "loss": 0.9711, "step": 38845 }, { "epoch": 0.73, "learning_rate": 8.785532022052706e-07, "loss": 0.7412, "step": 38846 }, { "epoch": 0.73, "learning_rate": 8.784369281153885e-07, "loss": 0.6788, "step": 38847 }, { "epoch": 0.73, "learning_rate": 8.783206600803745e-07, "loss": 1.0511, "step": 38848 }, { "epoch": 0.73, "learning_rate": 8.782043981006607e-07, "loss": 0.9089, "step": 38849 }, { "epoch": 0.73, "learning_rate": 8.780881421766821e-07, "loss": 0.9646, "step": 38850 }, { "epoch": 0.73, "learning_rate": 8.779718923088726e-07, "loss": 1.0126, "step": 38851 }, { "epoch": 0.73, "learning_rate": 8.778556484976661e-07, "loss": 0.9536, "step": 38852 }, { "epoch": 0.73, "learning_rate": 8.777394107434973e-07, "loss": 0.9855, "step": 38853 }, { "epoch": 0.73, "learning_rate": 8.776231790467993e-07, "loss": 0.733, "step": 38854 }, { "epoch": 0.73, "learning_rate": 8.775069534080077e-07, "loss": 0.9538, "step": 38855 }, { "epoch": 0.73, "learning_rate": 8.773907338275536e-07, "loss": 0.8966, "step": 38856 }, { "epoch": 0.73, "learning_rate": 8.772745203058738e-07, "loss": 1.1636, "step": 38857 }, { "epoch": 0.73, "learning_rate": 8.77158312843402e-07, "loss": 0.8054, "step": 38858 }, { "epoch": 0.73, "learning_rate": 8.770421114405695e-07, "loss": 0.8735, "step": 38859 }, { "epoch": 0.73, "learning_rate": 8.769259160978136e-07, "loss": 0.962, "step": 38860 }, { "epoch": 0.73, "learning_rate": 8.768097268155659e-07, "loss": 1.0087, "step": 38861 }, { "epoch": 0.73, "learning_rate": 8.766935435942608e-07, "loss": 1.0756, "step": 38862 }, { "epoch": 0.73, "learning_rate": 8.765773664343324e-07, "loss": 1.0512, "step": 38863 }, { "epoch": 0.73, "learning_rate": 8.764611953362143e-07, "loss": 1.0163, "step": 38864 }, { "epoch": 0.73, "learning_rate": 8.76345030300341e-07, "loss": 0.9831, "step": 38865 }, { "epoch": 0.73, "learning_rate": 8.762288713271438e-07, "loss": 0.8252, "step": 38866 }, { "epoch": 0.73, "learning_rate": 8.761127184170601e-07, "loss": 0.8054, "step": 38867 }, { "epoch": 0.73, "learning_rate": 8.75996571570521e-07, "loss": 0.9267, "step": 38868 }, { "epoch": 0.73, "learning_rate": 8.758804307879607e-07, "loss": 0.8452, "step": 38869 }, { "epoch": 0.73, "learning_rate": 8.757642960698132e-07, "loss": 0.8497, "step": 38870 }, { "epoch": 0.73, "learning_rate": 8.756481674165118e-07, "loss": 0.6267, "step": 38871 }, { "epoch": 0.73, "learning_rate": 8.755320448284905e-07, "loss": 0.9224, "step": 38872 }, { "epoch": 0.73, "learning_rate": 8.754159283061828e-07, "loss": 0.7618, "step": 38873 }, { "epoch": 0.73, "learning_rate": 8.75299817850023e-07, "loss": 0.9964, "step": 38874 }, { "epoch": 0.73, "learning_rate": 8.751837134604421e-07, "loss": 1.1388, "step": 38875 }, { "epoch": 0.73, "learning_rate": 8.75067615137877e-07, "loss": 1.1205, "step": 38876 }, { "epoch": 0.73, "learning_rate": 8.74951522882759e-07, "loss": 0.7268, "step": 38877 }, { "epoch": 0.73, "learning_rate": 8.748354366955211e-07, "loss": 0.9602, "step": 38878 }, { "epoch": 0.73, "learning_rate": 8.747193565765999e-07, "loss": 0.6798, "step": 38879 }, { "epoch": 0.73, "learning_rate": 8.746032825264256e-07, "loss": 0.937, "step": 38880 }, { "epoch": 0.73, "learning_rate": 8.74487214545433e-07, "loss": 0.9595, "step": 38881 }, { "epoch": 0.73, "learning_rate": 8.743711526340551e-07, "loss": 0.9055, "step": 38882 }, { "epoch": 0.73, "learning_rate": 8.742550967927257e-07, "loss": 1.081, "step": 38883 }, { "epoch": 0.73, "learning_rate": 8.741390470218777e-07, "loss": 0.926, "step": 38884 }, { "epoch": 0.73, "learning_rate": 8.740230033219449e-07, "loss": 0.7617, "step": 38885 }, { "epoch": 0.73, "learning_rate": 8.73906965693361e-07, "loss": 0.7665, "step": 38886 }, { "epoch": 0.73, "learning_rate": 8.737909341365572e-07, "loss": 0.9678, "step": 38887 }, { "epoch": 0.73, "learning_rate": 8.736749086519697e-07, "loss": 0.9333, "step": 38888 }, { "epoch": 0.73, "learning_rate": 8.735588892400293e-07, "loss": 0.8592, "step": 38889 }, { "epoch": 0.73, "learning_rate": 8.734428759011701e-07, "loss": 0.9801, "step": 38890 }, { "epoch": 0.73, "learning_rate": 8.733268686358256e-07, "loss": 1.0258, "step": 38891 }, { "epoch": 0.73, "learning_rate": 8.732108674444284e-07, "loss": 0.8696, "step": 38892 }, { "epoch": 0.73, "learning_rate": 8.730948723274121e-07, "loss": 0.9807, "step": 38893 }, { "epoch": 0.73, "learning_rate": 8.729788832852099e-07, "loss": 0.9461, "step": 38894 }, { "epoch": 0.73, "learning_rate": 8.728629003182551e-07, "loss": 0.9557, "step": 38895 }, { "epoch": 0.73, "learning_rate": 8.727469234269789e-07, "loss": 0.7149, "step": 38896 }, { "epoch": 0.73, "learning_rate": 8.726309526118174e-07, "loss": 0.7707, "step": 38897 }, { "epoch": 0.73, "learning_rate": 8.725149878732011e-07, "loss": 0.9684, "step": 38898 }, { "epoch": 0.73, "learning_rate": 8.723990292115633e-07, "loss": 0.9008, "step": 38899 }, { "epoch": 0.73, "learning_rate": 8.722830766273391e-07, "loss": 0.8354, "step": 38900 }, { "epoch": 0.73, "learning_rate": 8.721671301209591e-07, "loss": 0.8003, "step": 38901 }, { "epoch": 0.73, "learning_rate": 8.720511896928574e-07, "loss": 0.6416, "step": 38902 }, { "epoch": 0.73, "learning_rate": 8.719352553434665e-07, "loss": 0.9632, "step": 38903 }, { "epoch": 0.73, "learning_rate": 8.718193270732195e-07, "loss": 0.974, "step": 38904 }, { "epoch": 0.73, "learning_rate": 8.717034048825491e-07, "loss": 0.9021, "step": 38905 }, { "epoch": 0.73, "learning_rate": 8.715874887718884e-07, "loss": 0.9116, "step": 38906 }, { "epoch": 0.73, "learning_rate": 8.714715787416708e-07, "loss": 1.0455, "step": 38907 }, { "epoch": 0.73, "learning_rate": 8.713556747923265e-07, "loss": 1.0166, "step": 38908 }, { "epoch": 0.73, "learning_rate": 8.712397769242922e-07, "loss": 1.0213, "step": 38909 }, { "epoch": 0.73, "learning_rate": 8.711238851379977e-07, "loss": 0.835, "step": 38910 }, { "epoch": 0.73, "learning_rate": 8.710079994338769e-07, "loss": 1.176, "step": 38911 }, { "epoch": 0.73, "learning_rate": 8.708921198123619e-07, "loss": 1.2617, "step": 38912 }, { "epoch": 0.73, "learning_rate": 8.707762462738859e-07, "loss": 0.9274, "step": 38913 }, { "epoch": 0.73, "learning_rate": 8.706603788188814e-07, "loss": 0.9899, "step": 38914 }, { "epoch": 0.73, "learning_rate": 8.705445174477814e-07, "loss": 0.6812, "step": 38915 }, { "epoch": 0.73, "learning_rate": 8.704286621610186e-07, "loss": 0.598, "step": 38916 }, { "epoch": 0.73, "learning_rate": 8.703128129590238e-07, "loss": 0.8334, "step": 38917 }, { "epoch": 0.73, "learning_rate": 8.701969698422328e-07, "loss": 0.9414, "step": 38918 }, { "epoch": 0.73, "learning_rate": 8.70081132811075e-07, "loss": 1.0872, "step": 38919 }, { "epoch": 0.73, "learning_rate": 8.69965301865984e-07, "loss": 0.7658, "step": 38920 }, { "epoch": 0.73, "learning_rate": 8.69849477007394e-07, "loss": 0.9548, "step": 38921 }, { "epoch": 0.73, "learning_rate": 8.697336582357352e-07, "loss": 0.9003, "step": 38922 }, { "epoch": 0.73, "learning_rate": 8.696178455514409e-07, "loss": 0.7963, "step": 38923 }, { "epoch": 0.73, "learning_rate": 8.695020389549439e-07, "loss": 0.9479, "step": 38924 }, { "epoch": 0.73, "learning_rate": 8.693862384466759e-07, "loss": 1.1217, "step": 38925 }, { "epoch": 0.73, "learning_rate": 8.692704440270699e-07, "loss": 0.8584, "step": 38926 }, { "epoch": 0.73, "learning_rate": 8.69154655696558e-07, "loss": 0.977, "step": 38927 }, { "epoch": 0.73, "learning_rate": 8.690388734555735e-07, "loss": 0.7833, "step": 38928 }, { "epoch": 0.73, "learning_rate": 8.689230973045459e-07, "loss": 0.8641, "step": 38929 }, { "epoch": 0.73, "learning_rate": 8.688073272439116e-07, "loss": 0.872, "step": 38930 }, { "epoch": 0.73, "learning_rate": 8.686915632740995e-07, "loss": 1.0476, "step": 38931 }, { "epoch": 0.73, "learning_rate": 8.685758053955431e-07, "loss": 0.9091, "step": 38932 }, { "epoch": 0.73, "learning_rate": 8.684600536086749e-07, "loss": 0.9883, "step": 38933 }, { "epoch": 0.73, "learning_rate": 8.683443079139268e-07, "loss": 0.8676, "step": 38934 }, { "epoch": 0.73, "learning_rate": 8.682285683117309e-07, "loss": 1.0074, "step": 38935 }, { "epoch": 0.73, "learning_rate": 8.681128348025194e-07, "loss": 0.6436, "step": 38936 }, { "epoch": 0.73, "learning_rate": 8.679971073867255e-07, "loss": 1.03, "step": 38937 }, { "epoch": 0.73, "learning_rate": 8.678813860647787e-07, "loss": 1.1557, "step": 38938 }, { "epoch": 0.73, "learning_rate": 8.677656708371135e-07, "loss": 0.8357, "step": 38939 }, { "epoch": 0.73, "learning_rate": 8.67649961704162e-07, "loss": 0.7149, "step": 38940 }, { "epoch": 0.73, "learning_rate": 8.675342586663541e-07, "loss": 0.821, "step": 38941 }, { "epoch": 0.73, "learning_rate": 8.674185617241246e-07, "loss": 0.7998, "step": 38942 }, { "epoch": 0.73, "learning_rate": 8.673028708779036e-07, "loss": 0.9637, "step": 38943 }, { "epoch": 0.73, "learning_rate": 8.671871861281234e-07, "loss": 1.0239, "step": 38944 }, { "epoch": 0.73, "learning_rate": 8.670715074752162e-07, "loss": 0.8631, "step": 38945 }, { "epoch": 0.73, "learning_rate": 8.669558349196141e-07, "loss": 1.0656, "step": 38946 }, { "epoch": 0.73, "learning_rate": 8.668401684617486e-07, "loss": 1.0007, "step": 38947 }, { "epoch": 0.73, "learning_rate": 8.66724508102052e-07, "loss": 0.8334, "step": 38948 }, { "epoch": 0.73, "learning_rate": 8.66608853840957e-07, "loss": 0.8981, "step": 38949 }, { "epoch": 0.73, "learning_rate": 8.664932056788925e-07, "loss": 1.0891, "step": 38950 }, { "epoch": 0.73, "learning_rate": 8.663775636162941e-07, "loss": 1.123, "step": 38951 }, { "epoch": 0.73, "learning_rate": 8.662619276535908e-07, "loss": 0.9074, "step": 38952 }, { "epoch": 0.73, "learning_rate": 8.661462977912155e-07, "loss": 0.8647, "step": 38953 }, { "epoch": 0.73, "learning_rate": 8.660306740295998e-07, "loss": 0.8196, "step": 38954 }, { "epoch": 0.73, "learning_rate": 8.659150563691756e-07, "loss": 0.9677, "step": 38955 }, { "epoch": 0.73, "learning_rate": 8.657994448103743e-07, "loss": 1.2264, "step": 38956 }, { "epoch": 0.73, "learning_rate": 8.65683839353628e-07, "loss": 1.0234, "step": 38957 }, { "epoch": 0.74, "learning_rate": 8.655682399993687e-07, "loss": 0.8443, "step": 38958 }, { "epoch": 0.74, "learning_rate": 8.654526467480257e-07, "loss": 0.9697, "step": 38959 }, { "epoch": 0.74, "learning_rate": 8.653370596000336e-07, "loss": 0.6662, "step": 38960 }, { "epoch": 0.74, "learning_rate": 8.652214785558233e-07, "loss": 0.895, "step": 38961 }, { "epoch": 0.74, "learning_rate": 8.651059036158244e-07, "loss": 1.268, "step": 38962 }, { "epoch": 0.74, "learning_rate": 8.649903347804717e-07, "loss": 0.7981, "step": 38963 }, { "epoch": 0.74, "learning_rate": 8.64874772050194e-07, "loss": 0.8449, "step": 38964 }, { "epoch": 0.74, "learning_rate": 8.647592154254236e-07, "loss": 0.9641, "step": 38965 }, { "epoch": 0.74, "learning_rate": 8.646436649065923e-07, "loss": 0.8699, "step": 38966 }, { "epoch": 0.74, "learning_rate": 8.645281204941317e-07, "loss": 0.7258, "step": 38967 }, { "epoch": 0.74, "learning_rate": 8.644125821884725e-07, "loss": 0.9602, "step": 38968 }, { "epoch": 0.74, "learning_rate": 8.642970499900469e-07, "loss": 0.9236, "step": 38969 }, { "epoch": 0.74, "learning_rate": 8.641815238992865e-07, "loss": 1.0073, "step": 38970 }, { "epoch": 0.74, "learning_rate": 8.640660039166207e-07, "loss": 0.6555, "step": 38971 }, { "epoch": 0.74, "learning_rate": 8.639504900424839e-07, "loss": 0.9281, "step": 38972 }, { "epoch": 0.74, "learning_rate": 8.638349822773049e-07, "loss": 0.8416, "step": 38973 }, { "epoch": 0.74, "learning_rate": 8.63719480621516e-07, "loss": 0.9805, "step": 38974 }, { "epoch": 0.74, "learning_rate": 8.636039850755482e-07, "loss": 0.94, "step": 38975 }, { "epoch": 0.74, "learning_rate": 8.634884956398332e-07, "loss": 0.8456, "step": 38976 }, { "epoch": 0.74, "learning_rate": 8.633730123148018e-07, "loss": 0.9749, "step": 38977 }, { "epoch": 0.74, "learning_rate": 8.632575351008854e-07, "loss": 0.939, "step": 38978 }, { "epoch": 0.74, "learning_rate": 8.631420639985161e-07, "loss": 0.7493, "step": 38979 }, { "epoch": 0.74, "learning_rate": 8.630265990081224e-07, "loss": 0.9702, "step": 38980 }, { "epoch": 0.74, "learning_rate": 8.629111401301382e-07, "loss": 1.1859, "step": 38981 }, { "epoch": 0.74, "learning_rate": 8.627956873649943e-07, "loss": 0.9482, "step": 38982 }, { "epoch": 0.74, "learning_rate": 8.626802407131194e-07, "loss": 0.8511, "step": 38983 }, { "epoch": 0.74, "learning_rate": 8.625648001749481e-07, "loss": 0.9628, "step": 38984 }, { "epoch": 0.74, "learning_rate": 8.624493657509086e-07, "loss": 0.7974, "step": 38985 }, { "epoch": 0.74, "learning_rate": 8.62333937441433e-07, "loss": 0.8178, "step": 38986 }, { "epoch": 0.74, "learning_rate": 8.622185152469526e-07, "loss": 1.0739, "step": 38987 }, { "epoch": 0.74, "learning_rate": 8.621030991678978e-07, "loss": 0.7919, "step": 38988 }, { "epoch": 0.74, "learning_rate": 8.619876892046997e-07, "loss": 0.8164, "step": 38989 }, { "epoch": 0.74, "learning_rate": 8.618722853577894e-07, "loss": 0.8737, "step": 38990 }, { "epoch": 0.74, "learning_rate": 8.617568876275986e-07, "loss": 0.9792, "step": 38991 }, { "epoch": 0.74, "learning_rate": 8.616414960145555e-07, "loss": 0.7293, "step": 38992 }, { "epoch": 0.74, "learning_rate": 8.615261105190947e-07, "loss": 1.0442, "step": 38993 }, { "epoch": 0.74, "learning_rate": 8.614107311416444e-07, "loss": 0.9552, "step": 38994 }, { "epoch": 0.74, "learning_rate": 8.612953578826361e-07, "loss": 0.802, "step": 38995 }, { "epoch": 0.74, "learning_rate": 8.611799907425009e-07, "loss": 0.8679, "step": 38996 }, { "epoch": 0.74, "learning_rate": 8.61064629721669e-07, "loss": 0.8972, "step": 38997 }, { "epoch": 0.74, "learning_rate": 8.609492748205716e-07, "loss": 0.7203, "step": 38998 }, { "epoch": 0.74, "learning_rate": 8.608339260396398e-07, "loss": 1.0188, "step": 38999 }, { "epoch": 0.74, "learning_rate": 8.607185833793041e-07, "loss": 0.9879, "step": 39000 }, { "epoch": 0.74, "learning_rate": 8.606032468399936e-07, "loss": 1.0186, "step": 39001 }, { "epoch": 0.74, "learning_rate": 8.604879164221411e-07, "loss": 0.8799, "step": 39002 }, { "epoch": 0.74, "learning_rate": 8.603725921261772e-07, "loss": 1.0012, "step": 39003 }, { "epoch": 0.74, "learning_rate": 8.602572739525303e-07, "loss": 0.965, "step": 39004 }, { "epoch": 0.74, "learning_rate": 8.601419619016337e-07, "loss": 0.8294, "step": 39005 }, { "epoch": 0.74, "learning_rate": 8.600266559739165e-07, "loss": 1.2063, "step": 39006 }, { "epoch": 0.74, "learning_rate": 8.599113561698092e-07, "loss": 0.8883, "step": 39007 }, { "epoch": 0.74, "learning_rate": 8.597960624897425e-07, "loss": 0.8574, "step": 39008 }, { "epoch": 0.74, "learning_rate": 8.59680774934147e-07, "loss": 0.9136, "step": 39009 }, { "epoch": 0.74, "learning_rate": 8.595654935034534e-07, "loss": 0.8354, "step": 39010 }, { "epoch": 0.74, "learning_rate": 8.594502181980918e-07, "loss": 1.0424, "step": 39011 }, { "epoch": 0.74, "learning_rate": 8.593349490184938e-07, "loss": 1.0892, "step": 39012 }, { "epoch": 0.74, "learning_rate": 8.59219685965087e-07, "loss": 0.8109, "step": 39013 }, { "epoch": 0.74, "learning_rate": 8.591044290383052e-07, "loss": 0.7079, "step": 39014 }, { "epoch": 0.74, "learning_rate": 8.589891782385762e-07, "loss": 0.9513, "step": 39015 }, { "epoch": 0.74, "learning_rate": 8.588739335663316e-07, "loss": 0.8127, "step": 39016 }, { "epoch": 0.74, "learning_rate": 8.587586950220012e-07, "loss": 0.9037, "step": 39017 }, { "epoch": 0.74, "learning_rate": 8.586434626060156e-07, "loss": 1.0225, "step": 39018 }, { "epoch": 0.74, "learning_rate": 8.585282363188049e-07, "loss": 1.2667, "step": 39019 }, { "epoch": 0.74, "learning_rate": 8.584130161607996e-07, "loss": 0.6933, "step": 39020 }, { "epoch": 0.74, "learning_rate": 8.582978021324304e-07, "loss": 0.9575, "step": 39021 }, { "epoch": 0.74, "learning_rate": 8.581825942341254e-07, "loss": 0.8987, "step": 39022 }, { "epoch": 0.74, "learning_rate": 8.580673924663169e-07, "loss": 0.9145, "step": 39023 }, { "epoch": 0.74, "learning_rate": 8.579521968294355e-07, "loss": 1.0338, "step": 39024 }, { "epoch": 0.74, "learning_rate": 8.578370073239084e-07, "loss": 0.9901, "step": 39025 }, { "epoch": 0.74, "learning_rate": 8.577218239501692e-07, "loss": 0.997, "step": 39026 }, { "epoch": 0.74, "learning_rate": 8.576066467086455e-07, "loss": 0.9396, "step": 39027 }, { "epoch": 0.74, "learning_rate": 8.574914755997682e-07, "loss": 0.8813, "step": 39028 }, { "epoch": 0.74, "learning_rate": 8.573763106239677e-07, "loss": 0.8191, "step": 39029 }, { "epoch": 0.74, "learning_rate": 8.572611517816734e-07, "loss": 0.9285, "step": 39030 }, { "epoch": 0.74, "learning_rate": 8.571459990733155e-07, "loss": 1.1945, "step": 39031 }, { "epoch": 0.74, "learning_rate": 8.570308524993242e-07, "loss": 0.8296, "step": 39032 }, { "epoch": 0.74, "learning_rate": 8.569157120601304e-07, "loss": 0.9092, "step": 39033 }, { "epoch": 0.74, "learning_rate": 8.568005777561611e-07, "loss": 1.0504, "step": 39034 }, { "epoch": 0.74, "learning_rate": 8.566854495878496e-07, "loss": 0.8035, "step": 39035 }, { "epoch": 0.74, "learning_rate": 8.565703275556237e-07, "loss": 0.9222, "step": 39036 }, { "epoch": 0.74, "learning_rate": 8.564552116599134e-07, "loss": 1.0365, "step": 39037 }, { "epoch": 0.74, "learning_rate": 8.563401019011491e-07, "loss": 1.0508, "step": 39038 }, { "epoch": 0.74, "learning_rate": 8.562249982797608e-07, "loss": 0.9543, "step": 39039 }, { "epoch": 0.74, "learning_rate": 8.561099007961776e-07, "loss": 0.7974, "step": 39040 }, { "epoch": 0.74, "learning_rate": 8.559948094508296e-07, "loss": 0.7541, "step": 39041 }, { "epoch": 0.74, "learning_rate": 8.558797242441475e-07, "loss": 0.7696, "step": 39042 }, { "epoch": 0.74, "learning_rate": 8.557646451765586e-07, "loss": 1.1453, "step": 39043 }, { "epoch": 0.74, "learning_rate": 8.556495722484947e-07, "loss": 1.1701, "step": 39044 }, { "epoch": 0.74, "learning_rate": 8.555345054603858e-07, "loss": 0.9915, "step": 39045 }, { "epoch": 0.74, "learning_rate": 8.55419444812659e-07, "loss": 0.9137, "step": 39046 }, { "epoch": 0.74, "learning_rate": 8.553043903057471e-07, "loss": 0.9072, "step": 39047 }, { "epoch": 0.74, "learning_rate": 8.551893419400776e-07, "loss": 0.9067, "step": 39048 }, { "epoch": 0.74, "learning_rate": 8.550742997160805e-07, "loss": 1.1059, "step": 39049 }, { "epoch": 0.74, "learning_rate": 8.549592636341855e-07, "loss": 1.0283, "step": 39050 }, { "epoch": 0.74, "learning_rate": 8.548442336948221e-07, "loss": 0.7351, "step": 39051 }, { "epoch": 0.74, "learning_rate": 8.5472920989842e-07, "loss": 0.8954, "step": 39052 }, { "epoch": 0.74, "learning_rate": 8.546141922454088e-07, "loss": 0.8269, "step": 39053 }, { "epoch": 0.74, "learning_rate": 8.544991807362182e-07, "loss": 0.7879, "step": 39054 }, { "epoch": 0.74, "learning_rate": 8.543841753712758e-07, "loss": 0.8531, "step": 39055 }, { "epoch": 0.74, "learning_rate": 8.542691761510141e-07, "loss": 0.979, "step": 39056 }, { "epoch": 0.74, "learning_rate": 8.541541830758599e-07, "loss": 0.9518, "step": 39057 }, { "epoch": 0.74, "learning_rate": 8.540391961462435e-07, "loss": 0.8449, "step": 39058 }, { "epoch": 0.74, "learning_rate": 8.539242153625943e-07, "loss": 0.9012, "step": 39059 }, { "epoch": 0.74, "learning_rate": 8.538092407253418e-07, "loss": 0.7549, "step": 39060 }, { "epoch": 0.74, "learning_rate": 8.536942722349148e-07, "loss": 0.999, "step": 39061 }, { "epoch": 0.74, "learning_rate": 8.53579309891743e-07, "loss": 0.8506, "step": 39062 }, { "epoch": 0.74, "learning_rate": 8.534643536962567e-07, "loss": 1.0061, "step": 39063 }, { "epoch": 0.74, "learning_rate": 8.533494036488821e-07, "loss": 0.9264, "step": 39064 }, { "epoch": 0.74, "learning_rate": 8.532344597500511e-07, "loss": 0.6535, "step": 39065 }, { "epoch": 0.74, "learning_rate": 8.531195220001931e-07, "loss": 0.7764, "step": 39066 }, { "epoch": 0.74, "learning_rate": 8.530045903997347e-07, "loss": 0.9044, "step": 39067 }, { "epoch": 0.74, "learning_rate": 8.52889664949108e-07, "loss": 1.094, "step": 39068 }, { "epoch": 0.74, "learning_rate": 8.527747456487404e-07, "loss": 0.9374, "step": 39069 }, { "epoch": 0.74, "learning_rate": 8.526598324990612e-07, "loss": 1.0884, "step": 39070 }, { "epoch": 0.74, "learning_rate": 8.525449255004997e-07, "loss": 0.7798, "step": 39071 }, { "epoch": 0.74, "learning_rate": 8.524300246534847e-07, "loss": 0.9686, "step": 39072 }, { "epoch": 0.74, "learning_rate": 8.523151299584458e-07, "loss": 0.8092, "step": 39073 }, { "epoch": 0.74, "learning_rate": 8.522002414158114e-07, "loss": 0.8644, "step": 39074 }, { "epoch": 0.74, "learning_rate": 8.52085359026012e-07, "loss": 1.0865, "step": 39075 }, { "epoch": 0.74, "learning_rate": 8.519704827894734e-07, "loss": 1.0005, "step": 39076 }, { "epoch": 0.74, "learning_rate": 8.518556127066282e-07, "loss": 0.769, "step": 39077 }, { "epoch": 0.74, "learning_rate": 8.517407487779028e-07, "loss": 0.7549, "step": 39078 }, { "epoch": 0.74, "learning_rate": 8.51625891003727e-07, "loss": 0.7547, "step": 39079 }, { "epoch": 0.74, "learning_rate": 8.515110393845294e-07, "loss": 0.85, "step": 39080 }, { "epoch": 0.74, "learning_rate": 8.513961939207391e-07, "loss": 1.1359, "step": 39081 }, { "epoch": 0.74, "learning_rate": 8.512813546127848e-07, "loss": 0.8035, "step": 39082 }, { "epoch": 0.74, "learning_rate": 8.511665214610953e-07, "loss": 0.9271, "step": 39083 }, { "epoch": 0.74, "learning_rate": 8.510516944661007e-07, "loss": 0.9101, "step": 39084 }, { "epoch": 0.74, "learning_rate": 8.509368736282265e-07, "loss": 0.8067, "step": 39085 }, { "epoch": 0.74, "learning_rate": 8.508220589479043e-07, "loss": 0.7015, "step": 39086 }, { "epoch": 0.74, "learning_rate": 8.507072504255628e-07, "loss": 1.1975, "step": 39087 }, { "epoch": 0.74, "learning_rate": 8.505924480616284e-07, "loss": 0.8817, "step": 39088 }, { "epoch": 0.74, "learning_rate": 8.504776518565327e-07, "loss": 0.994, "step": 39089 }, { "epoch": 0.74, "learning_rate": 8.503628618107021e-07, "loss": 0.5771, "step": 39090 }, { "epoch": 0.74, "learning_rate": 8.502480779245658e-07, "loss": 0.8761, "step": 39091 }, { "epoch": 0.74, "learning_rate": 8.501333001985529e-07, "loss": 0.8087, "step": 39092 }, { "epoch": 0.74, "learning_rate": 8.500185286330917e-07, "loss": 1.0983, "step": 39093 }, { "epoch": 0.74, "learning_rate": 8.499037632286106e-07, "loss": 0.8637, "step": 39094 }, { "epoch": 0.74, "learning_rate": 8.49789003985538e-07, "loss": 1.0859, "step": 39095 }, { "epoch": 0.74, "learning_rate": 8.496742509043038e-07, "loss": 0.7465, "step": 39096 }, { "epoch": 0.74, "learning_rate": 8.495595039853336e-07, "loss": 0.7743, "step": 39097 }, { "epoch": 0.74, "learning_rate": 8.494447632290592e-07, "loss": 0.8654, "step": 39098 }, { "epoch": 0.74, "learning_rate": 8.493300286359069e-07, "loss": 1.0232, "step": 39099 }, { "epoch": 0.74, "learning_rate": 8.492153002063052e-07, "loss": 0.8394, "step": 39100 }, { "epoch": 0.74, "learning_rate": 8.491005779406833e-07, "loss": 1.2852, "step": 39101 }, { "epoch": 0.74, "learning_rate": 8.489858618394692e-07, "loss": 0.7508, "step": 39102 }, { "epoch": 0.74, "learning_rate": 8.48871151903092e-07, "loss": 0.8947, "step": 39103 }, { "epoch": 0.74, "learning_rate": 8.487564481319777e-07, "loss": 0.6255, "step": 39104 }, { "epoch": 0.74, "learning_rate": 8.486417505265579e-07, "loss": 0.948, "step": 39105 }, { "epoch": 0.74, "learning_rate": 8.485270590872583e-07, "loss": 0.9305, "step": 39106 }, { "epoch": 0.74, "learning_rate": 8.48412373814507e-07, "loss": 1.0602, "step": 39107 }, { "epoch": 0.74, "learning_rate": 8.482976947087351e-07, "loss": 1.0512, "step": 39108 }, { "epoch": 0.74, "learning_rate": 8.481830217703682e-07, "loss": 1.0588, "step": 39109 }, { "epoch": 0.74, "learning_rate": 8.480683549998353e-07, "loss": 0.8068, "step": 39110 }, { "epoch": 0.74, "learning_rate": 8.479536943975642e-07, "loss": 0.8871, "step": 39111 }, { "epoch": 0.74, "learning_rate": 8.478390399639835e-07, "loss": 0.98, "step": 39112 }, { "epoch": 0.74, "learning_rate": 8.477243916995212e-07, "loss": 1.0566, "step": 39113 }, { "epoch": 0.74, "learning_rate": 8.476097496046054e-07, "loss": 0.7967, "step": 39114 }, { "epoch": 0.74, "learning_rate": 8.474951136796649e-07, "loss": 0.8517, "step": 39115 }, { "epoch": 0.74, "learning_rate": 8.473804839251254e-07, "loss": 0.8495, "step": 39116 }, { "epoch": 0.74, "learning_rate": 8.47265860341418e-07, "loss": 0.8557, "step": 39117 }, { "epoch": 0.74, "learning_rate": 8.471512429289685e-07, "loss": 0.9244, "step": 39118 }, { "epoch": 0.74, "learning_rate": 8.470366316882056e-07, "loss": 1.0324, "step": 39119 }, { "epoch": 0.74, "learning_rate": 8.469220266195571e-07, "loss": 1.1066, "step": 39120 }, { "epoch": 0.74, "learning_rate": 8.468074277234514e-07, "loss": 0.8672, "step": 39121 }, { "epoch": 0.74, "learning_rate": 8.466928350003159e-07, "loss": 0.8551, "step": 39122 }, { "epoch": 0.74, "learning_rate": 8.465782484505786e-07, "loss": 0.7938, "step": 39123 }, { "epoch": 0.74, "learning_rate": 8.464636680746683e-07, "loss": 0.7767, "step": 39124 }, { "epoch": 0.74, "learning_rate": 8.463490938730101e-07, "loss": 1.0613, "step": 39125 }, { "epoch": 0.74, "learning_rate": 8.462345258460356e-07, "loss": 1.0919, "step": 39126 }, { "epoch": 0.74, "learning_rate": 8.461199639941697e-07, "loss": 0.8078, "step": 39127 }, { "epoch": 0.74, "learning_rate": 8.460054083178404e-07, "loss": 0.8321, "step": 39128 }, { "epoch": 0.74, "learning_rate": 8.458908588174777e-07, "loss": 0.8555, "step": 39129 }, { "epoch": 0.74, "learning_rate": 8.457763154935072e-07, "loss": 0.7937, "step": 39130 }, { "epoch": 0.74, "learning_rate": 8.456617783463572e-07, "loss": 1.0356, "step": 39131 }, { "epoch": 0.74, "learning_rate": 8.455472473764553e-07, "loss": 0.9479, "step": 39132 }, { "epoch": 0.74, "learning_rate": 8.45432722584229e-07, "loss": 1.09, "step": 39133 }, { "epoch": 0.74, "learning_rate": 8.453182039701066e-07, "loss": 0.914, "step": 39134 }, { "epoch": 0.74, "learning_rate": 8.452036915345152e-07, "loss": 0.8782, "step": 39135 }, { "epoch": 0.74, "learning_rate": 8.450891852778834e-07, "loss": 1.0352, "step": 39136 }, { "epoch": 0.74, "learning_rate": 8.449746852006358e-07, "loss": 0.8437, "step": 39137 }, { "epoch": 0.74, "learning_rate": 8.44860191303204e-07, "loss": 0.8054, "step": 39138 }, { "epoch": 0.74, "learning_rate": 8.447457035860124e-07, "loss": 0.9222, "step": 39139 }, { "epoch": 0.74, "learning_rate": 8.446312220494898e-07, "loss": 0.9437, "step": 39140 }, { "epoch": 0.74, "learning_rate": 8.445167466940635e-07, "loss": 0.9077, "step": 39141 }, { "epoch": 0.74, "learning_rate": 8.444022775201607e-07, "loss": 1.0352, "step": 39142 }, { "epoch": 0.74, "learning_rate": 8.442878145282094e-07, "loss": 0.8727, "step": 39143 }, { "epoch": 0.74, "learning_rate": 8.441733577186362e-07, "loss": 1.1519, "step": 39144 }, { "epoch": 0.74, "learning_rate": 8.4405890709187e-07, "loss": 0.8517, "step": 39145 }, { "epoch": 0.74, "learning_rate": 8.439444626483353e-07, "loss": 0.9763, "step": 39146 }, { "epoch": 0.74, "learning_rate": 8.438300243884628e-07, "loss": 0.8997, "step": 39147 }, { "epoch": 0.74, "learning_rate": 8.437155923126774e-07, "loss": 0.8867, "step": 39148 }, { "epoch": 0.74, "learning_rate": 8.436011664214067e-07, "loss": 0.9206, "step": 39149 }, { "epoch": 0.74, "learning_rate": 8.434867467150798e-07, "loss": 1.1115, "step": 39150 }, { "epoch": 0.74, "learning_rate": 8.433723331941218e-07, "loss": 0.8764, "step": 39151 }, { "epoch": 0.74, "learning_rate": 8.432579258589607e-07, "loss": 0.856, "step": 39152 }, { "epoch": 0.74, "learning_rate": 8.431435247100236e-07, "loss": 0.7916, "step": 39153 }, { "epoch": 0.74, "learning_rate": 8.43029129747738e-07, "loss": 0.6944, "step": 39154 }, { "epoch": 0.74, "learning_rate": 8.429147409725307e-07, "loss": 1.137, "step": 39155 }, { "epoch": 0.74, "learning_rate": 8.42800358384829e-07, "loss": 1.0969, "step": 39156 }, { "epoch": 0.74, "learning_rate": 8.426859819850608e-07, "loss": 0.7533, "step": 39157 }, { "epoch": 0.74, "learning_rate": 8.425716117736507e-07, "loss": 0.9147, "step": 39158 }, { "epoch": 0.74, "learning_rate": 8.42457247751029e-07, "loss": 0.7986, "step": 39159 }, { "epoch": 0.74, "learning_rate": 8.423428899176203e-07, "loss": 0.9272, "step": 39160 }, { "epoch": 0.74, "learning_rate": 8.422285382738524e-07, "loss": 0.92, "step": 39161 }, { "epoch": 0.74, "learning_rate": 8.421141928201523e-07, "loss": 0.8636, "step": 39162 }, { "epoch": 0.74, "learning_rate": 8.419998535569471e-07, "loss": 1.0094, "step": 39163 }, { "epoch": 0.74, "learning_rate": 8.418855204846635e-07, "loss": 0.9249, "step": 39164 }, { "epoch": 0.74, "learning_rate": 8.417711936037285e-07, "loss": 0.7908, "step": 39165 }, { "epoch": 0.74, "learning_rate": 8.416568729145699e-07, "loss": 0.849, "step": 39166 }, { "epoch": 0.74, "learning_rate": 8.41542558417612e-07, "loss": 0.6143, "step": 39167 }, { "epoch": 0.74, "learning_rate": 8.41428250113285e-07, "loss": 0.9526, "step": 39168 }, { "epoch": 0.74, "learning_rate": 8.413139480020133e-07, "loss": 0.8828, "step": 39169 }, { "epoch": 0.74, "learning_rate": 8.411996520842236e-07, "loss": 0.9924, "step": 39170 }, { "epoch": 0.74, "learning_rate": 8.410853623603451e-07, "loss": 0.8685, "step": 39171 }, { "epoch": 0.74, "learning_rate": 8.409710788308023e-07, "loss": 0.8301, "step": 39172 }, { "epoch": 0.74, "learning_rate": 8.408568014960225e-07, "loss": 0.8381, "step": 39173 }, { "epoch": 0.74, "learning_rate": 8.407425303564326e-07, "loss": 0.9492, "step": 39174 }, { "epoch": 0.74, "learning_rate": 8.406282654124592e-07, "loss": 1.0026, "step": 39175 }, { "epoch": 0.74, "learning_rate": 8.40514006664529e-07, "loss": 1.0107, "step": 39176 }, { "epoch": 0.74, "learning_rate": 8.403997541130684e-07, "loss": 0.71, "step": 39177 }, { "epoch": 0.74, "learning_rate": 8.402855077585054e-07, "loss": 0.7923, "step": 39178 }, { "epoch": 0.74, "learning_rate": 8.401712676012636e-07, "loss": 0.7795, "step": 39179 }, { "epoch": 0.74, "learning_rate": 8.400570336417733e-07, "loss": 0.8932, "step": 39180 }, { "epoch": 0.74, "learning_rate": 8.399428058804579e-07, "loss": 1.0676, "step": 39181 }, { "epoch": 0.74, "learning_rate": 8.398285843177454e-07, "loss": 1.0723, "step": 39182 }, { "epoch": 0.74, "learning_rate": 8.397143689540621e-07, "loss": 0.7078, "step": 39183 }, { "epoch": 0.74, "learning_rate": 8.396001597898343e-07, "loss": 1.0499, "step": 39184 }, { "epoch": 0.74, "learning_rate": 8.394859568254887e-07, "loss": 0.892, "step": 39185 }, { "epoch": 0.74, "learning_rate": 8.393717600614515e-07, "loss": 0.8146, "step": 39186 }, { "epoch": 0.74, "learning_rate": 8.392575694981503e-07, "loss": 0.9534, "step": 39187 }, { "epoch": 0.74, "learning_rate": 8.391433851360084e-07, "loss": 0.7994, "step": 39188 }, { "epoch": 0.74, "learning_rate": 8.390292069754561e-07, "loss": 1.1388, "step": 39189 }, { "epoch": 0.74, "learning_rate": 8.38915035016917e-07, "loss": 1.0878, "step": 39190 }, { "epoch": 0.74, "learning_rate": 8.388008692608174e-07, "loss": 0.9811, "step": 39191 }, { "epoch": 0.74, "learning_rate": 8.38686709707586e-07, "loss": 0.7491, "step": 39192 }, { "epoch": 0.74, "learning_rate": 8.385725563576466e-07, "loss": 0.7711, "step": 39193 }, { "epoch": 0.74, "learning_rate": 8.384584092114264e-07, "loss": 0.9926, "step": 39194 }, { "epoch": 0.74, "learning_rate": 8.383442682693516e-07, "loss": 1.0762, "step": 39195 }, { "epoch": 0.74, "learning_rate": 8.382301335318482e-07, "loss": 0.9509, "step": 39196 }, { "epoch": 0.74, "learning_rate": 8.381160049993428e-07, "loss": 0.8301, "step": 39197 }, { "epoch": 0.74, "learning_rate": 8.38001882672261e-07, "loss": 0.9506, "step": 39198 }, { "epoch": 0.74, "learning_rate": 8.378877665510301e-07, "loss": 1.0176, "step": 39199 }, { "epoch": 0.74, "learning_rate": 8.377736566360739e-07, "loss": 1.0101, "step": 39200 }, { "epoch": 0.74, "learning_rate": 8.376595529278214e-07, "loss": 0.8766, "step": 39201 }, { "epoch": 0.74, "learning_rate": 8.375454554266962e-07, "loss": 0.9773, "step": 39202 }, { "epoch": 0.74, "learning_rate": 8.374313641331255e-07, "loss": 0.8782, "step": 39203 }, { "epoch": 0.74, "learning_rate": 8.373172790475351e-07, "loss": 0.8199, "step": 39204 }, { "epoch": 0.74, "learning_rate": 8.372032001703509e-07, "loss": 0.8069, "step": 39205 }, { "epoch": 0.74, "learning_rate": 8.370891275019988e-07, "loss": 0.9814, "step": 39206 }, { "epoch": 0.74, "learning_rate": 8.369750610429053e-07, "loss": 0.9457, "step": 39207 }, { "epoch": 0.74, "learning_rate": 8.368610007934966e-07, "loss": 0.7736, "step": 39208 }, { "epoch": 0.74, "learning_rate": 8.367469467541961e-07, "loss": 0.8574, "step": 39209 }, { "epoch": 0.74, "learning_rate": 8.366328989254332e-07, "loss": 0.8019, "step": 39210 }, { "epoch": 0.74, "learning_rate": 8.365188573076313e-07, "loss": 0.9017, "step": 39211 }, { "epoch": 0.74, "learning_rate": 8.364048219012163e-07, "loss": 0.7361, "step": 39212 }, { "epoch": 0.74, "learning_rate": 8.362907927066164e-07, "loss": 0.768, "step": 39213 }, { "epoch": 0.74, "learning_rate": 8.361767697242545e-07, "loss": 0.8391, "step": 39214 }, { "epoch": 0.74, "learning_rate": 8.360627529545579e-07, "loss": 0.8589, "step": 39215 }, { "epoch": 0.74, "learning_rate": 8.359487423979514e-07, "loss": 0.8475, "step": 39216 }, { "epoch": 0.74, "learning_rate": 8.358347380548617e-07, "loss": 0.9365, "step": 39217 }, { "epoch": 0.74, "learning_rate": 8.357207399257142e-07, "loss": 1.0756, "step": 39218 }, { "epoch": 0.74, "learning_rate": 8.356067480109343e-07, "loss": 0.8863, "step": 39219 }, { "epoch": 0.74, "learning_rate": 8.354927623109485e-07, "loss": 0.9474, "step": 39220 }, { "epoch": 0.74, "learning_rate": 8.3537878282618e-07, "loss": 0.7557, "step": 39221 }, { "epoch": 0.74, "learning_rate": 8.352648095570579e-07, "loss": 0.9113, "step": 39222 }, { "epoch": 0.74, "learning_rate": 8.35150842504005e-07, "loss": 0.7336, "step": 39223 }, { "epoch": 0.74, "learning_rate": 8.350368816674479e-07, "loss": 0.8704, "step": 39224 }, { "epoch": 0.74, "learning_rate": 8.349229270478118e-07, "loss": 1.1242, "step": 39225 }, { "epoch": 0.74, "learning_rate": 8.348089786455226e-07, "loss": 0.8261, "step": 39226 }, { "epoch": 0.74, "learning_rate": 8.346950364610056e-07, "loss": 0.882, "step": 39227 }, { "epoch": 0.74, "learning_rate": 8.345811004946864e-07, "loss": 0.8028, "step": 39228 }, { "epoch": 0.74, "learning_rate": 8.344671707469912e-07, "loss": 0.8182, "step": 39229 }, { "epoch": 0.74, "learning_rate": 8.343532472183425e-07, "loss": 0.7971, "step": 39230 }, { "epoch": 0.74, "learning_rate": 8.342393299091697e-07, "loss": 1.1315, "step": 39231 }, { "epoch": 0.74, "learning_rate": 8.341254188198952e-07, "loss": 0.94, "step": 39232 }, { "epoch": 0.74, "learning_rate": 8.340115139509444e-07, "loss": 0.8295, "step": 39233 }, { "epoch": 0.74, "learning_rate": 8.338976153027454e-07, "loss": 0.9971, "step": 39234 }, { "epoch": 0.74, "learning_rate": 8.337837228757207e-07, "loss": 0.7929, "step": 39235 }, { "epoch": 0.74, "learning_rate": 8.336698366702964e-07, "loss": 1.0517, "step": 39236 }, { "epoch": 0.74, "learning_rate": 8.335559566868978e-07, "loss": 1.3231, "step": 39237 }, { "epoch": 0.74, "learning_rate": 8.334420829259504e-07, "loss": 0.8675, "step": 39238 }, { "epoch": 0.74, "learning_rate": 8.333282153878788e-07, "loss": 0.8197, "step": 39239 }, { "epoch": 0.74, "learning_rate": 8.332143540731089e-07, "loss": 0.8617, "step": 39240 }, { "epoch": 0.74, "learning_rate": 8.331004989820662e-07, "loss": 0.8306, "step": 39241 }, { "epoch": 0.74, "learning_rate": 8.329866501151735e-07, "loss": 0.904, "step": 39242 }, { "epoch": 0.74, "learning_rate": 8.328728074728593e-07, "loss": 1.0884, "step": 39243 }, { "epoch": 0.74, "learning_rate": 8.327589710555459e-07, "loss": 0.9734, "step": 39244 }, { "epoch": 0.74, "learning_rate": 8.326451408636593e-07, "loss": 0.9685, "step": 39245 }, { "epoch": 0.74, "learning_rate": 8.325313168976248e-07, "loss": 0.8633, "step": 39246 }, { "epoch": 0.74, "learning_rate": 8.324174991578671e-07, "loss": 0.9624, "step": 39247 }, { "epoch": 0.74, "learning_rate": 8.323036876448115e-07, "loss": 0.7344, "step": 39248 }, { "epoch": 0.74, "learning_rate": 8.321898823588829e-07, "loss": 0.9933, "step": 39249 }, { "epoch": 0.74, "learning_rate": 8.320760833005068e-07, "loss": 1.2244, "step": 39250 }, { "epoch": 0.74, "learning_rate": 8.319622904701056e-07, "loss": 1.0345, "step": 39251 }, { "epoch": 0.74, "learning_rate": 8.318485038681079e-07, "loss": 0.8386, "step": 39252 }, { "epoch": 0.74, "learning_rate": 8.31734723494936e-07, "loss": 0.9444, "step": 39253 }, { "epoch": 0.74, "learning_rate": 8.316209493510147e-07, "loss": 0.6083, "step": 39254 }, { "epoch": 0.74, "learning_rate": 8.315071814367712e-07, "loss": 0.9044, "step": 39255 }, { "epoch": 0.74, "learning_rate": 8.313934197526277e-07, "loss": 1.0741, "step": 39256 }, { "epoch": 0.74, "learning_rate": 8.312796642990104e-07, "loss": 1.0375, "step": 39257 }, { "epoch": 0.74, "learning_rate": 8.311659150763432e-07, "loss": 0.8039, "step": 39258 }, { "epoch": 0.74, "learning_rate": 8.310521720850518e-07, "loss": 0.999, "step": 39259 }, { "epoch": 0.74, "learning_rate": 8.3093843532556e-07, "loss": 0.7459, "step": 39260 }, { "epoch": 0.74, "learning_rate": 8.308247047982932e-07, "loss": 0.8428, "step": 39261 }, { "epoch": 0.74, "learning_rate": 8.307109805036765e-07, "loss": 1.1635, "step": 39262 }, { "epoch": 0.74, "learning_rate": 8.305972624421321e-07, "loss": 0.9579, "step": 39263 }, { "epoch": 0.74, "learning_rate": 8.30483550614088e-07, "loss": 0.8565, "step": 39264 }, { "epoch": 0.74, "learning_rate": 8.303698450199663e-07, "loss": 0.9312, "step": 39265 }, { "epoch": 0.74, "learning_rate": 8.302561456601926e-07, "loss": 0.8858, "step": 39266 }, { "epoch": 0.74, "learning_rate": 8.301424525351911e-07, "loss": 0.9348, "step": 39267 }, { "epoch": 0.74, "learning_rate": 8.300287656453865e-07, "loss": 1.0349, "step": 39268 }, { "epoch": 0.74, "learning_rate": 8.299150849912033e-07, "loss": 0.8866, "step": 39269 }, { "epoch": 0.74, "learning_rate": 8.298014105730659e-07, "loss": 0.931, "step": 39270 }, { "epoch": 0.74, "learning_rate": 8.296877423913996e-07, "loss": 0.8757, "step": 39271 }, { "epoch": 0.74, "learning_rate": 8.295740804466266e-07, "loss": 0.8876, "step": 39272 }, { "epoch": 0.74, "learning_rate": 8.294604247391744e-07, "loss": 0.8237, "step": 39273 }, { "epoch": 0.74, "learning_rate": 8.293467752694648e-07, "loss": 0.7938, "step": 39274 }, { "epoch": 0.74, "learning_rate": 8.292331320379224e-07, "loss": 0.9982, "step": 39275 }, { "epoch": 0.74, "learning_rate": 8.291194950449738e-07, "loss": 1.0234, "step": 39276 }, { "epoch": 0.74, "learning_rate": 8.29005864291041e-07, "loss": 0.7775, "step": 39277 }, { "epoch": 0.74, "learning_rate": 8.288922397765489e-07, "loss": 0.9038, "step": 39278 }, { "epoch": 0.74, "learning_rate": 8.287786215019223e-07, "loss": 0.9979, "step": 39279 }, { "epoch": 0.74, "learning_rate": 8.28665009467585e-07, "loss": 0.9379, "step": 39280 }, { "epoch": 0.74, "learning_rate": 8.285514036739611e-07, "loss": 0.9875, "step": 39281 }, { "epoch": 0.74, "learning_rate": 8.284378041214749e-07, "loss": 0.8792, "step": 39282 }, { "epoch": 0.74, "learning_rate": 8.283242108105519e-07, "loss": 0.8558, "step": 39283 }, { "epoch": 0.74, "learning_rate": 8.282106237416132e-07, "loss": 1.0372, "step": 39284 }, { "epoch": 0.74, "learning_rate": 8.280970429150865e-07, "loss": 0.8787, "step": 39285 }, { "epoch": 0.74, "learning_rate": 8.279834683313934e-07, "loss": 0.9818, "step": 39286 }, { "epoch": 0.74, "learning_rate": 8.278698999909585e-07, "loss": 1.0813, "step": 39287 }, { "epoch": 0.74, "learning_rate": 8.277563378942064e-07, "loss": 1.0894, "step": 39288 }, { "epoch": 0.74, "learning_rate": 8.276427820415605e-07, "loss": 0.8692, "step": 39289 }, { "epoch": 0.74, "learning_rate": 8.275292324334455e-07, "loss": 0.8392, "step": 39290 }, { "epoch": 0.74, "learning_rate": 8.274156890702851e-07, "loss": 0.923, "step": 39291 }, { "epoch": 0.74, "learning_rate": 8.27302151952504e-07, "loss": 0.9255, "step": 39292 }, { "epoch": 0.74, "learning_rate": 8.271886210805235e-07, "loss": 1.0569, "step": 39293 }, { "epoch": 0.74, "learning_rate": 8.270750964547713e-07, "loss": 0.9535, "step": 39294 }, { "epoch": 0.74, "learning_rate": 8.269615780756688e-07, "loss": 0.9604, "step": 39295 }, { "epoch": 0.74, "learning_rate": 8.268480659436392e-07, "loss": 0.798, "step": 39296 }, { "epoch": 0.74, "learning_rate": 8.267345600591095e-07, "loss": 0.7718, "step": 39297 }, { "epoch": 0.74, "learning_rate": 8.266210604225006e-07, "loss": 0.8669, "step": 39298 }, { "epoch": 0.74, "learning_rate": 8.265075670342376e-07, "loss": 0.833, "step": 39299 }, { "epoch": 0.74, "learning_rate": 8.263940798947439e-07, "loss": 0.9279, "step": 39300 }, { "epoch": 0.74, "learning_rate": 8.262805990044434e-07, "loss": 0.9593, "step": 39301 }, { "epoch": 0.74, "learning_rate": 8.261671243637598e-07, "loss": 0.9615, "step": 39302 }, { "epoch": 0.74, "learning_rate": 8.260536559731169e-07, "loss": 0.8155, "step": 39303 }, { "epoch": 0.74, "learning_rate": 8.259401938329392e-07, "loss": 1.0231, "step": 39304 }, { "epoch": 0.74, "learning_rate": 8.258267379436477e-07, "loss": 0.9005, "step": 39305 }, { "epoch": 0.74, "learning_rate": 8.257132883056695e-07, "loss": 0.9783, "step": 39306 }, { "epoch": 0.74, "learning_rate": 8.255998449194258e-07, "loss": 1.1601, "step": 39307 }, { "epoch": 0.74, "learning_rate": 8.254864077853411e-07, "loss": 0.8157, "step": 39308 }, { "epoch": 0.74, "learning_rate": 8.253729769038385e-07, "loss": 0.6735, "step": 39309 }, { "epoch": 0.74, "learning_rate": 8.25259552275342e-07, "loss": 0.8976, "step": 39310 }, { "epoch": 0.74, "learning_rate": 8.25146133900275e-07, "loss": 0.9125, "step": 39311 }, { "epoch": 0.74, "learning_rate": 8.25032721779061e-07, "loss": 1.1481, "step": 39312 }, { "epoch": 0.74, "learning_rate": 8.249193159121244e-07, "loss": 1.1089, "step": 39313 }, { "epoch": 0.74, "learning_rate": 8.248059162998859e-07, "loss": 0.893, "step": 39314 }, { "epoch": 0.74, "learning_rate": 8.246925229427721e-07, "loss": 0.9432, "step": 39315 }, { "epoch": 0.74, "learning_rate": 8.245791358412048e-07, "loss": 1.001, "step": 39316 }, { "epoch": 0.74, "learning_rate": 8.244657549956064e-07, "loss": 0.9554, "step": 39317 }, { "epoch": 0.74, "learning_rate": 8.243523804064033e-07, "loss": 1.0212, "step": 39318 }, { "epoch": 0.74, "learning_rate": 8.242390120740162e-07, "loss": 0.9941, "step": 39319 }, { "epoch": 0.74, "learning_rate": 8.241256499988693e-07, "loss": 1.0395, "step": 39320 }, { "epoch": 0.74, "learning_rate": 8.240122941813857e-07, "loss": 0.9177, "step": 39321 }, { "epoch": 0.74, "learning_rate": 8.238989446219888e-07, "loss": 0.9042, "step": 39322 }, { "epoch": 0.74, "learning_rate": 8.237856013211021e-07, "loss": 0.8601, "step": 39323 }, { "epoch": 0.74, "learning_rate": 8.236722642791484e-07, "loss": 1.0248, "step": 39324 }, { "epoch": 0.74, "learning_rate": 8.235589334965518e-07, "loss": 1.0002, "step": 39325 }, { "epoch": 0.74, "learning_rate": 8.234456089737333e-07, "loss": 0.9852, "step": 39326 }, { "epoch": 0.74, "learning_rate": 8.23332290711119e-07, "loss": 0.9818, "step": 39327 }, { "epoch": 0.74, "learning_rate": 8.232189787091299e-07, "loss": 0.9719, "step": 39328 }, { "epoch": 0.74, "learning_rate": 8.231056729681896e-07, "loss": 0.9311, "step": 39329 }, { "epoch": 0.74, "learning_rate": 8.229923734887212e-07, "loss": 0.9451, "step": 39330 }, { "epoch": 0.74, "learning_rate": 8.228790802711479e-07, "loss": 1.0283, "step": 39331 }, { "epoch": 0.74, "learning_rate": 8.227657933158928e-07, "loss": 0.9984, "step": 39332 }, { "epoch": 0.74, "learning_rate": 8.226525126233786e-07, "loss": 0.9724, "step": 39333 }, { "epoch": 0.74, "learning_rate": 8.225392381940295e-07, "loss": 0.7832, "step": 39334 }, { "epoch": 0.74, "learning_rate": 8.224259700282666e-07, "loss": 0.8716, "step": 39335 }, { "epoch": 0.74, "learning_rate": 8.223127081265137e-07, "loss": 0.9647, "step": 39336 }, { "epoch": 0.74, "learning_rate": 8.221994524891936e-07, "loss": 0.9346, "step": 39337 }, { "epoch": 0.74, "learning_rate": 8.220862031167293e-07, "loss": 1.0619, "step": 39338 }, { "epoch": 0.74, "learning_rate": 8.219729600095438e-07, "loss": 1.0082, "step": 39339 }, { "epoch": 0.74, "learning_rate": 8.218597231680597e-07, "loss": 0.9962, "step": 39340 }, { "epoch": 0.74, "learning_rate": 8.217464925927007e-07, "loss": 0.9089, "step": 39341 }, { "epoch": 0.74, "learning_rate": 8.216332682838873e-07, "loss": 0.7487, "step": 39342 }, { "epoch": 0.74, "learning_rate": 8.215200502420448e-07, "loss": 0.9067, "step": 39343 }, { "epoch": 0.74, "learning_rate": 8.214068384675958e-07, "loss": 1.2223, "step": 39344 }, { "epoch": 0.74, "learning_rate": 8.212936329609602e-07, "loss": 0.9073, "step": 39345 }, { "epoch": 0.74, "learning_rate": 8.211804337225646e-07, "loss": 0.9246, "step": 39346 }, { "epoch": 0.74, "learning_rate": 8.210672407528289e-07, "loss": 0.8162, "step": 39347 }, { "epoch": 0.74, "learning_rate": 8.209540540521765e-07, "loss": 0.9692, "step": 39348 }, { "epoch": 0.74, "learning_rate": 8.208408736210304e-07, "loss": 1.0067, "step": 39349 }, { "epoch": 0.74, "learning_rate": 8.207276994598131e-07, "loss": 1.103, "step": 39350 }, { "epoch": 0.74, "learning_rate": 8.206145315689467e-07, "loss": 0.97, "step": 39351 }, { "epoch": 0.74, "learning_rate": 8.205013699488546e-07, "loss": 0.844, "step": 39352 }, { "epoch": 0.74, "learning_rate": 8.203882145999595e-07, "loss": 0.9653, "step": 39353 }, { "epoch": 0.74, "learning_rate": 8.202750655226816e-07, "loss": 0.8546, "step": 39354 }, { "epoch": 0.74, "learning_rate": 8.201619227174468e-07, "loss": 0.8669, "step": 39355 }, { "epoch": 0.74, "learning_rate": 8.200487861846751e-07, "loss": 1.1588, "step": 39356 }, { "epoch": 0.74, "learning_rate": 8.199356559247895e-07, "loss": 1.1154, "step": 39357 }, { "epoch": 0.74, "learning_rate": 8.198225319382127e-07, "loss": 0.886, "step": 39358 }, { "epoch": 0.74, "learning_rate": 8.197094142253672e-07, "loss": 0.8596, "step": 39359 }, { "epoch": 0.74, "learning_rate": 8.195963027866752e-07, "loss": 0.7549, "step": 39360 }, { "epoch": 0.74, "learning_rate": 8.194831976225592e-07, "loss": 0.8371, "step": 39361 }, { "epoch": 0.74, "learning_rate": 8.193700987334421e-07, "loss": 1.0814, "step": 39362 }, { "epoch": 0.74, "learning_rate": 8.192570061197438e-07, "loss": 1.0356, "step": 39363 }, { "epoch": 0.74, "learning_rate": 8.191439197818893e-07, "loss": 0.9255, "step": 39364 }, { "epoch": 0.74, "learning_rate": 8.190308397203006e-07, "loss": 0.971, "step": 39365 }, { "epoch": 0.74, "learning_rate": 8.189177659353975e-07, "loss": 0.7032, "step": 39366 }, { "epoch": 0.74, "learning_rate": 8.188046984276057e-07, "loss": 1.1357, "step": 39367 }, { "epoch": 0.74, "learning_rate": 8.186916371973446e-07, "loss": 1.1968, "step": 39368 }, { "epoch": 0.74, "learning_rate": 8.185785822450376e-07, "loss": 1.1033, "step": 39369 }, { "epoch": 0.74, "learning_rate": 8.184655335711065e-07, "loss": 0.7218, "step": 39370 }, { "epoch": 0.74, "learning_rate": 8.183524911759735e-07, "loss": 0.9673, "step": 39371 }, { "epoch": 0.74, "learning_rate": 8.182394550600608e-07, "loss": 0.9263, "step": 39372 }, { "epoch": 0.74, "learning_rate": 8.181264252237905e-07, "loss": 0.9866, "step": 39373 }, { "epoch": 0.74, "learning_rate": 8.180134016675853e-07, "loss": 0.7157, "step": 39374 }, { "epoch": 0.74, "learning_rate": 8.179003843918648e-07, "loss": 1.007, "step": 39375 }, { "epoch": 0.74, "learning_rate": 8.177873733970543e-07, "loss": 0.9614, "step": 39376 }, { "epoch": 0.74, "learning_rate": 8.176743686835736e-07, "loss": 0.9048, "step": 39377 }, { "epoch": 0.74, "learning_rate": 8.175613702518451e-07, "loss": 0.7584, "step": 39378 }, { "epoch": 0.74, "learning_rate": 8.174483781022907e-07, "loss": 0.8856, "step": 39379 }, { "epoch": 0.74, "learning_rate": 8.173353922353325e-07, "loss": 0.9112, "step": 39380 }, { "epoch": 0.74, "learning_rate": 8.172224126513926e-07, "loss": 1.034, "step": 39381 }, { "epoch": 0.74, "learning_rate": 8.171094393508922e-07, "loss": 0.7661, "step": 39382 }, { "epoch": 0.74, "learning_rate": 8.169964723342546e-07, "loss": 1.1085, "step": 39383 }, { "epoch": 0.74, "learning_rate": 8.168835116018991e-07, "loss": 0.9839, "step": 39384 }, { "epoch": 0.74, "learning_rate": 8.167705571542494e-07, "loss": 0.815, "step": 39385 }, { "epoch": 0.74, "learning_rate": 8.16657608991728e-07, "loss": 1.0396, "step": 39386 }, { "epoch": 0.74, "learning_rate": 8.165446671147537e-07, "loss": 0.8986, "step": 39387 }, { "epoch": 0.74, "learning_rate": 8.164317315237516e-07, "loss": 1.176, "step": 39388 }, { "epoch": 0.74, "learning_rate": 8.163188022191412e-07, "loss": 0.7376, "step": 39389 }, { "epoch": 0.74, "learning_rate": 8.162058792013445e-07, "loss": 0.9708, "step": 39390 }, { "epoch": 0.74, "learning_rate": 8.160929624707837e-07, "loss": 0.8765, "step": 39391 }, { "epoch": 0.74, "learning_rate": 8.159800520278799e-07, "loss": 0.9387, "step": 39392 }, { "epoch": 0.74, "learning_rate": 8.158671478730548e-07, "loss": 1.1101, "step": 39393 }, { "epoch": 0.74, "learning_rate": 8.157542500067304e-07, "loss": 1.0874, "step": 39394 }, { "epoch": 0.74, "learning_rate": 8.156413584293288e-07, "loss": 0.8954, "step": 39395 }, { "epoch": 0.74, "learning_rate": 8.155284731412691e-07, "loss": 0.9201, "step": 39396 }, { "epoch": 0.74, "learning_rate": 8.154155941429759e-07, "loss": 0.8433, "step": 39397 }, { "epoch": 0.74, "learning_rate": 8.153027214348686e-07, "loss": 0.704, "step": 39398 }, { "epoch": 0.74, "learning_rate": 8.151898550173692e-07, "loss": 0.936, "step": 39399 }, { "epoch": 0.74, "learning_rate": 8.150769948908993e-07, "loss": 1.0534, "step": 39400 }, { "epoch": 0.74, "learning_rate": 8.149641410558801e-07, "loss": 0.718, "step": 39401 }, { "epoch": 0.74, "learning_rate": 8.148512935127331e-07, "loss": 0.8075, "step": 39402 }, { "epoch": 0.74, "learning_rate": 8.147384522618798e-07, "loss": 0.8166, "step": 39403 }, { "epoch": 0.74, "learning_rate": 8.146256173037423e-07, "loss": 0.7365, "step": 39404 }, { "epoch": 0.74, "learning_rate": 8.145127886387394e-07, "loss": 1.1743, "step": 39405 }, { "epoch": 0.74, "learning_rate": 8.14399966267295e-07, "loss": 1.0396, "step": 39406 }, { "epoch": 0.74, "learning_rate": 8.1428715018983e-07, "loss": 0.9418, "step": 39407 }, { "epoch": 0.74, "learning_rate": 8.141743404067637e-07, "loss": 1.0409, "step": 39408 }, { "epoch": 0.74, "learning_rate": 8.140615369185204e-07, "loss": 0.8675, "step": 39409 }, { "epoch": 0.74, "learning_rate": 8.139487397255186e-07, "loss": 0.8133, "step": 39410 }, { "epoch": 0.74, "learning_rate": 8.138359488281805e-07, "loss": 0.8572, "step": 39411 }, { "epoch": 0.74, "learning_rate": 8.137231642269275e-07, "loss": 1.1324, "step": 39412 }, { "epoch": 0.74, "learning_rate": 8.136103859221802e-07, "loss": 1.2108, "step": 39413 }, { "epoch": 0.74, "learning_rate": 8.134976139143603e-07, "loss": 0.8382, "step": 39414 }, { "epoch": 0.74, "learning_rate": 8.133848482038884e-07, "loss": 0.853, "step": 39415 }, { "epoch": 0.74, "learning_rate": 8.132720887911866e-07, "loss": 0.9279, "step": 39416 }, { "epoch": 0.74, "learning_rate": 8.131593356766737e-07, "loss": 0.9862, "step": 39417 }, { "epoch": 0.74, "learning_rate": 8.130465888607736e-07, "loss": 1.0291, "step": 39418 }, { "epoch": 0.74, "learning_rate": 8.129338483439047e-07, "loss": 0.9954, "step": 39419 }, { "epoch": 0.74, "learning_rate": 8.128211141264893e-07, "loss": 1.1001, "step": 39420 }, { "epoch": 0.74, "learning_rate": 8.127083862089485e-07, "loss": 0.9935, "step": 39421 }, { "epoch": 0.74, "learning_rate": 8.125956645917024e-07, "loss": 0.8609, "step": 39422 }, { "epoch": 0.74, "learning_rate": 8.124829492751727e-07, "loss": 0.8799, "step": 39423 }, { "epoch": 0.74, "learning_rate": 8.123702402597797e-07, "loss": 0.9531, "step": 39424 }, { "epoch": 0.74, "learning_rate": 8.122575375459452e-07, "loss": 0.9572, "step": 39425 }, { "epoch": 0.74, "learning_rate": 8.121448411340879e-07, "loss": 1.0405, "step": 39426 }, { "epoch": 0.74, "learning_rate": 8.120321510246306e-07, "loss": 0.7732, "step": 39427 }, { "epoch": 0.74, "learning_rate": 8.119194672179945e-07, "loss": 0.9568, "step": 39428 }, { "epoch": 0.74, "learning_rate": 8.118067897145976e-07, "loss": 1.0391, "step": 39429 }, { "epoch": 0.74, "learning_rate": 8.116941185148642e-07, "loss": 0.863, "step": 39430 }, { "epoch": 0.74, "learning_rate": 8.11581453619212e-07, "loss": 1.1303, "step": 39431 }, { "epoch": 0.74, "learning_rate": 8.114687950280633e-07, "loss": 0.872, "step": 39432 }, { "epoch": 0.74, "learning_rate": 8.113561427418381e-07, "loss": 0.8574, "step": 39433 }, { "epoch": 0.74, "learning_rate": 8.112434967609575e-07, "loss": 0.8982, "step": 39434 }, { "epoch": 0.74, "learning_rate": 8.111308570858417e-07, "loss": 0.9937, "step": 39435 }, { "epoch": 0.74, "learning_rate": 8.110182237169115e-07, "loss": 0.9929, "step": 39436 }, { "epoch": 0.74, "learning_rate": 8.109055966545885e-07, "loss": 1.1522, "step": 39437 }, { "epoch": 0.74, "learning_rate": 8.107929758992905e-07, "loss": 1.0524, "step": 39438 }, { "epoch": 0.74, "learning_rate": 8.106803614514411e-07, "loss": 0.8091, "step": 39439 }, { "epoch": 0.74, "learning_rate": 8.105677533114589e-07, "loss": 0.8822, "step": 39440 }, { "epoch": 0.74, "learning_rate": 8.104551514797648e-07, "loss": 0.7071, "step": 39441 }, { "epoch": 0.74, "learning_rate": 8.103425559567796e-07, "loss": 0.8265, "step": 39442 }, { "epoch": 0.74, "learning_rate": 8.102299667429231e-07, "loss": 1.1363, "step": 39443 }, { "epoch": 0.74, "learning_rate": 8.101173838386164e-07, "loss": 1.006, "step": 39444 }, { "epoch": 0.74, "learning_rate": 8.100048072442793e-07, "loss": 1.0342, "step": 39445 }, { "epoch": 0.74, "learning_rate": 8.098922369603335e-07, "loss": 1.0163, "step": 39446 }, { "epoch": 0.74, "learning_rate": 8.097796729871965e-07, "loss": 0.794, "step": 39447 }, { "epoch": 0.74, "learning_rate": 8.096671153252913e-07, "loss": 1.0173, "step": 39448 }, { "epoch": 0.74, "learning_rate": 8.095545639750379e-07, "loss": 0.8871, "step": 39449 }, { "epoch": 0.74, "learning_rate": 8.094420189368546e-07, "loss": 1.1671, "step": 39450 }, { "epoch": 0.74, "learning_rate": 8.093294802111643e-07, "loss": 0.9275, "step": 39451 }, { "epoch": 0.74, "learning_rate": 8.092169477983852e-07, "loss": 0.9457, "step": 39452 }, { "epoch": 0.74, "learning_rate": 8.091044216989383e-07, "loss": 0.9251, "step": 39453 }, { "epoch": 0.74, "learning_rate": 8.089919019132433e-07, "loss": 0.6372, "step": 39454 }, { "epoch": 0.74, "learning_rate": 8.088793884417209e-07, "loss": 1.03, "step": 39455 }, { "epoch": 0.74, "learning_rate": 8.087668812847909e-07, "loss": 1.0379, "step": 39456 }, { "epoch": 0.74, "learning_rate": 8.086543804428737e-07, "loss": 1.045, "step": 39457 }, { "epoch": 0.74, "learning_rate": 8.085418859163899e-07, "loss": 0.8294, "step": 39458 }, { "epoch": 0.74, "learning_rate": 8.084293977057573e-07, "loss": 0.9342, "step": 39459 }, { "epoch": 0.74, "learning_rate": 8.08316915811399e-07, "loss": 0.726, "step": 39460 }, { "epoch": 0.74, "learning_rate": 8.082044402337328e-07, "loss": 0.8618, "step": 39461 }, { "epoch": 0.74, "learning_rate": 8.080919709731791e-07, "loss": 0.9259, "step": 39462 }, { "epoch": 0.74, "learning_rate": 8.079795080301583e-07, "loss": 0.8437, "step": 39463 }, { "epoch": 0.74, "learning_rate": 8.078670514050902e-07, "loss": 0.7426, "step": 39464 }, { "epoch": 0.74, "learning_rate": 8.077546010983944e-07, "loss": 0.7807, "step": 39465 }, { "epoch": 0.74, "learning_rate": 8.076421571104911e-07, "loss": 0.9296, "step": 39466 }, { "epoch": 0.74, "learning_rate": 8.075297194418011e-07, "loss": 0.831, "step": 39467 }, { "epoch": 0.74, "learning_rate": 8.074172880927413e-07, "loss": 0.9498, "step": 39468 }, { "epoch": 0.74, "learning_rate": 8.073048630637345e-07, "loss": 1.0168, "step": 39469 }, { "epoch": 0.74, "learning_rate": 8.071924443552001e-07, "loss": 0.9602, "step": 39470 }, { "epoch": 0.74, "learning_rate": 8.070800319675556e-07, "loss": 0.752, "step": 39471 }, { "epoch": 0.74, "learning_rate": 8.06967625901224e-07, "loss": 0.8694, "step": 39472 }, { "epoch": 0.74, "learning_rate": 8.068552261566229e-07, "loss": 0.6214, "step": 39473 }, { "epoch": 0.74, "learning_rate": 8.067428327341719e-07, "loss": 1.0608, "step": 39474 }, { "epoch": 0.74, "learning_rate": 8.066304456342916e-07, "loss": 1.0209, "step": 39475 }, { "epoch": 0.74, "learning_rate": 8.065180648574014e-07, "loss": 0.764, "step": 39476 }, { "epoch": 0.74, "learning_rate": 8.064056904039205e-07, "loss": 0.9156, "step": 39477 }, { "epoch": 0.74, "learning_rate": 8.062933222742692e-07, "loss": 0.7565, "step": 39478 }, { "epoch": 0.74, "learning_rate": 8.061809604688672e-07, "loss": 0.9667, "step": 39479 }, { "epoch": 0.74, "learning_rate": 8.060686049881319e-07, "loss": 0.7958, "step": 39480 }, { "epoch": 0.74, "learning_rate": 8.059562558324862e-07, "loss": 1.0428, "step": 39481 }, { "epoch": 0.74, "learning_rate": 8.05843913002347e-07, "loss": 0.955, "step": 39482 }, { "epoch": 0.74, "learning_rate": 8.057315764981349e-07, "loss": 0.7871, "step": 39483 }, { "epoch": 0.74, "learning_rate": 8.056192463202692e-07, "loss": 0.8969, "step": 39484 }, { "epoch": 0.74, "learning_rate": 8.055069224691692e-07, "loss": 0.9459, "step": 39485 }, { "epoch": 0.74, "learning_rate": 8.053946049452543e-07, "loss": 0.7657, "step": 39486 }, { "epoch": 0.74, "learning_rate": 8.052822937489441e-07, "loss": 0.9388, "step": 39487 }, { "epoch": 0.75, "learning_rate": 8.051699888806586e-07, "loss": 1.0684, "step": 39488 }, { "epoch": 0.75, "learning_rate": 8.050576903408147e-07, "loss": 0.9809, "step": 39489 }, { "epoch": 0.75, "learning_rate": 8.049453981298344e-07, "loss": 0.8345, "step": 39490 }, { "epoch": 0.75, "learning_rate": 8.048331122481364e-07, "loss": 0.7604, "step": 39491 }, { "epoch": 0.75, "learning_rate": 8.047208326961383e-07, "loss": 0.9127, "step": 39492 }, { "epoch": 0.75, "learning_rate": 8.046085594742626e-07, "loss": 1.0107, "step": 39493 }, { "epoch": 0.75, "learning_rate": 8.044962925829253e-07, "loss": 0.8482, "step": 39494 }, { "epoch": 0.75, "learning_rate": 8.043840320225468e-07, "loss": 0.8896, "step": 39495 }, { "epoch": 0.75, "learning_rate": 8.042717777935466e-07, "loss": 0.8561, "step": 39496 }, { "epoch": 0.75, "learning_rate": 8.041595298963434e-07, "loss": 0.9655, "step": 39497 }, { "epoch": 0.75, "learning_rate": 8.040472883313566e-07, "loss": 0.7048, "step": 39498 }, { "epoch": 0.75, "learning_rate": 8.039350530990053e-07, "loss": 1.0646, "step": 39499 }, { "epoch": 0.75, "learning_rate": 8.038228241997092e-07, "loss": 0.8059, "step": 39500 }, { "epoch": 0.75, "learning_rate": 8.03710601633885e-07, "loss": 1.0729, "step": 39501 }, { "epoch": 0.75, "learning_rate": 8.035983854019552e-07, "loss": 0.985, "step": 39502 }, { "epoch": 0.75, "learning_rate": 8.034861755043361e-07, "loss": 0.8613, "step": 39503 }, { "epoch": 0.75, "learning_rate": 8.033739719414477e-07, "loss": 0.8555, "step": 39504 }, { "epoch": 0.75, "learning_rate": 8.032617747137086e-07, "loss": 0.8246, "step": 39505 }, { "epoch": 0.75, "learning_rate": 8.031495838215384e-07, "loss": 1.109, "step": 39506 }, { "epoch": 0.75, "learning_rate": 8.030373992653553e-07, "loss": 0.924, "step": 39507 }, { "epoch": 0.75, "learning_rate": 8.029252210455785e-07, "loss": 0.8528, "step": 39508 }, { "epoch": 0.75, "learning_rate": 8.02813049162628e-07, "loss": 0.8828, "step": 39509 }, { "epoch": 0.75, "learning_rate": 8.027008836169198e-07, "loss": 0.7866, "step": 39510 }, { "epoch": 0.75, "learning_rate": 8.025887244088751e-07, "loss": 1.0327, "step": 39511 }, { "epoch": 0.75, "learning_rate": 8.024765715389129e-07, "loss": 1.0893, "step": 39512 }, { "epoch": 0.75, "learning_rate": 8.023644250074497e-07, "loss": 1.0785, "step": 39513 }, { "epoch": 0.75, "learning_rate": 8.022522848149073e-07, "loss": 0.9568, "step": 39514 }, { "epoch": 0.75, "learning_rate": 8.021401509617019e-07, "loss": 0.877, "step": 39515 }, { "epoch": 0.75, "learning_rate": 8.02028023448253e-07, "loss": 0.9927, "step": 39516 }, { "epoch": 0.75, "learning_rate": 8.019159022749798e-07, "loss": 0.793, "step": 39517 }, { "epoch": 0.75, "learning_rate": 8.018037874423001e-07, "loss": 0.9698, "step": 39518 }, { "epoch": 0.75, "learning_rate": 8.016916789506332e-07, "loss": 1.0001, "step": 39519 }, { "epoch": 0.75, "learning_rate": 8.015795768003975e-07, "loss": 0.9571, "step": 39520 }, { "epoch": 0.75, "learning_rate": 8.014674809920125e-07, "loss": 0.804, "step": 39521 }, { "epoch": 0.75, "learning_rate": 8.01355391525894e-07, "loss": 0.7484, "step": 39522 }, { "epoch": 0.75, "learning_rate": 8.012433084024642e-07, "loss": 0.979, "step": 39523 }, { "epoch": 0.75, "learning_rate": 8.01131231622139e-07, "loss": 0.9197, "step": 39524 }, { "epoch": 0.75, "learning_rate": 8.010191611853374e-07, "loss": 0.8491, "step": 39525 }, { "epoch": 0.75, "learning_rate": 8.009070970924785e-07, "loss": 0.7626, "step": 39526 }, { "epoch": 0.75, "learning_rate": 8.007950393439803e-07, "loss": 0.8976, "step": 39527 }, { "epoch": 0.75, "learning_rate": 8.006829879402611e-07, "loss": 0.822, "step": 39528 }, { "epoch": 0.75, "learning_rate": 8.005709428817399e-07, "loss": 0.7907, "step": 39529 }, { "epoch": 0.75, "learning_rate": 8.004589041688352e-07, "loss": 1.1121, "step": 39530 }, { "epoch": 0.75, "learning_rate": 8.003468718019634e-07, "loss": 1.1357, "step": 39531 }, { "epoch": 0.75, "learning_rate": 8.002348457815451e-07, "loss": 1.0118, "step": 39532 }, { "epoch": 0.75, "learning_rate": 8.001228261079985e-07, "loss": 0.8001, "step": 39533 }, { "epoch": 0.75, "learning_rate": 8.000108127817393e-07, "loss": 0.8439, "step": 39534 }, { "epoch": 0.75, "learning_rate": 7.998988058031895e-07, "loss": 0.8119, "step": 39535 }, { "epoch": 0.75, "learning_rate": 7.997868051727647e-07, "loss": 0.8793, "step": 39536 }, { "epoch": 0.75, "learning_rate": 7.996748108908836e-07, "loss": 1.1207, "step": 39537 }, { "epoch": 0.75, "learning_rate": 7.995628229579649e-07, "loss": 0.9536, "step": 39538 }, { "epoch": 0.75, "learning_rate": 7.994508413744262e-07, "loss": 0.8293, "step": 39539 }, { "epoch": 0.75, "learning_rate": 7.993388661406862e-07, "loss": 0.8899, "step": 39540 }, { "epoch": 0.75, "learning_rate": 7.992268972571623e-07, "loss": 0.8453, "step": 39541 }, { "epoch": 0.75, "learning_rate": 7.991149347242743e-07, "loss": 0.6876, "step": 39542 }, { "epoch": 0.75, "learning_rate": 7.990029785424371e-07, "loss": 1.077, "step": 39543 }, { "epoch": 0.75, "learning_rate": 7.988910287120724e-07, "loss": 0.7378, "step": 39544 }, { "epoch": 0.75, "learning_rate": 7.987790852335955e-07, "loss": 1.0543, "step": 39545 }, { "epoch": 0.75, "learning_rate": 7.986671481074246e-07, "loss": 0.8962, "step": 39546 }, { "epoch": 0.75, "learning_rate": 7.9855521733398e-07, "loss": 0.8932, "step": 39547 }, { "epoch": 0.75, "learning_rate": 7.98443292913677e-07, "loss": 0.9665, "step": 39548 }, { "epoch": 0.75, "learning_rate": 7.983313748469348e-07, "loss": 1.0251, "step": 39549 }, { "epoch": 0.75, "learning_rate": 7.982194631341711e-07, "loss": 1.3436, "step": 39550 }, { "epoch": 0.75, "learning_rate": 7.981075577758037e-07, "loss": 0.9097, "step": 39551 }, { "epoch": 0.75, "learning_rate": 7.979956587722507e-07, "loss": 0.9994, "step": 39552 }, { "epoch": 0.75, "learning_rate": 7.978837661239294e-07, "loss": 0.8636, "step": 39553 }, { "epoch": 0.75, "learning_rate": 7.977718798312589e-07, "loss": 0.8261, "step": 39554 }, { "epoch": 0.75, "learning_rate": 7.976599998946544e-07, "loss": 0.833, "step": 39555 }, { "epoch": 0.75, "learning_rate": 7.975481263145369e-07, "loss": 1.0173, "step": 39556 }, { "epoch": 0.75, "learning_rate": 7.974362590913215e-07, "loss": 0.9915, "step": 39557 }, { "epoch": 0.75, "learning_rate": 7.973243982254272e-07, "loss": 0.8586, "step": 39558 }, { "epoch": 0.75, "learning_rate": 7.972125437172711e-07, "loss": 0.7742, "step": 39559 }, { "epoch": 0.75, "learning_rate": 7.971006955672713e-07, "loss": 1.0189, "step": 39560 }, { "epoch": 0.75, "learning_rate": 7.969888537758455e-07, "loss": 0.9164, "step": 39561 }, { "epoch": 0.75, "learning_rate": 7.968770183434108e-07, "loss": 1.1928, "step": 39562 }, { "epoch": 0.75, "learning_rate": 7.967651892703859e-07, "loss": 0.9674, "step": 39563 }, { "epoch": 0.75, "learning_rate": 7.96653366557186e-07, "loss": 0.7948, "step": 39564 }, { "epoch": 0.75, "learning_rate": 7.96541550204232e-07, "loss": 0.7851, "step": 39565 }, { "epoch": 0.75, "learning_rate": 7.964297402119387e-07, "loss": 0.9337, "step": 39566 }, { "epoch": 0.75, "learning_rate": 7.963179365807245e-07, "loss": 0.9425, "step": 39567 }, { "epoch": 0.75, "learning_rate": 7.962061393110068e-07, "loss": 0.8972, "step": 39568 }, { "epoch": 0.75, "learning_rate": 7.960943484032033e-07, "loss": 1.1175, "step": 39569 }, { "epoch": 0.75, "learning_rate": 7.959825638577321e-07, "loss": 0.8211, "step": 39570 }, { "epoch": 0.75, "learning_rate": 7.958707856750078e-07, "loss": 0.8739, "step": 39571 }, { "epoch": 0.75, "learning_rate": 7.957590138554508e-07, "loss": 0.8341, "step": 39572 }, { "epoch": 0.75, "learning_rate": 7.956472483994781e-07, "loss": 0.7435, "step": 39573 }, { "epoch": 0.75, "learning_rate": 7.955354893075049e-07, "loss": 1.0993, "step": 39574 }, { "epoch": 0.75, "learning_rate": 7.954237365799513e-07, "loss": 1.1969, "step": 39575 }, { "epoch": 0.75, "learning_rate": 7.953119902172326e-07, "loss": 0.8259, "step": 39576 }, { "epoch": 0.75, "learning_rate": 7.952002502197664e-07, "loss": 0.829, "step": 39577 }, { "epoch": 0.75, "learning_rate": 7.950885165879704e-07, "loss": 0.8989, "step": 39578 }, { "epoch": 0.75, "learning_rate": 7.949767893222615e-07, "loss": 0.87, "step": 39579 }, { "epoch": 0.75, "learning_rate": 7.948650684230572e-07, "loss": 0.8813, "step": 39580 }, { "epoch": 0.75, "learning_rate": 7.947533538907742e-07, "loss": 1.1204, "step": 39581 }, { "epoch": 0.75, "learning_rate": 7.946416457258311e-07, "loss": 1.119, "step": 39582 }, { "epoch": 0.75, "learning_rate": 7.945299439286417e-07, "loss": 1.0816, "step": 39583 }, { "epoch": 0.75, "learning_rate": 7.944182484996271e-07, "loss": 0.9101, "step": 39584 }, { "epoch": 0.75, "learning_rate": 7.943065594392015e-07, "loss": 0.9358, "step": 39585 }, { "epoch": 0.75, "learning_rate": 7.94194876747783e-07, "loss": 0.8682, "step": 39586 }, { "epoch": 0.75, "learning_rate": 7.940832004257886e-07, "loss": 0.8804, "step": 39587 }, { "epoch": 0.75, "learning_rate": 7.939715304736351e-07, "loss": 1.0693, "step": 39588 }, { "epoch": 0.75, "learning_rate": 7.938598668917397e-07, "loss": 0.8736, "step": 39589 }, { "epoch": 0.75, "learning_rate": 7.937482096805191e-07, "loss": 1.003, "step": 39590 }, { "epoch": 0.75, "learning_rate": 7.936365588403913e-07, "loss": 0.821, "step": 39591 }, { "epoch": 0.75, "learning_rate": 7.935249143717704e-07, "loss": 0.729, "step": 39592 }, { "epoch": 0.75, "learning_rate": 7.934132762750763e-07, "loss": 0.8535, "step": 39593 }, { "epoch": 0.75, "learning_rate": 7.933016445507255e-07, "loss": 0.9489, "step": 39594 }, { "epoch": 0.75, "learning_rate": 7.931900191991324e-07, "loss": 0.8834, "step": 39595 }, { "epoch": 0.75, "learning_rate": 7.930784002207167e-07, "loss": 0.8214, "step": 39596 }, { "epoch": 0.75, "learning_rate": 7.929667876158933e-07, "loss": 0.8077, "step": 39597 }, { "epoch": 0.75, "learning_rate": 7.928551813850799e-07, "loss": 0.85, "step": 39598 }, { "epoch": 0.75, "learning_rate": 7.927435815286927e-07, "loss": 0.9894, "step": 39599 }, { "epoch": 0.75, "learning_rate": 7.926319880471483e-07, "loss": 1.1375, "step": 39600 }, { "epoch": 0.75, "learning_rate": 7.925204009408641e-07, "loss": 1.1407, "step": 39601 }, { "epoch": 0.75, "learning_rate": 7.924088202102562e-07, "loss": 0.8299, "step": 39602 }, { "epoch": 0.75, "learning_rate": 7.922972458557423e-07, "loss": 0.7962, "step": 39603 }, { "epoch": 0.75, "learning_rate": 7.921856778777365e-07, "loss": 0.7588, "step": 39604 }, { "epoch": 0.75, "learning_rate": 7.920741162766585e-07, "loss": 0.79, "step": 39605 }, { "epoch": 0.75, "learning_rate": 7.919625610529228e-07, "loss": 1.1357, "step": 39606 }, { "epoch": 0.75, "learning_rate": 7.918510122069464e-07, "loss": 0.8313, "step": 39607 }, { "epoch": 0.75, "learning_rate": 7.917394697391459e-07, "loss": 0.765, "step": 39608 }, { "epoch": 0.75, "learning_rate": 7.91627933649938e-07, "loss": 0.9827, "step": 39609 }, { "epoch": 0.75, "learning_rate": 7.915164039397389e-07, "loss": 0.9222, "step": 39610 }, { "epoch": 0.75, "learning_rate": 7.914048806089652e-07, "loss": 0.7293, "step": 39611 }, { "epoch": 0.75, "learning_rate": 7.912933636580339e-07, "loss": 1.2325, "step": 39612 }, { "epoch": 0.75, "learning_rate": 7.911818530873593e-07, "loss": 0.8613, "step": 39613 }, { "epoch": 0.75, "learning_rate": 7.910703488973603e-07, "loss": 0.7846, "step": 39614 }, { "epoch": 0.75, "learning_rate": 7.909588510884527e-07, "loss": 0.9147, "step": 39615 }, { "epoch": 0.75, "learning_rate": 7.908473596610511e-07, "loss": 0.8441, "step": 39616 }, { "epoch": 0.75, "learning_rate": 7.907358746155744e-07, "loss": 0.8447, "step": 39617 }, { "epoch": 0.75, "learning_rate": 7.906243959524368e-07, "loss": 1.0332, "step": 39618 }, { "epoch": 0.75, "learning_rate": 7.905129236720552e-07, "loss": 0.9425, "step": 39619 }, { "epoch": 0.75, "learning_rate": 7.904014577748461e-07, "loss": 0.926, "step": 39620 }, { "epoch": 0.75, "learning_rate": 7.902899982612255e-07, "loss": 0.8005, "step": 39621 }, { "epoch": 0.75, "learning_rate": 7.901785451316096e-07, "loss": 0.8123, "step": 39622 }, { "epoch": 0.75, "learning_rate": 7.900670983864145e-07, "loss": 0.7839, "step": 39623 }, { "epoch": 0.75, "learning_rate": 7.899556580260573e-07, "loss": 0.9542, "step": 39624 }, { "epoch": 0.75, "learning_rate": 7.898442240509515e-07, "loss": 1.0894, "step": 39625 }, { "epoch": 0.75, "learning_rate": 7.897327964615167e-07, "loss": 0.9051, "step": 39626 }, { "epoch": 0.75, "learning_rate": 7.896213752581664e-07, "loss": 0.9633, "step": 39627 }, { "epoch": 0.75, "learning_rate": 7.895099604413176e-07, "loss": 0.7599, "step": 39628 }, { "epoch": 0.75, "learning_rate": 7.893985520113859e-07, "loss": 0.8994, "step": 39629 }, { "epoch": 0.75, "learning_rate": 7.892871499687877e-07, "loss": 0.9131, "step": 39630 }, { "epoch": 0.75, "learning_rate": 7.891757543139386e-07, "loss": 0.8629, "step": 39631 }, { "epoch": 0.75, "learning_rate": 7.890643650472549e-07, "loss": 0.9575, "step": 39632 }, { "epoch": 0.75, "learning_rate": 7.889529821691533e-07, "loss": 0.7769, "step": 39633 }, { "epoch": 0.75, "learning_rate": 7.888416056800472e-07, "loss": 0.8095, "step": 39634 }, { "epoch": 0.75, "learning_rate": 7.887302355803547e-07, "loss": 0.9171, "step": 39635 }, { "epoch": 0.75, "learning_rate": 7.886188718704921e-07, "loss": 0.9077, "step": 39636 }, { "epoch": 0.75, "learning_rate": 7.885075145508722e-07, "loss": 1.1169, "step": 39637 }, { "epoch": 0.75, "learning_rate": 7.883961636219148e-07, "loss": 0.971, "step": 39638 }, { "epoch": 0.75, "learning_rate": 7.882848190840326e-07, "loss": 0.8204, "step": 39639 }, { "epoch": 0.75, "learning_rate": 7.881734809376424e-07, "loss": 0.9337, "step": 39640 }, { "epoch": 0.75, "learning_rate": 7.8806214918316e-07, "loss": 0.9788, "step": 39641 }, { "epoch": 0.75, "learning_rate": 7.87950823821001e-07, "loss": 0.9283, "step": 39642 }, { "epoch": 0.75, "learning_rate": 7.87839504851581e-07, "loss": 1.063, "step": 39643 }, { "epoch": 0.75, "learning_rate": 7.877281922753161e-07, "loss": 1.0473, "step": 39644 }, { "epoch": 0.75, "learning_rate": 7.876168860926222e-07, "loss": 0.938, "step": 39645 }, { "epoch": 0.75, "learning_rate": 7.875055863039127e-07, "loss": 0.8811, "step": 39646 }, { "epoch": 0.75, "learning_rate": 7.873942929096068e-07, "loss": 0.7809, "step": 39647 }, { "epoch": 0.75, "learning_rate": 7.872830059101169e-07, "loss": 0.6818, "step": 39648 }, { "epoch": 0.75, "learning_rate": 7.8717172530586e-07, "loss": 0.9319, "step": 39649 }, { "epoch": 0.75, "learning_rate": 7.870604510972513e-07, "loss": 1.2059, "step": 39650 }, { "epoch": 0.75, "learning_rate": 7.869491832847062e-07, "loss": 0.8963, "step": 39651 }, { "epoch": 0.75, "learning_rate": 7.868379218686403e-07, "loss": 0.8217, "step": 39652 }, { "epoch": 0.75, "learning_rate": 7.867266668494694e-07, "loss": 0.9326, "step": 39653 }, { "epoch": 0.75, "learning_rate": 7.866154182276092e-07, "loss": 0.8064, "step": 39654 }, { "epoch": 0.75, "learning_rate": 7.865041760034727e-07, "loss": 0.9524, "step": 39655 }, { "epoch": 0.75, "learning_rate": 7.863929401774781e-07, "loss": 0.9944, "step": 39656 }, { "epoch": 0.75, "learning_rate": 7.862817107500406e-07, "loss": 0.9868, "step": 39657 }, { "epoch": 0.75, "learning_rate": 7.861704877215728e-07, "loss": 0.7974, "step": 39658 }, { "epoch": 0.75, "learning_rate": 7.860592710924938e-07, "loss": 0.8383, "step": 39659 }, { "epoch": 0.75, "learning_rate": 7.859480608632159e-07, "loss": 0.7363, "step": 39660 }, { "epoch": 0.75, "learning_rate": 7.858368570341554e-07, "loss": 0.9268, "step": 39661 }, { "epoch": 0.75, "learning_rate": 7.857256596057275e-07, "loss": 0.8702, "step": 39662 }, { "epoch": 0.75, "learning_rate": 7.856144685783473e-07, "loss": 1.1407, "step": 39663 }, { "epoch": 0.75, "learning_rate": 7.855032839524304e-07, "loss": 0.9655, "step": 39664 }, { "epoch": 0.75, "learning_rate": 7.853921057283915e-07, "loss": 0.853, "step": 39665 }, { "epoch": 0.75, "learning_rate": 7.852809339066467e-07, "loss": 0.7092, "step": 39666 }, { "epoch": 0.75, "learning_rate": 7.851697684876089e-07, "loss": 0.7231, "step": 39667 }, { "epoch": 0.75, "learning_rate": 7.850586094716961e-07, "loss": 1.0155, "step": 39668 }, { "epoch": 0.75, "learning_rate": 7.84947456859321e-07, "loss": 0.9635, "step": 39669 }, { "epoch": 0.75, "learning_rate": 7.848363106508994e-07, "loss": 0.8669, "step": 39670 }, { "epoch": 0.75, "learning_rate": 7.847251708468467e-07, "loss": 0.8299, "step": 39671 }, { "epoch": 0.75, "learning_rate": 7.846140374475775e-07, "loss": 0.8925, "step": 39672 }, { "epoch": 0.75, "learning_rate": 7.845029104535068e-07, "loss": 0.9129, "step": 39673 }, { "epoch": 0.75, "learning_rate": 7.843917898650497e-07, "loss": 0.7946, "step": 39674 }, { "epoch": 0.75, "learning_rate": 7.842806756826219e-07, "loss": 1.1935, "step": 39675 }, { "epoch": 0.75, "learning_rate": 7.841695679066358e-07, "loss": 0.7988, "step": 39676 }, { "epoch": 0.75, "learning_rate": 7.840584665375086e-07, "loss": 0.8914, "step": 39677 }, { "epoch": 0.75, "learning_rate": 7.839473715756557e-07, "loss": 0.9272, "step": 39678 }, { "epoch": 0.75, "learning_rate": 7.838362830214888e-07, "loss": 1.0432, "step": 39679 }, { "epoch": 0.75, "learning_rate": 7.837252008754262e-07, "loss": 1.1257, "step": 39680 }, { "epoch": 0.75, "learning_rate": 7.836141251378803e-07, "loss": 1.0646, "step": 39681 }, { "epoch": 0.75, "learning_rate": 7.835030558092666e-07, "loss": 0.9425, "step": 39682 }, { "epoch": 0.75, "learning_rate": 7.833919928899999e-07, "loss": 0.9738, "step": 39683 }, { "epoch": 0.75, "learning_rate": 7.83280936380495e-07, "loss": 1.0405, "step": 39684 }, { "epoch": 0.75, "learning_rate": 7.831698862811662e-07, "loss": 0.8866, "step": 39685 }, { "epoch": 0.75, "learning_rate": 7.830588425924285e-07, "loss": 0.81, "step": 39686 }, { "epoch": 0.75, "learning_rate": 7.829478053146971e-07, "loss": 1.1948, "step": 39687 }, { "epoch": 0.75, "learning_rate": 7.828367744483848e-07, "loss": 0.9426, "step": 39688 }, { "epoch": 0.75, "learning_rate": 7.827257499939084e-07, "loss": 0.8737, "step": 39689 }, { "epoch": 0.75, "learning_rate": 7.826147319516808e-07, "loss": 0.6778, "step": 39690 }, { "epoch": 0.75, "learning_rate": 7.825037203221173e-07, "loss": 0.7079, "step": 39691 }, { "epoch": 0.75, "learning_rate": 7.823927151056321e-07, "loss": 0.9786, "step": 39692 }, { "epoch": 0.75, "learning_rate": 7.822817163026398e-07, "loss": 1.1531, "step": 39693 }, { "epoch": 0.75, "learning_rate": 7.821707239135551e-07, "loss": 0.9962, "step": 39694 }, { "epoch": 0.75, "learning_rate": 7.820597379387921e-07, "loss": 0.9221, "step": 39695 }, { "epoch": 0.75, "learning_rate": 7.819487583787661e-07, "loss": 0.845, "step": 39696 }, { "epoch": 0.75, "learning_rate": 7.818377852338893e-07, "loss": 0.9521, "step": 39697 }, { "epoch": 0.75, "learning_rate": 7.817268185045781e-07, "loss": 0.9491, "step": 39698 }, { "epoch": 0.75, "learning_rate": 7.816158581912472e-07, "loss": 0.8788, "step": 39699 }, { "epoch": 0.75, "learning_rate": 7.815049042943084e-07, "loss": 1.2192, "step": 39700 }, { "epoch": 0.75, "learning_rate": 7.813939568141793e-07, "loss": 1.0079, "step": 39701 }, { "epoch": 0.75, "learning_rate": 7.812830157512716e-07, "loss": 0.8704, "step": 39702 }, { "epoch": 0.75, "learning_rate": 7.811720811060005e-07, "loss": 0.6707, "step": 39703 }, { "epoch": 0.75, "learning_rate": 7.810611528787801e-07, "loss": 0.7059, "step": 39704 }, { "epoch": 0.75, "learning_rate": 7.809502310700245e-07, "loss": 0.9818, "step": 39705 }, { "epoch": 0.75, "learning_rate": 7.808393156801483e-07, "loss": 0.7846, "step": 39706 }, { "epoch": 0.75, "learning_rate": 7.807284067095652e-07, "loss": 1.0594, "step": 39707 }, { "epoch": 0.75, "learning_rate": 7.806175041586902e-07, "loss": 0.7773, "step": 39708 }, { "epoch": 0.75, "learning_rate": 7.805066080279356e-07, "loss": 1.011, "step": 39709 }, { "epoch": 0.75, "learning_rate": 7.803957183177177e-07, "loss": 0.8545, "step": 39710 }, { "epoch": 0.75, "learning_rate": 7.802848350284489e-07, "loss": 0.8193, "step": 39711 }, { "epoch": 0.75, "learning_rate": 7.801739581605439e-07, "loss": 1.2236, "step": 39712 }, { "epoch": 0.75, "learning_rate": 7.800630877144164e-07, "loss": 0.9802, "step": 39713 }, { "epoch": 0.75, "learning_rate": 7.799522236904805e-07, "loss": 1.1652, "step": 39714 }, { "epoch": 0.75, "learning_rate": 7.798413660891505e-07, "loss": 0.7214, "step": 39715 }, { "epoch": 0.75, "learning_rate": 7.7973051491084e-07, "loss": 0.793, "step": 39716 }, { "epoch": 0.75, "learning_rate": 7.796196701559639e-07, "loss": 0.8792, "step": 39717 }, { "epoch": 0.75, "learning_rate": 7.795088318249333e-07, "loss": 0.9988, "step": 39718 }, { "epoch": 0.75, "learning_rate": 7.79397999918165e-07, "loss": 0.9992, "step": 39719 }, { "epoch": 0.75, "learning_rate": 7.792871744360727e-07, "loss": 0.8786, "step": 39720 }, { "epoch": 0.75, "learning_rate": 7.791763553790677e-07, "loss": 0.8714, "step": 39721 }, { "epoch": 0.75, "learning_rate": 7.790655427475669e-07, "loss": 0.872, "step": 39722 }, { "epoch": 0.75, "learning_rate": 7.78954736541982e-07, "loss": 0.8638, "step": 39723 }, { "epoch": 0.75, "learning_rate": 7.788439367627271e-07, "loss": 0.874, "step": 39724 }, { "epoch": 0.75, "learning_rate": 7.787331434102164e-07, "loss": 0.941, "step": 39725 }, { "epoch": 0.75, "learning_rate": 7.78622356484863e-07, "loss": 1.0547, "step": 39726 }, { "epoch": 0.75, "learning_rate": 7.785115759870813e-07, "loss": 0.6763, "step": 39727 }, { "epoch": 0.75, "learning_rate": 7.784008019172845e-07, "loss": 1.1216, "step": 39728 }, { "epoch": 0.75, "learning_rate": 7.78290034275887e-07, "loss": 0.7824, "step": 39729 }, { "epoch": 0.75, "learning_rate": 7.781792730633004e-07, "loss": 0.769, "step": 39730 }, { "epoch": 0.75, "learning_rate": 7.780685182799411e-07, "loss": 0.981, "step": 39731 }, { "epoch": 0.75, "learning_rate": 7.779577699262203e-07, "loss": 1.0001, "step": 39732 }, { "epoch": 0.75, "learning_rate": 7.778470280025521e-07, "loss": 0.7509, "step": 39733 }, { "epoch": 0.75, "learning_rate": 7.777362925093507e-07, "loss": 0.7846, "step": 39734 }, { "epoch": 0.75, "learning_rate": 7.776255634470289e-07, "loss": 0.8773, "step": 39735 }, { "epoch": 0.75, "learning_rate": 7.775148408160007e-07, "loss": 0.9434, "step": 39736 }, { "epoch": 0.75, "learning_rate": 7.774041246166792e-07, "loss": 1.1475, "step": 39737 }, { "epoch": 0.75, "learning_rate": 7.772934148494787e-07, "loss": 0.9147, "step": 39738 }, { "epoch": 0.75, "learning_rate": 7.7718271151481e-07, "loss": 0.932, "step": 39739 }, { "epoch": 0.75, "learning_rate": 7.770720146130892e-07, "loss": 0.9323, "step": 39740 }, { "epoch": 0.75, "learning_rate": 7.769613241447294e-07, "loss": 0.8119, "step": 39741 }, { "epoch": 0.75, "learning_rate": 7.768506401101416e-07, "loss": 0.7565, "step": 39742 }, { "epoch": 0.75, "learning_rate": 7.767399625097421e-07, "loss": 1.0878, "step": 39743 }, { "epoch": 0.75, "learning_rate": 7.766292913439424e-07, "loss": 1.1115, "step": 39744 }, { "epoch": 0.75, "learning_rate": 7.765186266131558e-07, "loss": 0.991, "step": 39745 }, { "epoch": 0.75, "learning_rate": 7.764079683177958e-07, "loss": 0.7304, "step": 39746 }, { "epoch": 0.75, "learning_rate": 7.762973164582754e-07, "loss": 0.811, "step": 39747 }, { "epoch": 0.75, "learning_rate": 7.761866710350083e-07, "loss": 0.7963, "step": 39748 }, { "epoch": 0.75, "learning_rate": 7.760760320484074e-07, "loss": 1.1315, "step": 39749 }, { "epoch": 0.75, "learning_rate": 7.759653994988861e-07, "loss": 1.0956, "step": 39750 }, { "epoch": 0.75, "learning_rate": 7.758547733868557e-07, "loss": 0.9485, "step": 39751 }, { "epoch": 0.75, "learning_rate": 7.757441537127325e-07, "loss": 1.0072, "step": 39752 }, { "epoch": 0.75, "learning_rate": 7.756335404769269e-07, "loss": 0.7375, "step": 39753 }, { "epoch": 0.75, "learning_rate": 7.755229336798528e-07, "loss": 0.8464, "step": 39754 }, { "epoch": 0.75, "learning_rate": 7.75412333321923e-07, "loss": 0.7607, "step": 39755 }, { "epoch": 0.75, "learning_rate": 7.753017394035508e-07, "loss": 1.0458, "step": 39756 }, { "epoch": 0.75, "learning_rate": 7.75191151925149e-07, "loss": 0.876, "step": 39757 }, { "epoch": 0.75, "learning_rate": 7.750805708871307e-07, "loss": 0.8215, "step": 39758 }, { "epoch": 0.75, "learning_rate": 7.749699962899093e-07, "loss": 0.8548, "step": 39759 }, { "epoch": 0.75, "learning_rate": 7.748594281338956e-07, "loss": 1.0393, "step": 39760 }, { "epoch": 0.75, "learning_rate": 7.747488664195044e-07, "loss": 0.9459, "step": 39761 }, { "epoch": 0.75, "learning_rate": 7.746383111471492e-07, "loss": 0.9215, "step": 39762 }, { "epoch": 0.75, "learning_rate": 7.745277623172399e-07, "loss": 0.8168, "step": 39763 }, { "epoch": 0.75, "learning_rate": 7.744172199301925e-07, "loss": 0.9078, "step": 39764 }, { "epoch": 0.75, "learning_rate": 7.743066839864178e-07, "loss": 0.9184, "step": 39765 }, { "epoch": 0.75, "learning_rate": 7.741961544863286e-07, "loss": 0.7768, "step": 39766 }, { "epoch": 0.75, "learning_rate": 7.740856314303383e-07, "loss": 0.8618, "step": 39767 }, { "epoch": 0.75, "learning_rate": 7.739751148188593e-07, "loss": 1.1354, "step": 39768 }, { "epoch": 0.75, "learning_rate": 7.738646046523044e-07, "loss": 1.0381, "step": 39769 }, { "epoch": 0.75, "learning_rate": 7.737541009310859e-07, "loss": 1.0535, "step": 39770 }, { "epoch": 0.75, "learning_rate": 7.736436036556178e-07, "loss": 0.7838, "step": 39771 }, { "epoch": 0.75, "learning_rate": 7.735331128263096e-07, "loss": 0.8213, "step": 39772 }, { "epoch": 0.75, "learning_rate": 7.734226284435775e-07, "loss": 0.8717, "step": 39773 }, { "epoch": 0.75, "learning_rate": 7.733121505078317e-07, "loss": 0.8789, "step": 39774 }, { "epoch": 0.75, "learning_rate": 7.732016790194855e-07, "loss": 0.9702, "step": 39775 }, { "epoch": 0.75, "learning_rate": 7.73091213978951e-07, "loss": 0.9959, "step": 39776 }, { "epoch": 0.75, "learning_rate": 7.729807553866411e-07, "loss": 0.8506, "step": 39777 }, { "epoch": 0.75, "learning_rate": 7.72870303242968e-07, "loss": 0.9184, "step": 39778 }, { "epoch": 0.75, "learning_rate": 7.727598575483445e-07, "loss": 0.7831, "step": 39779 }, { "epoch": 0.75, "learning_rate": 7.726494183031832e-07, "loss": 0.8586, "step": 39780 }, { "epoch": 0.75, "learning_rate": 7.725389855078946e-07, "loss": 1.1478, "step": 39781 }, { "epoch": 0.75, "learning_rate": 7.724285591628933e-07, "loss": 0.9877, "step": 39782 }, { "epoch": 0.75, "learning_rate": 7.723181392685917e-07, "loss": 0.9977, "step": 39783 }, { "epoch": 0.75, "learning_rate": 7.722077258253994e-07, "loss": 0.8606, "step": 39784 }, { "epoch": 0.75, "learning_rate": 7.720973188337319e-07, "loss": 0.8571, "step": 39785 }, { "epoch": 0.75, "learning_rate": 7.719869182939996e-07, "loss": 0.7943, "step": 39786 }, { "epoch": 0.75, "learning_rate": 7.718765242066148e-07, "loss": 1.2585, "step": 39787 }, { "epoch": 0.75, "learning_rate": 7.717661365719903e-07, "loss": 1.1129, "step": 39788 }, { "epoch": 0.75, "learning_rate": 7.71655755390538e-07, "loss": 0.9604, "step": 39789 }, { "epoch": 0.75, "learning_rate": 7.715453806626702e-07, "loss": 0.9283, "step": 39790 }, { "epoch": 0.75, "learning_rate": 7.71435012388799e-07, "loss": 0.8056, "step": 39791 }, { "epoch": 0.75, "learning_rate": 7.71324650569337e-07, "loss": 0.7853, "step": 39792 }, { "epoch": 0.75, "learning_rate": 7.712142952046944e-07, "loss": 0.77, "step": 39793 }, { "epoch": 0.75, "learning_rate": 7.71103946295286e-07, "loss": 1.0745, "step": 39794 }, { "epoch": 0.75, "learning_rate": 7.709936038415219e-07, "loss": 0.9629, "step": 39795 }, { "epoch": 0.75, "learning_rate": 7.708832678438144e-07, "loss": 0.8862, "step": 39796 }, { "epoch": 0.75, "learning_rate": 7.707729383025761e-07, "loss": 0.789, "step": 39797 }, { "epoch": 0.75, "learning_rate": 7.706626152182183e-07, "loss": 0.7315, "step": 39798 }, { "epoch": 0.75, "learning_rate": 7.705522985911535e-07, "loss": 1.0861, "step": 39799 }, { "epoch": 0.75, "learning_rate": 7.704419884217931e-07, "loss": 0.9273, "step": 39800 }, { "epoch": 0.75, "learning_rate": 7.703316847105504e-07, "loss": 0.7995, "step": 39801 }, { "epoch": 0.75, "learning_rate": 7.702213874578354e-07, "loss": 0.7931, "step": 39802 }, { "epoch": 0.75, "learning_rate": 7.701110966640596e-07, "loss": 0.9898, "step": 39803 }, { "epoch": 0.75, "learning_rate": 7.700008123296376e-07, "loss": 1.1011, "step": 39804 }, { "epoch": 0.75, "learning_rate": 7.69890534454979e-07, "loss": 1.012, "step": 39805 }, { "epoch": 0.75, "learning_rate": 7.697802630404957e-07, "loss": 1.2843, "step": 39806 }, { "epoch": 0.75, "learning_rate": 7.696699980866001e-07, "loss": 0.8727, "step": 39807 }, { "epoch": 0.75, "learning_rate": 7.695597395937038e-07, "loss": 0.8078, "step": 39808 }, { "epoch": 0.75, "learning_rate": 7.69449487562218e-07, "loss": 0.714, "step": 39809 }, { "epoch": 0.75, "learning_rate": 7.693392419925549e-07, "loss": 0.9609, "step": 39810 }, { "epoch": 0.75, "learning_rate": 7.692290028851271e-07, "loss": 0.8109, "step": 39811 }, { "epoch": 0.75, "learning_rate": 7.691187702403432e-07, "loss": 1.1293, "step": 39812 }, { "epoch": 0.75, "learning_rate": 7.690085440586184e-07, "loss": 1.0125, "step": 39813 }, { "epoch": 0.75, "learning_rate": 7.688983243403619e-07, "loss": 0.8224, "step": 39814 }, { "epoch": 0.75, "learning_rate": 7.68788111085986e-07, "loss": 0.9532, "step": 39815 }, { "epoch": 0.75, "learning_rate": 7.686779042959022e-07, "loss": 1.0839, "step": 39816 }, { "epoch": 0.75, "learning_rate": 7.68567703970522e-07, "loss": 0.8064, "step": 39817 }, { "epoch": 0.75, "learning_rate": 7.684575101102568e-07, "loss": 1.0123, "step": 39818 }, { "epoch": 0.75, "learning_rate": 7.683473227155183e-07, "loss": 1.0593, "step": 39819 }, { "epoch": 0.75, "learning_rate": 7.682371417867184e-07, "loss": 0.9947, "step": 39820 }, { "epoch": 0.75, "learning_rate": 7.681269673242667e-07, "loss": 0.7527, "step": 39821 }, { "epoch": 0.75, "learning_rate": 7.680167993285769e-07, "loss": 1.0001, "step": 39822 }, { "epoch": 0.75, "learning_rate": 7.679066378000589e-07, "loss": 0.75, "step": 39823 }, { "epoch": 0.75, "learning_rate": 7.677964827391235e-07, "loss": 0.8578, "step": 39824 }, { "epoch": 0.75, "learning_rate": 7.676863341461843e-07, "loss": 1.1781, "step": 39825 }, { "epoch": 0.75, "learning_rate": 7.675761920216507e-07, "loss": 0.9064, "step": 39826 }, { "epoch": 0.75, "learning_rate": 7.674660563659342e-07, "loss": 0.8694, "step": 39827 }, { "epoch": 0.75, "learning_rate": 7.673559271794467e-07, "loss": 0.9999, "step": 39828 }, { "epoch": 0.75, "learning_rate": 7.672458044625989e-07, "loss": 0.722, "step": 39829 }, { "epoch": 0.75, "learning_rate": 7.671356882158018e-07, "loss": 1.0156, "step": 39830 }, { "epoch": 0.75, "learning_rate": 7.670255784394673e-07, "loss": 1.136, "step": 39831 }, { "epoch": 0.75, "learning_rate": 7.669154751340069e-07, "loss": 1.0277, "step": 39832 }, { "epoch": 0.75, "learning_rate": 7.668053782998292e-07, "loss": 0.8854, "step": 39833 }, { "epoch": 0.75, "learning_rate": 7.666952879373487e-07, "loss": 0.9157, "step": 39834 }, { "epoch": 0.75, "learning_rate": 7.665852040469743e-07, "loss": 0.9515, "step": 39835 }, { "epoch": 0.75, "learning_rate": 7.664751266291173e-07, "loss": 0.6885, "step": 39836 }, { "epoch": 0.75, "learning_rate": 7.663650556841892e-07, "loss": 1.2335, "step": 39837 }, { "epoch": 0.75, "learning_rate": 7.662549912126008e-07, "loss": 1.0179, "step": 39838 }, { "epoch": 0.75, "learning_rate": 7.661449332147633e-07, "loss": 0.9217, "step": 39839 }, { "epoch": 0.75, "learning_rate": 7.66034881691087e-07, "loss": 0.8209, "step": 39840 }, { "epoch": 0.75, "learning_rate": 7.659248366419844e-07, "loss": 0.8467, "step": 39841 }, { "epoch": 0.75, "learning_rate": 7.658147980678638e-07, "loss": 0.9292, "step": 39842 }, { "epoch": 0.75, "learning_rate": 7.657047659691388e-07, "loss": 0.9814, "step": 39843 }, { "epoch": 0.75, "learning_rate": 7.655947403462186e-07, "loss": 1.0168, "step": 39844 }, { "epoch": 0.75, "learning_rate": 7.654847211995134e-07, "loss": 0.8347, "step": 39845 }, { "epoch": 0.75, "learning_rate": 7.653747085294369e-07, "loss": 0.8469, "step": 39846 }, { "epoch": 0.75, "learning_rate": 7.652647023363971e-07, "loss": 0.8129, "step": 39847 }, { "epoch": 0.75, "learning_rate": 7.651547026208059e-07, "loss": 0.9136, "step": 39848 }, { "epoch": 0.75, "learning_rate": 7.650447093830735e-07, "loss": 0.8616, "step": 39849 }, { "epoch": 0.75, "learning_rate": 7.649347226236112e-07, "loss": 0.9913, "step": 39850 }, { "epoch": 0.75, "learning_rate": 7.648247423428293e-07, "loss": 0.7893, "step": 39851 }, { "epoch": 0.75, "learning_rate": 7.647147685411388e-07, "loss": 0.9669, "step": 39852 }, { "epoch": 0.75, "learning_rate": 7.646048012189508e-07, "loss": 0.9894, "step": 39853 }, { "epoch": 0.75, "learning_rate": 7.644948403766738e-07, "loss": 0.8391, "step": 39854 }, { "epoch": 0.75, "learning_rate": 7.643848860147213e-07, "loss": 0.9492, "step": 39855 }, { "epoch": 0.75, "learning_rate": 7.642749381335019e-07, "loss": 1.173, "step": 39856 }, { "epoch": 0.75, "learning_rate": 7.641649967334263e-07, "loss": 0.9214, "step": 39857 }, { "epoch": 0.75, "learning_rate": 7.640550618149057e-07, "loss": 0.7864, "step": 39858 }, { "epoch": 0.75, "learning_rate": 7.639451333783499e-07, "loss": 0.8722, "step": 39859 }, { "epoch": 0.75, "learning_rate": 7.638352114241701e-07, "loss": 0.9858, "step": 39860 }, { "epoch": 0.75, "learning_rate": 7.637252959527761e-07, "loss": 0.9267, "step": 39861 }, { "epoch": 0.75, "learning_rate": 7.636153869645796e-07, "loss": 1.1796, "step": 39862 }, { "epoch": 0.75, "learning_rate": 7.635054844599884e-07, "loss": 0.9189, "step": 39863 }, { "epoch": 0.75, "learning_rate": 7.633955884394159e-07, "loss": 0.8525, "step": 39864 }, { "epoch": 0.75, "learning_rate": 7.632856989032705e-07, "loss": 0.7562, "step": 39865 }, { "epoch": 0.75, "learning_rate": 7.63175815851962e-07, "loss": 0.9846, "step": 39866 }, { "epoch": 0.75, "learning_rate": 7.630659392859035e-07, "loss": 0.8895, "step": 39867 }, { "epoch": 0.75, "learning_rate": 7.629560692055027e-07, "loss": 1.0398, "step": 39868 }, { "epoch": 0.75, "learning_rate": 7.628462056111707e-07, "loss": 0.9963, "step": 39869 }, { "epoch": 0.75, "learning_rate": 7.627363485033176e-07, "loss": 0.8611, "step": 39870 }, { "epoch": 0.75, "learning_rate": 7.626264978823539e-07, "loss": 0.8328, "step": 39871 }, { "epoch": 0.75, "learning_rate": 7.625166537486894e-07, "loss": 0.8004, "step": 39872 }, { "epoch": 0.75, "learning_rate": 7.624068161027346e-07, "loss": 0.7769, "step": 39873 }, { "epoch": 0.75, "learning_rate": 7.622969849449003e-07, "loss": 0.8401, "step": 39874 }, { "epoch": 0.75, "learning_rate": 7.62187160275594e-07, "loss": 1.1828, "step": 39875 }, { "epoch": 0.75, "learning_rate": 7.620773420952293e-07, "loss": 0.8096, "step": 39876 }, { "epoch": 0.75, "learning_rate": 7.619675304042135e-07, "loss": 0.8115, "step": 39877 }, { "epoch": 0.75, "learning_rate": 7.61857725202958e-07, "loss": 0.9673, "step": 39878 }, { "epoch": 0.75, "learning_rate": 7.61747926491872e-07, "loss": 0.6845, "step": 39879 }, { "epoch": 0.75, "learning_rate": 7.616381342713664e-07, "loss": 0.9503, "step": 39880 }, { "epoch": 0.75, "learning_rate": 7.615283485418503e-07, "loss": 1.1609, "step": 39881 }, { "epoch": 0.75, "learning_rate": 7.614185693037343e-07, "loss": 1.1509, "step": 39882 }, { "epoch": 0.75, "learning_rate": 7.61308796557429e-07, "loss": 0.8243, "step": 39883 }, { "epoch": 0.75, "learning_rate": 7.611990303033414e-07, "loss": 0.8268, "step": 39884 }, { "epoch": 0.75, "learning_rate": 7.610892705418851e-07, "loss": 0.6367, "step": 39885 }, { "epoch": 0.75, "learning_rate": 7.609795172734674e-07, "loss": 0.9626, "step": 39886 }, { "epoch": 0.75, "learning_rate": 7.60869770498498e-07, "loss": 0.8977, "step": 39887 }, { "epoch": 0.75, "learning_rate": 7.607600302173893e-07, "loss": 0.9238, "step": 39888 }, { "epoch": 0.75, "learning_rate": 7.606502964305482e-07, "loss": 1.0209, "step": 39889 }, { "epoch": 0.75, "learning_rate": 7.605405691383858e-07, "loss": 0.977, "step": 39890 }, { "epoch": 0.75, "learning_rate": 7.604308483413114e-07, "loss": 0.8396, "step": 39891 }, { "epoch": 0.75, "learning_rate": 7.603211340397351e-07, "loss": 0.8413, "step": 39892 }, { "epoch": 0.75, "learning_rate": 7.602114262340662e-07, "loss": 1.2389, "step": 39893 }, { "epoch": 0.75, "learning_rate": 7.601017249247145e-07, "loss": 1.0503, "step": 39894 }, { "epoch": 0.75, "learning_rate": 7.599920301120902e-07, "loss": 0.9085, "step": 39895 }, { "epoch": 0.75, "learning_rate": 7.598823417966012e-07, "loss": 0.972, "step": 39896 }, { "epoch": 0.75, "learning_rate": 7.597726599786595e-07, "loss": 0.7976, "step": 39897 }, { "epoch": 0.75, "learning_rate": 7.596629846586726e-07, "loss": 0.767, "step": 39898 }, { "epoch": 0.75, "learning_rate": 7.595533158370505e-07, "loss": 1.0459, "step": 39899 }, { "epoch": 0.75, "learning_rate": 7.594436535142033e-07, "loss": 0.8519, "step": 39900 }, { "epoch": 0.75, "learning_rate": 7.593339976905401e-07, "loss": 0.8139, "step": 39901 }, { "epoch": 0.75, "learning_rate": 7.592243483664702e-07, "loss": 0.7834, "step": 39902 }, { "epoch": 0.75, "learning_rate": 7.591147055424033e-07, "loss": 0.9274, "step": 39903 }, { "epoch": 0.75, "learning_rate": 7.590050692187495e-07, "loss": 0.9774, "step": 39904 }, { "epoch": 0.75, "learning_rate": 7.588954393959158e-07, "loss": 1.0023, "step": 39905 }, { "epoch": 0.75, "learning_rate": 7.587858160743147e-07, "loss": 0.9994, "step": 39906 }, { "epoch": 0.75, "learning_rate": 7.586761992543532e-07, "loss": 0.9096, "step": 39907 }, { "epoch": 0.75, "learning_rate": 7.585665889364405e-07, "loss": 0.9519, "step": 39908 }, { "epoch": 0.75, "learning_rate": 7.584569851209885e-07, "loss": 0.801, "step": 39909 }, { "epoch": 0.75, "learning_rate": 7.583473878084039e-07, "loss": 0.8589, "step": 39910 }, { "epoch": 0.75, "learning_rate": 7.582377969990967e-07, "loss": 0.8022, "step": 39911 }, { "epoch": 0.75, "learning_rate": 7.581282126934764e-07, "loss": 1.0256, "step": 39912 }, { "epoch": 0.75, "learning_rate": 7.580186348919516e-07, "loss": 1.04, "step": 39913 }, { "epoch": 0.75, "learning_rate": 7.579090635949318e-07, "loss": 0.7925, "step": 39914 }, { "epoch": 0.75, "learning_rate": 7.577994988028265e-07, "loss": 0.8446, "step": 39915 }, { "epoch": 0.75, "learning_rate": 7.576899405160449e-07, "loss": 0.8425, "step": 39916 }, { "epoch": 0.75, "learning_rate": 7.575803887349942e-07, "loss": 1.0538, "step": 39917 }, { "epoch": 0.75, "learning_rate": 7.574708434600867e-07, "loss": 1.1781, "step": 39918 }, { "epoch": 0.75, "learning_rate": 7.573613046917286e-07, "loss": 0.9939, "step": 39919 }, { "epoch": 0.75, "learning_rate": 7.572517724303299e-07, "loss": 0.897, "step": 39920 }, { "epoch": 0.75, "learning_rate": 7.571422466762999e-07, "loss": 0.9312, "step": 39921 }, { "epoch": 0.75, "learning_rate": 7.57032727430047e-07, "loss": 1.0027, "step": 39922 }, { "epoch": 0.75, "learning_rate": 7.569232146919805e-07, "loss": 0.8049, "step": 39923 }, { "epoch": 0.75, "learning_rate": 7.568137084625094e-07, "loss": 0.7871, "step": 39924 }, { "epoch": 0.75, "learning_rate": 7.567042087420434e-07, "loss": 0.9482, "step": 39925 }, { "epoch": 0.75, "learning_rate": 7.565947155309885e-07, "loss": 0.8667, "step": 39926 }, { "epoch": 0.75, "learning_rate": 7.564852288297573e-07, "loss": 0.7633, "step": 39927 }, { "epoch": 0.75, "learning_rate": 7.56375748638756e-07, "loss": 0.9057, "step": 39928 }, { "epoch": 0.75, "learning_rate": 7.562662749583934e-07, "loss": 0.821, "step": 39929 }, { "epoch": 0.75, "learning_rate": 7.561568077890804e-07, "loss": 0.7768, "step": 39930 }, { "epoch": 0.75, "learning_rate": 7.560473471312241e-07, "loss": 1.0215, "step": 39931 }, { "epoch": 0.75, "learning_rate": 7.559378929852332e-07, "loss": 0.8025, "step": 39932 }, { "epoch": 0.75, "learning_rate": 7.558284453515169e-07, "loss": 1.0193, "step": 39933 }, { "epoch": 0.75, "learning_rate": 7.557190042304835e-07, "loss": 0.8477, "step": 39934 }, { "epoch": 0.75, "learning_rate": 7.556095696225418e-07, "loss": 1.0115, "step": 39935 }, { "epoch": 0.75, "learning_rate": 7.555001415281008e-07, "loss": 0.9953, "step": 39936 }, { "epoch": 0.75, "learning_rate": 7.553907199475693e-07, "loss": 1.0267, "step": 39937 }, { "epoch": 0.75, "learning_rate": 7.55281304881354e-07, "loss": 0.8026, "step": 39938 }, { "epoch": 0.75, "learning_rate": 7.551718963298663e-07, "loss": 0.963, "step": 39939 }, { "epoch": 0.75, "learning_rate": 7.550624942935126e-07, "loss": 0.98, "step": 39940 }, { "epoch": 0.75, "learning_rate": 7.549530987727019e-07, "loss": 0.8004, "step": 39941 }, { "epoch": 0.75, "learning_rate": 7.548437097678427e-07, "loss": 0.8847, "step": 39942 }, { "epoch": 0.75, "learning_rate": 7.547343272793437e-07, "loss": 0.91, "step": 39943 }, { "epoch": 0.75, "learning_rate": 7.546249513076132e-07, "loss": 0.8928, "step": 39944 }, { "epoch": 0.75, "learning_rate": 7.545155818530597e-07, "loss": 0.9131, "step": 39945 }, { "epoch": 0.75, "learning_rate": 7.544062189160922e-07, "loss": 0.6903, "step": 39946 }, { "epoch": 0.75, "learning_rate": 7.542968624971167e-07, "loss": 0.8394, "step": 39947 }, { "epoch": 0.75, "learning_rate": 7.54187512596545e-07, "loss": 0.8573, "step": 39948 }, { "epoch": 0.75, "learning_rate": 7.540781692147825e-07, "loss": 0.8335, "step": 39949 }, { "epoch": 0.75, "learning_rate": 7.539688323522381e-07, "loss": 1.1243, "step": 39950 }, { "epoch": 0.75, "learning_rate": 7.53859502009322e-07, "loss": 0.9106, "step": 39951 }, { "epoch": 0.75, "learning_rate": 7.537501781864401e-07, "loss": 1.0378, "step": 39952 }, { "epoch": 0.75, "learning_rate": 7.536408608840016e-07, "loss": 1.1378, "step": 39953 }, { "epoch": 0.75, "learning_rate": 7.535315501024146e-07, "loss": 0.6926, "step": 39954 }, { "epoch": 0.75, "learning_rate": 7.534222458420873e-07, "loss": 0.9025, "step": 39955 }, { "epoch": 0.75, "learning_rate": 7.533129481034276e-07, "loss": 1.1899, "step": 39956 }, { "epoch": 0.75, "learning_rate": 7.532036568868439e-07, "loss": 0.8798, "step": 39957 }, { "epoch": 0.75, "learning_rate": 7.530943721927451e-07, "loss": 0.8817, "step": 39958 }, { "epoch": 0.75, "learning_rate": 7.529850940215364e-07, "loss": 0.9041, "step": 39959 }, { "epoch": 0.75, "learning_rate": 7.528758223736296e-07, "loss": 0.6733, "step": 39960 }, { "epoch": 0.75, "learning_rate": 7.527665572494303e-07, "loss": 0.8593, "step": 39961 }, { "epoch": 0.75, "learning_rate": 7.526572986493469e-07, "loss": 1.1348, "step": 39962 }, { "epoch": 0.75, "learning_rate": 7.525480465737875e-07, "loss": 0.9777, "step": 39963 }, { "epoch": 0.75, "learning_rate": 7.524388010231603e-07, "loss": 0.8885, "step": 39964 }, { "epoch": 0.75, "learning_rate": 7.52329561997873e-07, "loss": 0.7678, "step": 39965 }, { "epoch": 0.75, "learning_rate": 7.522203294983335e-07, "loss": 0.9349, "step": 39966 }, { "epoch": 0.75, "learning_rate": 7.521111035249504e-07, "loss": 0.6436, "step": 39967 }, { "epoch": 0.75, "learning_rate": 7.520018840781293e-07, "loss": 0.9904, "step": 39968 }, { "epoch": 0.75, "learning_rate": 7.518926711582814e-07, "loss": 1.0092, "step": 39969 }, { "epoch": 0.75, "learning_rate": 7.517834647658115e-07, "loss": 0.8815, "step": 39970 }, { "epoch": 0.75, "learning_rate": 7.51674264901128e-07, "loss": 0.8482, "step": 39971 }, { "epoch": 0.75, "learning_rate": 7.515650715646405e-07, "loss": 0.8057, "step": 39972 }, { "epoch": 0.75, "learning_rate": 7.514558847567549e-07, "loss": 0.674, "step": 39973 }, { "epoch": 0.75, "learning_rate": 7.513467044778794e-07, "loss": 0.8551, "step": 39974 }, { "epoch": 0.75, "learning_rate": 7.512375307284217e-07, "loss": 0.9142, "step": 39975 }, { "epoch": 0.75, "learning_rate": 7.511283635087894e-07, "loss": 0.9699, "step": 39976 }, { "epoch": 0.75, "learning_rate": 7.510192028193899e-07, "loss": 0.9615, "step": 39977 }, { "epoch": 0.75, "learning_rate": 7.509100486606313e-07, "loss": 0.8585, "step": 39978 }, { "epoch": 0.75, "learning_rate": 7.50800901032922e-07, "loss": 0.6987, "step": 39979 }, { "epoch": 0.75, "learning_rate": 7.506917599366668e-07, "loss": 1.037, "step": 39980 }, { "epoch": 0.75, "learning_rate": 7.505826253722762e-07, "loss": 1.0523, "step": 39981 }, { "epoch": 0.75, "learning_rate": 7.504734973401559e-07, "loss": 1.0414, "step": 39982 }, { "epoch": 0.75, "learning_rate": 7.503643758407137e-07, "loss": 0.9777, "step": 39983 }, { "epoch": 0.75, "learning_rate": 7.502552608743574e-07, "loss": 0.7359, "step": 39984 }, { "epoch": 0.75, "learning_rate": 7.501461524414944e-07, "loss": 0.8501, "step": 39985 }, { "epoch": 0.75, "learning_rate": 7.50037050542532e-07, "loss": 0.6306, "step": 39986 }, { "epoch": 0.75, "learning_rate": 7.499279551778776e-07, "loss": 1.1793, "step": 39987 }, { "epoch": 0.75, "learning_rate": 7.498188663479392e-07, "loss": 0.9915, "step": 39988 }, { "epoch": 0.75, "learning_rate": 7.49709784053122e-07, "loss": 0.8922, "step": 39989 }, { "epoch": 0.75, "learning_rate": 7.496007082938364e-07, "loss": 0.9096, "step": 39990 }, { "epoch": 0.75, "learning_rate": 7.494916390704874e-07, "loss": 0.7383, "step": 39991 }, { "epoch": 0.75, "learning_rate": 7.49382576383482e-07, "loss": 0.7458, "step": 39992 }, { "epoch": 0.75, "learning_rate": 7.492735202332299e-07, "loss": 0.883, "step": 39993 }, { "epoch": 0.75, "learning_rate": 7.491644706201361e-07, "loss": 0.9658, "step": 39994 }, { "epoch": 0.75, "learning_rate": 7.490554275446086e-07, "loss": 0.9887, "step": 39995 }, { "epoch": 0.75, "learning_rate": 7.489463910070544e-07, "loss": 0.7764, "step": 39996 }, { "epoch": 0.75, "learning_rate": 7.488373610078806e-07, "loss": 0.8488, "step": 39997 }, { "epoch": 0.75, "learning_rate": 7.487283375474944e-07, "loss": 0.7939, "step": 39998 }, { "epoch": 0.75, "learning_rate": 7.486193206263028e-07, "loss": 1.041, "step": 39999 }, { "epoch": 0.75, "learning_rate": 7.485103102447142e-07, "loss": 0.9664, "step": 40000 }, { "epoch": 0.75, "learning_rate": 7.484013064031323e-07, "loss": 0.893, "step": 40001 }, { "epoch": 0.75, "learning_rate": 7.482923091019681e-07, "loss": 0.7024, "step": 40002 }, { "epoch": 0.75, "learning_rate": 7.481833183416259e-07, "loss": 0.7521, "step": 40003 }, { "epoch": 0.75, "learning_rate": 7.480743341225133e-07, "loss": 0.808, "step": 40004 }, { "epoch": 0.75, "learning_rate": 7.479653564450376e-07, "loss": 1.1325, "step": 40005 }, { "epoch": 0.75, "learning_rate": 7.478563853096055e-07, "loss": 1.1172, "step": 40006 }, { "epoch": 0.75, "learning_rate": 7.477474207166238e-07, "loss": 0.9669, "step": 40007 }, { "epoch": 0.75, "learning_rate": 7.476384626664995e-07, "loss": 0.7375, "step": 40008 }, { "epoch": 0.75, "learning_rate": 7.475295111596403e-07, "loss": 0.9051, "step": 40009 }, { "epoch": 0.75, "learning_rate": 7.474205661964507e-07, "loss": 0.8649, "step": 40010 }, { "epoch": 0.75, "learning_rate": 7.473116277773404e-07, "loss": 0.8053, "step": 40011 }, { "epoch": 0.75, "learning_rate": 7.472026959027143e-07, "loss": 1.0934, "step": 40012 }, { "epoch": 0.75, "learning_rate": 7.470937705729784e-07, "loss": 0.8947, "step": 40013 }, { "epoch": 0.75, "learning_rate": 7.469848517885423e-07, "loss": 0.8879, "step": 40014 }, { "epoch": 0.75, "learning_rate": 7.468759395498104e-07, "loss": 0.8585, "step": 40015 }, { "epoch": 0.75, "learning_rate": 7.467670338571898e-07, "loss": 0.6197, "step": 40016 }, { "epoch": 0.75, "learning_rate": 7.466581347110874e-07, "loss": 0.9553, "step": 40017 }, { "epoch": 0.76, "learning_rate": 7.465492421119098e-07, "loss": 1.0297, "step": 40018 }, { "epoch": 0.76, "learning_rate": 7.464403560600633e-07, "loss": 1.2152, "step": 40019 }, { "epoch": 0.76, "learning_rate": 7.463314765559552e-07, "loss": 0.8567, "step": 40020 }, { "epoch": 0.76, "learning_rate": 7.46222603599992e-07, "loss": 1.011, "step": 40021 }, { "epoch": 0.76, "learning_rate": 7.461137371925783e-07, "loss": 0.8753, "step": 40022 }, { "epoch": 0.76, "learning_rate": 7.460048773341238e-07, "loss": 0.9415, "step": 40023 }, { "epoch": 0.76, "learning_rate": 7.458960240250327e-07, "loss": 0.9799, "step": 40024 }, { "epoch": 0.76, "learning_rate": 7.457871772657119e-07, "loss": 1.0883, "step": 40025 }, { "epoch": 0.76, "learning_rate": 7.456783370565679e-07, "loss": 1.1169, "step": 40026 }, { "epoch": 0.76, "learning_rate": 7.455695033980074e-07, "loss": 0.8398, "step": 40027 }, { "epoch": 0.76, "learning_rate": 7.454606762904365e-07, "loss": 0.7645, "step": 40028 }, { "epoch": 0.76, "learning_rate": 7.453518557342615e-07, "loss": 0.8666, "step": 40029 }, { "epoch": 0.76, "learning_rate": 7.452430417298897e-07, "loss": 0.96, "step": 40030 }, { "epoch": 0.76, "learning_rate": 7.451342342777251e-07, "loss": 1.2193, "step": 40031 }, { "epoch": 0.76, "learning_rate": 7.45025433378177e-07, "loss": 1.0225, "step": 40032 }, { "epoch": 0.76, "learning_rate": 7.449166390316496e-07, "loss": 0.7928, "step": 40033 }, { "epoch": 0.76, "learning_rate": 7.448078512385493e-07, "loss": 0.933, "step": 40034 }, { "epoch": 0.76, "learning_rate": 7.446990699992828e-07, "loss": 0.7147, "step": 40035 }, { "epoch": 0.76, "learning_rate": 7.445902953142561e-07, "loss": 0.8954, "step": 40036 }, { "epoch": 0.76, "learning_rate": 7.444815271838763e-07, "loss": 1.2084, "step": 40037 }, { "epoch": 0.76, "learning_rate": 7.44372765608547e-07, "loss": 1.0242, "step": 40038 }, { "epoch": 0.76, "learning_rate": 7.442640105886767e-07, "loss": 0.8423, "step": 40039 }, { "epoch": 0.76, "learning_rate": 7.441552621246717e-07, "loss": 0.9958, "step": 40040 }, { "epoch": 0.76, "learning_rate": 7.440465202169353e-07, "loss": 1.0464, "step": 40041 }, { "epoch": 0.76, "learning_rate": 7.439377848658771e-07, "loss": 0.7164, "step": 40042 }, { "epoch": 0.76, "learning_rate": 7.438290560719005e-07, "loss": 1.0043, "step": 40043 }, { "epoch": 0.76, "learning_rate": 7.437203338354126e-07, "loss": 1.0892, "step": 40044 }, { "epoch": 0.76, "learning_rate": 7.43611618156819e-07, "loss": 0.9613, "step": 40045 }, { "epoch": 0.76, "learning_rate": 7.435029090365256e-07, "loss": 0.953, "step": 40046 }, { "epoch": 0.76, "learning_rate": 7.433942064749386e-07, "loss": 0.9705, "step": 40047 }, { "epoch": 0.76, "learning_rate": 7.432855104724638e-07, "loss": 0.8318, "step": 40048 }, { "epoch": 0.76, "learning_rate": 7.431768210295076e-07, "loss": 1.0777, "step": 40049 }, { "epoch": 0.76, "learning_rate": 7.430681381464741e-07, "loss": 0.9929, "step": 40050 }, { "epoch": 0.76, "learning_rate": 7.429594618237718e-07, "loss": 0.9744, "step": 40051 }, { "epoch": 0.76, "learning_rate": 7.428507920618039e-07, "loss": 0.757, "step": 40052 }, { "epoch": 0.76, "learning_rate": 7.427421288609774e-07, "loss": 1.0739, "step": 40053 }, { "epoch": 0.76, "learning_rate": 7.426334722216979e-07, "loss": 0.739, "step": 40054 }, { "epoch": 0.76, "learning_rate": 7.425248221443715e-07, "loss": 0.8347, "step": 40055 }, { "epoch": 0.76, "learning_rate": 7.424161786294032e-07, "loss": 1.229, "step": 40056 }, { "epoch": 0.76, "learning_rate": 7.423075416771988e-07, "loss": 1.1114, "step": 40057 }, { "epoch": 0.76, "learning_rate": 7.421989112881653e-07, "loss": 0.8768, "step": 40058 }, { "epoch": 0.76, "learning_rate": 7.420902874627054e-07, "loss": 0.8754, "step": 40059 }, { "epoch": 0.76, "learning_rate": 7.419816702012272e-07, "loss": 0.848, "step": 40060 }, { "epoch": 0.76, "learning_rate": 7.418730595041365e-07, "loss": 0.9673, "step": 40061 }, { "epoch": 0.76, "learning_rate": 7.417644553718364e-07, "loss": 1.0537, "step": 40062 }, { "epoch": 0.76, "learning_rate": 7.416558578047353e-07, "loss": 1.018, "step": 40063 }, { "epoch": 0.76, "learning_rate": 7.415472668032367e-07, "loss": 0.9194, "step": 40064 }, { "epoch": 0.76, "learning_rate": 7.414386823677464e-07, "loss": 0.8056, "step": 40065 }, { "epoch": 0.76, "learning_rate": 7.413301044986704e-07, "loss": 0.8451, "step": 40066 }, { "epoch": 0.76, "learning_rate": 7.412215331964137e-07, "loss": 0.7346, "step": 40067 }, { "epoch": 0.76, "learning_rate": 7.411129684613821e-07, "loss": 0.9689, "step": 40068 }, { "epoch": 0.76, "learning_rate": 7.410044102939807e-07, "loss": 0.7991, "step": 40069 }, { "epoch": 0.76, "learning_rate": 7.408958586946155e-07, "loss": 0.8453, "step": 40070 }, { "epoch": 0.76, "learning_rate": 7.407873136636898e-07, "loss": 0.9749, "step": 40071 }, { "epoch": 0.76, "learning_rate": 7.406787752016118e-07, "loss": 0.9871, "step": 40072 }, { "epoch": 0.76, "learning_rate": 7.405702433087844e-07, "loss": 0.9758, "step": 40073 }, { "epoch": 0.76, "learning_rate": 7.404617179856141e-07, "loss": 0.9236, "step": 40074 }, { "epoch": 0.76, "learning_rate": 7.403531992325056e-07, "loss": 1.2443, "step": 40075 }, { "epoch": 0.76, "learning_rate": 7.402446870498642e-07, "loss": 0.8307, "step": 40076 }, { "epoch": 0.76, "learning_rate": 7.401361814380953e-07, "loss": 0.814, "step": 40077 }, { "epoch": 0.76, "learning_rate": 7.400276823976041e-07, "loss": 0.8559, "step": 40078 }, { "epoch": 0.76, "learning_rate": 7.39919189928796e-07, "loss": 0.8586, "step": 40079 }, { "epoch": 0.76, "learning_rate": 7.398107040320746e-07, "loss": 0.9385, "step": 40080 }, { "epoch": 0.76, "learning_rate": 7.397022247078464e-07, "loss": 1.3174, "step": 40081 }, { "epoch": 0.76, "learning_rate": 7.395937519565172e-07, "loss": 0.9547, "step": 40082 }, { "epoch": 0.76, "learning_rate": 7.394852857784893e-07, "loss": 0.743, "step": 40083 }, { "epoch": 0.76, "learning_rate": 7.393768261741707e-07, "loss": 0.8871, "step": 40084 }, { "epoch": 0.76, "learning_rate": 7.392683731439646e-07, "loss": 0.7245, "step": 40085 }, { "epoch": 0.76, "learning_rate": 7.391599266882763e-07, "loss": 0.7736, "step": 40086 }, { "epoch": 0.76, "learning_rate": 7.390514868075107e-07, "loss": 1.0624, "step": 40087 }, { "epoch": 0.76, "learning_rate": 7.389430535020731e-07, "loss": 0.9267, "step": 40088 }, { "epoch": 0.76, "learning_rate": 7.388346267723678e-07, "loss": 0.8605, "step": 40089 }, { "epoch": 0.76, "learning_rate": 7.387262066188003e-07, "loss": 0.8983, "step": 40090 }, { "epoch": 0.76, "learning_rate": 7.38617793041776e-07, "loss": 0.7901, "step": 40091 }, { "epoch": 0.76, "learning_rate": 7.38509386041697e-07, "loss": 0.7181, "step": 40092 }, { "epoch": 0.76, "learning_rate": 7.384009856189716e-07, "loss": 1.119, "step": 40093 }, { "epoch": 0.76, "learning_rate": 7.382925917740022e-07, "loss": 1.1019, "step": 40094 }, { "epoch": 0.76, "learning_rate": 7.381842045071944e-07, "loss": 0.7394, "step": 40095 }, { "epoch": 0.76, "learning_rate": 7.380758238189526e-07, "loss": 0.8608, "step": 40096 }, { "epoch": 0.76, "learning_rate": 7.379674497096814e-07, "loss": 0.9302, "step": 40097 }, { "epoch": 0.76, "learning_rate": 7.37859082179786e-07, "loss": 1.0287, "step": 40098 }, { "epoch": 0.76, "learning_rate": 7.377507212296709e-07, "loss": 0.8675, "step": 40099 }, { "epoch": 0.76, "learning_rate": 7.37642366859741e-07, "loss": 0.8946, "step": 40100 }, { "epoch": 0.76, "learning_rate": 7.375340190703992e-07, "loss": 1.1125, "step": 40101 }, { "epoch": 0.76, "learning_rate": 7.374256778620517e-07, "loss": 0.9301, "step": 40102 }, { "epoch": 0.76, "learning_rate": 7.373173432351039e-07, "loss": 0.9489, "step": 40103 }, { "epoch": 0.76, "learning_rate": 7.372090151899575e-07, "loss": 0.9216, "step": 40104 }, { "epoch": 0.76, "learning_rate": 7.371006937270198e-07, "loss": 1.025, "step": 40105 }, { "epoch": 0.76, "learning_rate": 7.369923788466935e-07, "loss": 0.9001, "step": 40106 }, { "epoch": 0.76, "learning_rate": 7.368840705493838e-07, "loss": 1.032, "step": 40107 }, { "epoch": 0.76, "learning_rate": 7.367757688354945e-07, "loss": 0.9025, "step": 40108 }, { "epoch": 0.76, "learning_rate": 7.366674737054308e-07, "loss": 0.9727, "step": 40109 }, { "epoch": 0.76, "learning_rate": 7.365591851595966e-07, "loss": 1.0155, "step": 40110 }, { "epoch": 0.76, "learning_rate": 7.364509031983963e-07, "loss": 0.8902, "step": 40111 }, { "epoch": 0.76, "learning_rate": 7.363426278222349e-07, "loss": 1.1452, "step": 40112 }, { "epoch": 0.76, "learning_rate": 7.362343590315147e-07, "loss": 1.0136, "step": 40113 }, { "epoch": 0.76, "learning_rate": 7.361260968266426e-07, "loss": 0.8637, "step": 40114 }, { "epoch": 0.76, "learning_rate": 7.36017841208021e-07, "loss": 1.0473, "step": 40115 }, { "epoch": 0.76, "learning_rate": 7.359095921760548e-07, "loss": 0.7476, "step": 40116 }, { "epoch": 0.76, "learning_rate": 7.358013497311478e-07, "loss": 0.9508, "step": 40117 }, { "epoch": 0.76, "learning_rate": 7.356931138737048e-07, "loss": 0.9399, "step": 40118 }, { "epoch": 0.76, "learning_rate": 7.355848846041294e-07, "loss": 1.0558, "step": 40119 }, { "epoch": 0.76, "learning_rate": 7.35476661922826e-07, "loss": 0.746, "step": 40120 }, { "epoch": 0.76, "learning_rate": 7.353684458301993e-07, "loss": 1.0052, "step": 40121 }, { "epoch": 0.76, "learning_rate": 7.352602363266514e-07, "loss": 0.9083, "step": 40122 }, { "epoch": 0.76, "learning_rate": 7.351520334125883e-07, "loss": 0.7484, "step": 40123 }, { "epoch": 0.76, "learning_rate": 7.350438370884142e-07, "loss": 0.8352, "step": 40124 }, { "epoch": 0.76, "learning_rate": 7.349356473545308e-07, "loss": 0.9648, "step": 40125 }, { "epoch": 0.76, "learning_rate": 7.348274642113451e-07, "loss": 0.899, "step": 40126 }, { "epoch": 0.76, "learning_rate": 7.347192876592585e-07, "loss": 0.6365, "step": 40127 }, { "epoch": 0.76, "learning_rate": 7.346111176986762e-07, "loss": 0.7489, "step": 40128 }, { "epoch": 0.76, "learning_rate": 7.34502954330002e-07, "loss": 0.731, "step": 40129 }, { "epoch": 0.76, "learning_rate": 7.343947975536395e-07, "loss": 0.8765, "step": 40130 }, { "epoch": 0.76, "learning_rate": 7.342866473699925e-07, "loss": 1.0551, "step": 40131 }, { "epoch": 0.76, "learning_rate": 7.341785037794652e-07, "loss": 0.8639, "step": 40132 }, { "epoch": 0.76, "learning_rate": 7.34070366782462e-07, "loss": 0.9843, "step": 40133 }, { "epoch": 0.76, "learning_rate": 7.339622363793844e-07, "loss": 0.915, "step": 40134 }, { "epoch": 0.76, "learning_rate": 7.338541125706392e-07, "loss": 0.7083, "step": 40135 }, { "epoch": 0.76, "learning_rate": 7.337459953566278e-07, "loss": 0.8737, "step": 40136 }, { "epoch": 0.76, "learning_rate": 7.336378847377545e-07, "loss": 0.9664, "step": 40137 }, { "epoch": 0.76, "learning_rate": 7.335297807144235e-07, "loss": 0.8611, "step": 40138 }, { "epoch": 0.76, "learning_rate": 7.334216832870378e-07, "loss": 1.0189, "step": 40139 }, { "epoch": 0.76, "learning_rate": 7.333135924560017e-07, "loss": 0.8871, "step": 40140 }, { "epoch": 0.76, "learning_rate": 7.332055082217182e-07, "loss": 0.9379, "step": 40141 }, { "epoch": 0.76, "learning_rate": 7.330974305845923e-07, "loss": 0.7767, "step": 40142 }, { "epoch": 0.76, "learning_rate": 7.329893595450247e-07, "loss": 0.8084, "step": 40143 }, { "epoch": 0.76, "learning_rate": 7.328812951034212e-07, "loss": 1.0575, "step": 40144 }, { "epoch": 0.76, "learning_rate": 7.327732372601857e-07, "loss": 0.8941, "step": 40145 }, { "epoch": 0.76, "learning_rate": 7.326651860157191e-07, "loss": 0.9283, "step": 40146 }, { "epoch": 0.76, "learning_rate": 7.325571413704283e-07, "loss": 0.8783, "step": 40147 }, { "epoch": 0.76, "learning_rate": 7.324491033247139e-07, "loss": 0.7821, "step": 40148 }, { "epoch": 0.76, "learning_rate": 7.323410718789806e-07, "loss": 0.7734, "step": 40149 }, { "epoch": 0.76, "learning_rate": 7.322330470336314e-07, "loss": 1.0545, "step": 40150 }, { "epoch": 0.76, "learning_rate": 7.3212502878907e-07, "loss": 0.806, "step": 40151 }, { "epoch": 0.76, "learning_rate": 7.320170171456991e-07, "loss": 0.8875, "step": 40152 }, { "epoch": 0.76, "learning_rate": 7.319090121039229e-07, "loss": 0.9956, "step": 40153 }, { "epoch": 0.76, "learning_rate": 7.318010136641449e-07, "loss": 0.8228, "step": 40154 }, { "epoch": 0.76, "learning_rate": 7.316930218267659e-07, "loss": 0.8375, "step": 40155 }, { "epoch": 0.76, "learning_rate": 7.315850365921929e-07, "loss": 0.9843, "step": 40156 }, { "epoch": 0.76, "learning_rate": 7.31477057960826e-07, "loss": 0.923, "step": 40157 }, { "epoch": 0.76, "learning_rate": 7.313690859330688e-07, "loss": 1.2137, "step": 40158 }, { "epoch": 0.76, "learning_rate": 7.31261120509327e-07, "loss": 0.9296, "step": 40159 }, { "epoch": 0.76, "learning_rate": 7.311531616900009e-07, "loss": 0.8558, "step": 40160 }, { "epoch": 0.76, "learning_rate": 7.310452094754949e-07, "loss": 1.0192, "step": 40161 }, { "epoch": 0.76, "learning_rate": 7.309372638662118e-07, "loss": 1.0761, "step": 40162 }, { "epoch": 0.76, "learning_rate": 7.308293248625545e-07, "loss": 1.0966, "step": 40163 }, { "epoch": 0.76, "learning_rate": 7.307213924649265e-07, "loss": 0.9687, "step": 40164 }, { "epoch": 0.76, "learning_rate": 7.306134666737305e-07, "loss": 0.975, "step": 40165 }, { "epoch": 0.76, "learning_rate": 7.305055474893705e-07, "loss": 1.015, "step": 40166 }, { "epoch": 0.76, "learning_rate": 7.303976349122466e-07, "loss": 0.8192, "step": 40167 }, { "epoch": 0.76, "learning_rate": 7.302897289427655e-07, "loss": 1.0029, "step": 40168 }, { "epoch": 0.76, "learning_rate": 7.301818295813273e-07, "loss": 1.0005, "step": 40169 }, { "epoch": 0.76, "learning_rate": 7.300739368283363e-07, "loss": 0.9588, "step": 40170 }, { "epoch": 0.76, "learning_rate": 7.299660506841947e-07, "loss": 0.8718, "step": 40171 }, { "epoch": 0.76, "learning_rate": 7.298581711493055e-07, "loss": 0.8868, "step": 40172 }, { "epoch": 0.76, "learning_rate": 7.297502982240718e-07, "loss": 0.9427, "step": 40173 }, { "epoch": 0.76, "learning_rate": 7.29642431908896e-07, "loss": 1.0715, "step": 40174 }, { "epoch": 0.76, "learning_rate": 7.295345722041819e-07, "loss": 1.0833, "step": 40175 }, { "epoch": 0.76, "learning_rate": 7.2942671911033e-07, "loss": 0.9897, "step": 40176 }, { "epoch": 0.76, "learning_rate": 7.293188726277459e-07, "loss": 0.7897, "step": 40177 }, { "epoch": 0.76, "learning_rate": 7.292110327568302e-07, "loss": 0.947, "step": 40178 }, { "epoch": 0.76, "learning_rate": 7.291031994979853e-07, "loss": 0.8864, "step": 40179 }, { "epoch": 0.76, "learning_rate": 7.289953728516163e-07, "loss": 0.9474, "step": 40180 }, { "epoch": 0.76, "learning_rate": 7.288875528181236e-07, "loss": 0.8188, "step": 40181 }, { "epoch": 0.76, "learning_rate": 7.287797393979105e-07, "loss": 0.7524, "step": 40182 }, { "epoch": 0.76, "learning_rate": 7.286719325913794e-07, "loss": 0.963, "step": 40183 }, { "epoch": 0.76, "learning_rate": 7.285641323989332e-07, "loss": 0.909, "step": 40184 }, { "epoch": 0.76, "learning_rate": 7.28456338820974e-07, "loss": 0.9343, "step": 40185 }, { "epoch": 0.76, "learning_rate": 7.283485518579045e-07, "loss": 0.7589, "step": 40186 }, { "epoch": 0.76, "learning_rate": 7.282407715101281e-07, "loss": 1.101, "step": 40187 }, { "epoch": 0.76, "learning_rate": 7.281329977780447e-07, "loss": 0.9813, "step": 40188 }, { "epoch": 0.76, "learning_rate": 7.2802523066206e-07, "loss": 0.8059, "step": 40189 }, { "epoch": 0.76, "learning_rate": 7.279174701625738e-07, "loss": 0.9213, "step": 40190 }, { "epoch": 0.76, "learning_rate": 7.278097162799896e-07, "loss": 0.7955, "step": 40191 }, { "epoch": 0.76, "learning_rate": 7.277019690147097e-07, "loss": 0.7427, "step": 40192 }, { "epoch": 0.76, "learning_rate": 7.275942283671361e-07, "loss": 1.1254, "step": 40193 }, { "epoch": 0.76, "learning_rate": 7.274864943376714e-07, "loss": 1.0274, "step": 40194 }, { "epoch": 0.76, "learning_rate": 7.273787669267176e-07, "loss": 0.8228, "step": 40195 }, { "epoch": 0.76, "learning_rate": 7.272710461346782e-07, "loss": 0.977, "step": 40196 }, { "epoch": 0.76, "learning_rate": 7.271633319619525e-07, "loss": 0.7208, "step": 40197 }, { "epoch": 0.76, "learning_rate": 7.270556244089463e-07, "loss": 0.7996, "step": 40198 }, { "epoch": 0.76, "learning_rate": 7.269479234760593e-07, "loss": 1.0073, "step": 40199 }, { "epoch": 0.76, "learning_rate": 7.268402291636937e-07, "loss": 1.0858, "step": 40200 }, { "epoch": 0.76, "learning_rate": 7.267325414722537e-07, "loss": 0.8351, "step": 40201 }, { "epoch": 0.76, "learning_rate": 7.266248604021392e-07, "loss": 0.6126, "step": 40202 }, { "epoch": 0.76, "learning_rate": 7.265171859537532e-07, "loss": 0.9716, "step": 40203 }, { "epoch": 0.76, "learning_rate": 7.264095181274977e-07, "loss": 0.9236, "step": 40204 }, { "epoch": 0.76, "learning_rate": 7.263018569237746e-07, "loss": 0.9325, "step": 40205 }, { "epoch": 0.76, "learning_rate": 7.261942023429857e-07, "loss": 1.0145, "step": 40206 }, { "epoch": 0.76, "learning_rate": 7.260865543855339e-07, "loss": 0.776, "step": 40207 }, { "epoch": 0.76, "learning_rate": 7.259789130518208e-07, "loss": 0.834, "step": 40208 }, { "epoch": 0.76, "learning_rate": 7.258712783422467e-07, "loss": 0.8529, "step": 40209 }, { "epoch": 0.76, "learning_rate": 7.257636502572163e-07, "loss": 0.8342, "step": 40210 }, { "epoch": 0.76, "learning_rate": 7.256560287971293e-07, "loss": 0.9043, "step": 40211 }, { "epoch": 0.76, "learning_rate": 7.255484139623883e-07, "loss": 0.9525, "step": 40212 }, { "epoch": 0.76, "learning_rate": 7.254408057533951e-07, "loss": 1.0362, "step": 40213 }, { "epoch": 0.76, "learning_rate": 7.253332041705516e-07, "loss": 0.9525, "step": 40214 }, { "epoch": 0.76, "learning_rate": 7.252256092142593e-07, "loss": 0.9678, "step": 40215 }, { "epoch": 0.76, "learning_rate": 7.251180208849204e-07, "loss": 0.958, "step": 40216 }, { "epoch": 0.76, "learning_rate": 7.250104391829369e-07, "loss": 0.9285, "step": 40217 }, { "epoch": 0.76, "learning_rate": 7.249028641087086e-07, "loss": 1.0981, "step": 40218 }, { "epoch": 0.76, "learning_rate": 7.2479529566264e-07, "loss": 0.9471, "step": 40219 }, { "epoch": 0.76, "learning_rate": 7.246877338451308e-07, "loss": 0.8379, "step": 40220 }, { "epoch": 0.76, "learning_rate": 7.245801786565824e-07, "loss": 0.8875, "step": 40221 }, { "epoch": 0.76, "learning_rate": 7.244726300973983e-07, "loss": 0.8151, "step": 40222 }, { "epoch": 0.76, "learning_rate": 7.243650881679787e-07, "loss": 1.0516, "step": 40223 }, { "epoch": 0.76, "learning_rate": 7.242575528687251e-07, "loss": 1.0886, "step": 40224 }, { "epoch": 0.76, "learning_rate": 7.241500242000396e-07, "loss": 1.2394, "step": 40225 }, { "epoch": 0.76, "learning_rate": 7.240425021623232e-07, "loss": 0.8281, "step": 40226 }, { "epoch": 0.76, "learning_rate": 7.239349867559778e-07, "loss": 0.8113, "step": 40227 }, { "epoch": 0.76, "learning_rate": 7.238274779814048e-07, "loss": 0.8119, "step": 40228 }, { "epoch": 0.76, "learning_rate": 7.237199758390062e-07, "loss": 0.7918, "step": 40229 }, { "epoch": 0.76, "learning_rate": 7.23612480329181e-07, "loss": 0.822, "step": 40230 }, { "epoch": 0.76, "learning_rate": 7.235049914523343e-07, "loss": 1.0757, "step": 40231 }, { "epoch": 0.76, "learning_rate": 7.233975092088643e-07, "loss": 0.7969, "step": 40232 }, { "epoch": 0.76, "learning_rate": 7.232900335991738e-07, "loss": 0.8419, "step": 40233 }, { "epoch": 0.76, "learning_rate": 7.231825646236637e-07, "loss": 0.7574, "step": 40234 }, { "epoch": 0.76, "learning_rate": 7.230751022827357e-07, "loss": 0.8748, "step": 40235 }, { "epoch": 0.76, "learning_rate": 7.229676465767904e-07, "loss": 0.8805, "step": 40236 }, { "epoch": 0.76, "learning_rate": 7.228601975062297e-07, "loss": 0.9171, "step": 40237 }, { "epoch": 0.76, "learning_rate": 7.22752755071455e-07, "loss": 1.134, "step": 40238 }, { "epoch": 0.76, "learning_rate": 7.226453192728658e-07, "loss": 0.7448, "step": 40239 }, { "epoch": 0.76, "learning_rate": 7.225378901108659e-07, "loss": 0.9581, "step": 40240 }, { "epoch": 0.76, "learning_rate": 7.224304675858543e-07, "loss": 0.9693, "step": 40241 }, { "epoch": 0.76, "learning_rate": 7.223230516982318e-07, "loss": 0.7461, "step": 40242 }, { "epoch": 0.76, "learning_rate": 7.222156424484026e-07, "loss": 0.9655, "step": 40243 }, { "epoch": 0.76, "learning_rate": 7.221082398367643e-07, "loss": 0.89, "step": 40244 }, { "epoch": 0.76, "learning_rate": 7.220008438637196e-07, "loss": 0.9723, "step": 40245 }, { "epoch": 0.76, "learning_rate": 7.218934545296694e-07, "loss": 0.7966, "step": 40246 }, { "epoch": 0.76, "learning_rate": 7.217860718350142e-07, "loss": 0.7381, "step": 40247 }, { "epoch": 0.76, "learning_rate": 7.216786957801556e-07, "loss": 0.8515, "step": 40248 }, { "epoch": 0.76, "learning_rate": 7.215713263654938e-07, "loss": 1.0168, "step": 40249 }, { "epoch": 0.76, "learning_rate": 7.214639635914314e-07, "loss": 0.9432, "step": 40250 }, { "epoch": 0.76, "learning_rate": 7.213566074583664e-07, "loss": 0.7953, "step": 40251 }, { "epoch": 0.76, "learning_rate": 7.212492579667027e-07, "loss": 0.8276, "step": 40252 }, { "epoch": 0.76, "learning_rate": 7.211419151168388e-07, "loss": 0.8881, "step": 40253 }, { "epoch": 0.76, "learning_rate": 7.210345789091766e-07, "loss": 0.7267, "step": 40254 }, { "epoch": 0.76, "learning_rate": 7.209272493441169e-07, "loss": 0.9201, "step": 40255 }, { "epoch": 0.76, "learning_rate": 7.2081992642206e-07, "loss": 1.2226, "step": 40256 }, { "epoch": 0.76, "learning_rate": 7.207126101434073e-07, "loss": 0.9615, "step": 40257 }, { "epoch": 0.76, "learning_rate": 7.206053005085589e-07, "loss": 0.9767, "step": 40258 }, { "epoch": 0.76, "learning_rate": 7.204979975179166e-07, "loss": 0.8222, "step": 40259 }, { "epoch": 0.76, "learning_rate": 7.203907011718786e-07, "loss": 0.6618, "step": 40260 }, { "epoch": 0.76, "learning_rate": 7.202834114708488e-07, "loss": 0.8871, "step": 40261 }, { "epoch": 0.76, "learning_rate": 7.201761284152253e-07, "loss": 0.7947, "step": 40262 }, { "epoch": 0.76, "learning_rate": 7.200688520054089e-07, "loss": 0.933, "step": 40263 }, { "epoch": 0.76, "learning_rate": 7.199615822418024e-07, "loss": 0.8285, "step": 40264 }, { "epoch": 0.76, "learning_rate": 7.198543191248039e-07, "loss": 0.8645, "step": 40265 }, { "epoch": 0.76, "learning_rate": 7.197470626548147e-07, "loss": 0.8101, "step": 40266 }, { "epoch": 0.76, "learning_rate": 7.196398128322358e-07, "loss": 0.681, "step": 40267 }, { "epoch": 0.76, "learning_rate": 7.195325696574668e-07, "loss": 0.9559, "step": 40268 }, { "epoch": 0.76, "learning_rate": 7.194253331309095e-07, "loss": 0.8452, "step": 40269 }, { "epoch": 0.76, "learning_rate": 7.19318103252962e-07, "loss": 1.0656, "step": 40270 }, { "epoch": 0.76, "learning_rate": 7.192108800240275e-07, "loss": 0.8428, "step": 40271 }, { "epoch": 0.76, "learning_rate": 7.191036634445042e-07, "loss": 0.9067, "step": 40272 }, { "epoch": 0.76, "learning_rate": 7.189964535147933e-07, "loss": 0.8628, "step": 40273 }, { "epoch": 0.76, "learning_rate": 7.188892502352948e-07, "loss": 0.7974, "step": 40274 }, { "epoch": 0.76, "learning_rate": 7.187820536064096e-07, "loss": 1.1613, "step": 40275 }, { "epoch": 0.76, "learning_rate": 7.186748636285374e-07, "loss": 1.073, "step": 40276 }, { "epoch": 0.76, "learning_rate": 7.185676803020786e-07, "loss": 0.9019, "step": 40277 }, { "epoch": 0.76, "learning_rate": 7.184605036274344e-07, "loss": 0.7508, "step": 40278 }, { "epoch": 0.76, "learning_rate": 7.183533336050025e-07, "loss": 0.7633, "step": 40279 }, { "epoch": 0.76, "learning_rate": 7.182461702351859e-07, "loss": 0.9536, "step": 40280 }, { "epoch": 0.76, "learning_rate": 7.18139013518383e-07, "loss": 0.8812, "step": 40281 }, { "epoch": 0.76, "learning_rate": 7.180318634549943e-07, "loss": 0.9666, "step": 40282 }, { "epoch": 0.76, "learning_rate": 7.179247200454201e-07, "loss": 0.9542, "step": 40283 }, { "epoch": 0.76, "learning_rate": 7.178175832900599e-07, "loss": 0.7984, "step": 40284 }, { "epoch": 0.76, "learning_rate": 7.177104531893148e-07, "loss": 1.0912, "step": 40285 }, { "epoch": 0.76, "learning_rate": 7.176033297435839e-07, "loss": 1.0029, "step": 40286 }, { "epoch": 0.76, "learning_rate": 7.174962129532684e-07, "loss": 1.0102, "step": 40287 }, { "epoch": 0.76, "learning_rate": 7.173891028187657e-07, "loss": 0.7957, "step": 40288 }, { "epoch": 0.76, "learning_rate": 7.17281999340478e-07, "loss": 0.8573, "step": 40289 }, { "epoch": 0.76, "learning_rate": 7.17174902518806e-07, "loss": 0.9298, "step": 40290 }, { "epoch": 0.76, "learning_rate": 7.170678123541464e-07, "loss": 0.9345, "step": 40291 }, { "epoch": 0.76, "learning_rate": 7.169607288469024e-07, "loss": 0.9066, "step": 40292 }, { "epoch": 0.76, "learning_rate": 7.168536519974717e-07, "loss": 1.254, "step": 40293 }, { "epoch": 0.76, "learning_rate": 7.167465818062547e-07, "loss": 1.0028, "step": 40294 }, { "epoch": 0.76, "learning_rate": 7.166395182736513e-07, "loss": 0.994, "step": 40295 }, { "epoch": 0.76, "learning_rate": 7.165324614000616e-07, "loss": 1.0117, "step": 40296 }, { "epoch": 0.76, "learning_rate": 7.164254111858845e-07, "loss": 1.0289, "step": 40297 }, { "epoch": 0.76, "learning_rate": 7.163183676315205e-07, "loss": 0.6971, "step": 40298 }, { "epoch": 0.76, "learning_rate": 7.162113307373697e-07, "loss": 1.0093, "step": 40299 }, { "epoch": 0.76, "learning_rate": 7.161043005038295e-07, "loss": 0.9969, "step": 40300 }, { "epoch": 0.76, "learning_rate": 7.159972769313031e-07, "loss": 0.8109, "step": 40301 }, { "epoch": 0.76, "learning_rate": 7.158902600201869e-07, "loss": 0.9828, "step": 40302 }, { "epoch": 0.76, "learning_rate": 7.157832497708819e-07, "loss": 0.8354, "step": 40303 }, { "epoch": 0.76, "learning_rate": 7.156762461837876e-07, "loss": 0.8322, "step": 40304 }, { "epoch": 0.76, "learning_rate": 7.155692492593036e-07, "loss": 1.1328, "step": 40305 }, { "epoch": 0.76, "learning_rate": 7.154622589978294e-07, "loss": 1.2451, "step": 40306 }, { "epoch": 0.76, "learning_rate": 7.153552753997642e-07, "loss": 1.121, "step": 40307 }, { "epoch": 0.76, "learning_rate": 7.152482984655085e-07, "loss": 0.5512, "step": 40308 }, { "epoch": 0.76, "learning_rate": 7.151413281954591e-07, "loss": 0.757, "step": 40309 }, { "epoch": 0.76, "learning_rate": 7.150343645900184e-07, "loss": 1.0287, "step": 40310 }, { "epoch": 0.76, "learning_rate": 7.149274076495851e-07, "loss": 0.9022, "step": 40311 }, { "epoch": 0.76, "learning_rate": 7.14820457374557e-07, "loss": 1.0164, "step": 40312 }, { "epoch": 0.76, "learning_rate": 7.14713513765336e-07, "loss": 0.9534, "step": 40313 }, { "epoch": 0.76, "learning_rate": 7.14606576822319e-07, "loss": 0.8403, "step": 40314 }, { "epoch": 0.76, "learning_rate": 7.144996465459065e-07, "loss": 0.8796, "step": 40315 }, { "epoch": 0.76, "learning_rate": 7.143927229364975e-07, "loss": 0.8176, "step": 40316 }, { "epoch": 0.76, "learning_rate": 7.142858059944913e-07, "loss": 0.9168, "step": 40317 }, { "epoch": 0.76, "learning_rate": 7.141788957202872e-07, "loss": 0.8853, "step": 40318 }, { "epoch": 0.76, "learning_rate": 7.140719921142845e-07, "loss": 0.9707, "step": 40319 }, { "epoch": 0.76, "learning_rate": 7.139650951768828e-07, "loss": 0.9225, "step": 40320 }, { "epoch": 0.76, "learning_rate": 7.138582049084791e-07, "loss": 0.9919, "step": 40321 }, { "epoch": 0.76, "learning_rate": 7.137513213094757e-07, "loss": 1.092, "step": 40322 }, { "epoch": 0.76, "learning_rate": 7.136444443802693e-07, "loss": 0.7081, "step": 40323 }, { "epoch": 0.76, "learning_rate": 7.135375741212599e-07, "loss": 1.0096, "step": 40324 }, { "epoch": 0.76, "learning_rate": 7.134307105328464e-07, "loss": 1.0599, "step": 40325 }, { "epoch": 0.76, "learning_rate": 7.133238536154277e-07, "loss": 0.8908, "step": 40326 }, { "epoch": 0.76, "learning_rate": 7.13217003369403e-07, "loss": 0.9179, "step": 40327 }, { "epoch": 0.76, "learning_rate": 7.131101597951711e-07, "loss": 1.0, "step": 40328 }, { "epoch": 0.76, "learning_rate": 7.130033228931322e-07, "loss": 0.7331, "step": 40329 }, { "epoch": 0.76, "learning_rate": 7.128964926636825e-07, "loss": 0.8316, "step": 40330 }, { "epoch": 0.76, "learning_rate": 7.127896691072231e-07, "loss": 1.2775, "step": 40331 }, { "epoch": 0.76, "learning_rate": 7.12682852224153e-07, "loss": 0.9234, "step": 40332 }, { "epoch": 0.76, "learning_rate": 7.125760420148689e-07, "loss": 0.9894, "step": 40333 }, { "epoch": 0.76, "learning_rate": 7.124692384797727e-07, "loss": 0.6927, "step": 40334 }, { "epoch": 0.76, "learning_rate": 7.123624416192607e-07, "loss": 0.8656, "step": 40335 }, { "epoch": 0.76, "learning_rate": 7.122556514337322e-07, "loss": 0.9027, "step": 40336 }, { "epoch": 0.76, "learning_rate": 7.121488679235866e-07, "loss": 0.9628, "step": 40337 }, { "epoch": 0.76, "learning_rate": 7.120420910892222e-07, "loss": 0.7868, "step": 40338 }, { "epoch": 0.76, "learning_rate": 7.119353209310381e-07, "loss": 0.9675, "step": 40339 }, { "epoch": 0.76, "learning_rate": 7.118285574494324e-07, "loss": 0.9153, "step": 40340 }, { "epoch": 0.76, "learning_rate": 7.117218006448051e-07, "loss": 0.8726, "step": 40341 }, { "epoch": 0.76, "learning_rate": 7.11615050517552e-07, "loss": 0.8996, "step": 40342 }, { "epoch": 0.76, "learning_rate": 7.11508307068075e-07, "loss": 0.9147, "step": 40343 }, { "epoch": 0.76, "learning_rate": 7.114015702967702e-07, "loss": 0.9586, "step": 40344 }, { "epoch": 0.76, "learning_rate": 7.112948402040373e-07, "loss": 1.0836, "step": 40345 }, { "epoch": 0.76, "learning_rate": 7.111881167902748e-07, "loss": 0.8556, "step": 40346 }, { "epoch": 0.76, "learning_rate": 7.110814000558808e-07, "loss": 0.6901, "step": 40347 }, { "epoch": 0.76, "learning_rate": 7.109746900012541e-07, "loss": 0.7728, "step": 40348 }, { "epoch": 0.76, "learning_rate": 7.108679866267931e-07, "loss": 1.1133, "step": 40349 }, { "epoch": 0.76, "learning_rate": 7.107612899328967e-07, "loss": 0.908, "step": 40350 }, { "epoch": 0.76, "learning_rate": 7.106545999199615e-07, "loss": 0.9057, "step": 40351 }, { "epoch": 0.76, "learning_rate": 7.105479165883877e-07, "loss": 0.7575, "step": 40352 }, { "epoch": 0.76, "learning_rate": 7.10441239938574e-07, "loss": 0.9741, "step": 40353 }, { "epoch": 0.76, "learning_rate": 7.103345699709166e-07, "loss": 0.7947, "step": 40354 }, { "epoch": 0.76, "learning_rate": 7.102279066858161e-07, "loss": 0.9719, "step": 40355 }, { "epoch": 0.76, "learning_rate": 7.101212500836694e-07, "loss": 0.9082, "step": 40356 }, { "epoch": 0.76, "learning_rate": 7.100146001648748e-07, "loss": 1.016, "step": 40357 }, { "epoch": 0.76, "learning_rate": 7.099079569298307e-07, "loss": 0.8312, "step": 40358 }, { "epoch": 0.76, "learning_rate": 7.098013203789355e-07, "loss": 0.7789, "step": 40359 }, { "epoch": 0.76, "learning_rate": 7.096946905125874e-07, "loss": 0.8778, "step": 40360 }, { "epoch": 0.76, "learning_rate": 7.095880673311844e-07, "loss": 0.7023, "step": 40361 }, { "epoch": 0.76, "learning_rate": 7.094814508351252e-07, "loss": 1.0603, "step": 40362 }, { "epoch": 0.76, "learning_rate": 7.09374841024806e-07, "loss": 0.8867, "step": 40363 }, { "epoch": 0.76, "learning_rate": 7.09268237900628e-07, "loss": 0.6715, "step": 40364 }, { "epoch": 0.76, "learning_rate": 7.091616414629865e-07, "loss": 0.9601, "step": 40365 }, { "epoch": 0.76, "learning_rate": 7.090550517122804e-07, "loss": 0.7362, "step": 40366 }, { "epoch": 0.76, "learning_rate": 7.089484686489082e-07, "loss": 0.8469, "step": 40367 }, { "epoch": 0.76, "learning_rate": 7.08841892273267e-07, "loss": 0.8112, "step": 40368 }, { "epoch": 0.76, "learning_rate": 7.087353225857557e-07, "loss": 1.1575, "step": 40369 }, { "epoch": 0.76, "learning_rate": 7.086287595867716e-07, "loss": 0.8762, "step": 40370 }, { "epoch": 0.76, "learning_rate": 7.085222032767136e-07, "loss": 0.8491, "step": 40371 }, { "epoch": 0.76, "learning_rate": 7.084156536559772e-07, "loss": 0.8598, "step": 40372 }, { "epoch": 0.76, "learning_rate": 7.083091107249623e-07, "loss": 0.7917, "step": 40373 }, { "epoch": 0.76, "learning_rate": 7.082025744840673e-07, "loss": 1.0322, "step": 40374 }, { "epoch": 0.76, "learning_rate": 7.080960449336877e-07, "loss": 0.8136, "step": 40375 }, { "epoch": 0.76, "learning_rate": 7.079895220742236e-07, "loss": 0.9359, "step": 40376 }, { "epoch": 0.76, "learning_rate": 7.078830059060709e-07, "loss": 0.7473, "step": 40377 }, { "epoch": 0.76, "learning_rate": 7.077764964296286e-07, "loss": 0.7712, "step": 40378 }, { "epoch": 0.76, "learning_rate": 7.076699936452935e-07, "loss": 0.7494, "step": 40379 }, { "epoch": 0.76, "learning_rate": 7.075634975534637e-07, "loss": 1.0519, "step": 40380 }, { "epoch": 0.76, "learning_rate": 7.07457008154537e-07, "loss": 1.2528, "step": 40381 }, { "epoch": 0.76, "learning_rate": 7.073505254489107e-07, "loss": 0.8731, "step": 40382 }, { "epoch": 0.76, "learning_rate": 7.072440494369837e-07, "loss": 0.7438, "step": 40383 }, { "epoch": 0.76, "learning_rate": 7.071375801191505e-07, "loss": 0.9215, "step": 40384 }, { "epoch": 0.76, "learning_rate": 7.070311174958122e-07, "loss": 0.8448, "step": 40385 }, { "epoch": 0.76, "learning_rate": 7.069246615673642e-07, "loss": 0.9194, "step": 40386 }, { "epoch": 0.76, "learning_rate": 7.068182123342043e-07, "loss": 0.9642, "step": 40387 }, { "epoch": 0.76, "learning_rate": 7.067117697967305e-07, "loss": 0.892, "step": 40388 }, { "epoch": 0.76, "learning_rate": 7.066053339553397e-07, "loss": 1.0279, "step": 40389 }, { "epoch": 0.76, "learning_rate": 7.064989048104296e-07, "loss": 0.9062, "step": 40390 }, { "epoch": 0.76, "learning_rate": 7.063924823623977e-07, "loss": 0.8489, "step": 40391 }, { "epoch": 0.76, "learning_rate": 7.062860666116423e-07, "loss": 0.8625, "step": 40392 }, { "epoch": 0.76, "learning_rate": 7.061796575585578e-07, "loss": 1.1196, "step": 40393 }, { "epoch": 0.76, "learning_rate": 7.060732552035443e-07, "loss": 0.8431, "step": 40394 }, { "epoch": 0.76, "learning_rate": 7.05966859546999e-07, "loss": 0.9998, "step": 40395 }, { "epoch": 0.76, "learning_rate": 7.058604705893171e-07, "loss": 0.9047, "step": 40396 }, { "epoch": 0.76, "learning_rate": 7.057540883308986e-07, "loss": 0.8921, "step": 40397 }, { "epoch": 0.76, "learning_rate": 7.056477127721384e-07, "loss": 0.7218, "step": 40398 }, { "epoch": 0.76, "learning_rate": 7.055413439134348e-07, "loss": 0.9071, "step": 40399 }, { "epoch": 0.76, "learning_rate": 7.054349817551847e-07, "loss": 1.0035, "step": 40400 }, { "epoch": 0.76, "learning_rate": 7.053286262977857e-07, "loss": 0.9316, "step": 40401 }, { "epoch": 0.76, "learning_rate": 7.052222775416342e-07, "loss": 0.7267, "step": 40402 }, { "epoch": 0.76, "learning_rate": 7.051159354871278e-07, "loss": 0.7443, "step": 40403 }, { "epoch": 0.76, "learning_rate": 7.050096001346643e-07, "loss": 0.8251, "step": 40404 }, { "epoch": 0.76, "learning_rate": 7.049032714846385e-07, "loss": 1.0502, "step": 40405 }, { "epoch": 0.76, "learning_rate": 7.047969495374502e-07, "loss": 1.1987, "step": 40406 }, { "epoch": 0.76, "learning_rate": 7.046906342934942e-07, "loss": 0.9716, "step": 40407 }, { "epoch": 0.76, "learning_rate": 7.045843257531685e-07, "loss": 0.7653, "step": 40408 }, { "epoch": 0.76, "learning_rate": 7.044780239168697e-07, "loss": 0.9728, "step": 40409 }, { "epoch": 0.76, "learning_rate": 7.043717287849949e-07, "loss": 0.9831, "step": 40410 }, { "epoch": 0.76, "learning_rate": 7.042654403579413e-07, "loss": 1.0474, "step": 40411 }, { "epoch": 0.76, "learning_rate": 7.041591586361052e-07, "loss": 1.0868, "step": 40412 }, { "epoch": 0.76, "learning_rate": 7.040528836198846e-07, "loss": 0.8294, "step": 40413 }, { "epoch": 0.76, "learning_rate": 7.039466153096741e-07, "loss": 0.8073, "step": 40414 }, { "epoch": 0.76, "learning_rate": 7.038403537058725e-07, "loss": 0.8571, "step": 40415 }, { "epoch": 0.76, "learning_rate": 7.037340988088767e-07, "loss": 0.8705, "step": 40416 }, { "epoch": 0.76, "learning_rate": 7.036278506190811e-07, "loss": 0.8643, "step": 40417 }, { "epoch": 0.76, "learning_rate": 7.035216091368858e-07, "loss": 0.9604, "step": 40418 }, { "epoch": 0.76, "learning_rate": 7.034153743626846e-07, "loss": 0.9581, "step": 40419 }, { "epoch": 0.76, "learning_rate": 7.033091462968756e-07, "loss": 1.0084, "step": 40420 }, { "epoch": 0.76, "learning_rate": 7.032029249398551e-07, "loss": 0.8194, "step": 40421 }, { "epoch": 0.76, "learning_rate": 7.030967102920197e-07, "loss": 0.9488, "step": 40422 }, { "epoch": 0.76, "learning_rate": 7.029905023537661e-07, "loss": 0.9092, "step": 40423 }, { "epoch": 0.76, "learning_rate": 7.028843011254907e-07, "loss": 0.9619, "step": 40424 }, { "epoch": 0.76, "learning_rate": 7.027781066075914e-07, "loss": 1.0698, "step": 40425 }, { "epoch": 0.76, "learning_rate": 7.026719188004616e-07, "loss": 0.9768, "step": 40426 }, { "epoch": 0.76, "learning_rate": 7.025657377045017e-07, "loss": 0.8086, "step": 40427 }, { "epoch": 0.76, "learning_rate": 7.024595633201051e-07, "loss": 0.8085, "step": 40428 }, { "epoch": 0.76, "learning_rate": 7.023533956476697e-07, "loss": 0.7081, "step": 40429 }, { "epoch": 0.76, "learning_rate": 7.022472346875913e-07, "loss": 0.9246, "step": 40430 }, { "epoch": 0.76, "learning_rate": 7.021410804402667e-07, "loss": 1.0479, "step": 40431 }, { "epoch": 0.76, "learning_rate": 7.020349329060921e-07, "loss": 0.9525, "step": 40432 }, { "epoch": 0.76, "learning_rate": 7.019287920854642e-07, "loss": 0.881, "step": 40433 }, { "epoch": 0.76, "learning_rate": 7.018226579787796e-07, "loss": 0.8735, "step": 40434 }, { "epoch": 0.76, "learning_rate": 7.017165305864326e-07, "loss": 0.8906, "step": 40435 }, { "epoch": 0.76, "learning_rate": 7.016104099088217e-07, "loss": 1.0173, "step": 40436 }, { "epoch": 0.76, "learning_rate": 7.015042959463431e-07, "loss": 1.0216, "step": 40437 }, { "epoch": 0.76, "learning_rate": 7.013981886993909e-07, "loss": 0.9183, "step": 40438 }, { "epoch": 0.76, "learning_rate": 7.012920881683641e-07, "loss": 0.9643, "step": 40439 }, { "epoch": 0.76, "learning_rate": 7.01185994353657e-07, "loss": 0.7371, "step": 40440 }, { "epoch": 0.76, "learning_rate": 7.010799072556659e-07, "loss": 0.7243, "step": 40441 }, { "epoch": 0.76, "learning_rate": 7.009738268747876e-07, "loss": 0.8746, "step": 40442 }, { "epoch": 0.76, "learning_rate": 7.008677532114175e-07, "loss": 0.941, "step": 40443 }, { "epoch": 0.76, "learning_rate": 7.007616862659525e-07, "loss": 1.068, "step": 40444 }, { "epoch": 0.76, "learning_rate": 7.006556260387879e-07, "loss": 0.8159, "step": 40445 }, { "epoch": 0.76, "learning_rate": 7.005495725303207e-07, "loss": 0.8967, "step": 40446 }, { "epoch": 0.76, "learning_rate": 7.004435257409447e-07, "loss": 0.8935, "step": 40447 }, { "epoch": 0.76, "learning_rate": 7.003374856710593e-07, "loss": 0.8694, "step": 40448 }, { "epoch": 0.76, "learning_rate": 7.002314523210574e-07, "loss": 0.9681, "step": 40449 }, { "epoch": 0.76, "learning_rate": 7.001254256913362e-07, "loss": 0.9037, "step": 40450 }, { "epoch": 0.76, "learning_rate": 7.000194057822915e-07, "loss": 0.863, "step": 40451 }, { "epoch": 0.76, "learning_rate": 6.999133925943191e-07, "loss": 0.7929, "step": 40452 }, { "epoch": 0.76, "learning_rate": 6.998073861278151e-07, "loss": 0.7589, "step": 40453 }, { "epoch": 0.76, "learning_rate": 6.99701386383175e-07, "loss": 1.1273, "step": 40454 }, { "epoch": 0.76, "learning_rate": 6.995953933607954e-07, "loss": 1.0674, "step": 40455 }, { "epoch": 0.76, "learning_rate": 6.9948940706107e-07, "loss": 1.1224, "step": 40456 }, { "epoch": 0.76, "learning_rate": 6.993834274843966e-07, "loss": 1.0905, "step": 40457 }, { "epoch": 0.76, "learning_rate": 6.992774546311709e-07, "loss": 1.0322, "step": 40458 }, { "epoch": 0.76, "learning_rate": 6.991714885017867e-07, "loss": 1.051, "step": 40459 }, { "epoch": 0.76, "learning_rate": 6.990655290966424e-07, "loss": 0.7658, "step": 40460 }, { "epoch": 0.76, "learning_rate": 6.989595764161314e-07, "loss": 1.2268, "step": 40461 }, { "epoch": 0.76, "learning_rate": 6.988536304606502e-07, "loss": 1.0331, "step": 40462 }, { "epoch": 0.76, "learning_rate": 6.987476912305943e-07, "loss": 0.9604, "step": 40463 }, { "epoch": 0.76, "learning_rate": 6.986417587263594e-07, "loss": 0.911, "step": 40464 }, { "epoch": 0.76, "learning_rate": 6.985358329483408e-07, "loss": 0.8148, "step": 40465 }, { "epoch": 0.76, "learning_rate": 6.984299138969341e-07, "loss": 0.8771, "step": 40466 }, { "epoch": 0.76, "learning_rate": 6.983240015725357e-07, "loss": 0.7228, "step": 40467 }, { "epoch": 0.76, "learning_rate": 6.982180959755386e-07, "loss": 0.7188, "step": 40468 }, { "epoch": 0.76, "learning_rate": 6.981121971063415e-07, "loss": 0.9856, "step": 40469 }, { "epoch": 0.76, "learning_rate": 6.980063049653376e-07, "loss": 0.8299, "step": 40470 }, { "epoch": 0.76, "learning_rate": 6.979004195529226e-07, "loss": 0.9018, "step": 40471 }, { "epoch": 0.76, "learning_rate": 6.977945408694925e-07, "loss": 0.799, "step": 40472 }, { "epoch": 0.76, "learning_rate": 6.976886689154422e-07, "loss": 0.5983, "step": 40473 }, { "epoch": 0.76, "learning_rate": 6.975828036911672e-07, "loss": 0.9516, "step": 40474 }, { "epoch": 0.76, "learning_rate": 6.974769451970625e-07, "loss": 1.0042, "step": 40475 }, { "epoch": 0.76, "learning_rate": 6.973710934335245e-07, "loss": 1.0773, "step": 40476 }, { "epoch": 0.76, "learning_rate": 6.972652484009462e-07, "loss": 0.9382, "step": 40477 }, { "epoch": 0.76, "learning_rate": 6.97159410099725e-07, "loss": 0.7308, "step": 40478 }, { "epoch": 0.76, "learning_rate": 6.97053578530256e-07, "loss": 0.842, "step": 40479 }, { "epoch": 0.76, "learning_rate": 6.96947753692932e-07, "loss": 0.787, "step": 40480 }, { "epoch": 0.76, "learning_rate": 6.968419355881512e-07, "loss": 1.0585, "step": 40481 }, { "epoch": 0.76, "learning_rate": 6.967361242163068e-07, "loss": 1.1381, "step": 40482 }, { "epoch": 0.76, "learning_rate": 6.966303195777943e-07, "loss": 0.7528, "step": 40483 }, { "epoch": 0.76, "learning_rate": 6.96524521673009e-07, "loss": 0.7689, "step": 40484 }, { "epoch": 0.76, "learning_rate": 6.964187305023459e-07, "loss": 0.6954, "step": 40485 }, { "epoch": 0.76, "learning_rate": 6.963129460661996e-07, "loss": 0.929, "step": 40486 }, { "epoch": 0.76, "learning_rate": 6.96207168364966e-07, "loss": 1.2747, "step": 40487 }, { "epoch": 0.76, "learning_rate": 6.9610139739904e-07, "loss": 0.8132, "step": 40488 }, { "epoch": 0.76, "learning_rate": 6.959956331688144e-07, "loss": 0.8821, "step": 40489 }, { "epoch": 0.76, "learning_rate": 6.958898756746877e-07, "loss": 0.8557, "step": 40490 }, { "epoch": 0.76, "learning_rate": 6.957841249170516e-07, "loss": 0.9968, "step": 40491 }, { "epoch": 0.76, "learning_rate": 6.956783808963027e-07, "loss": 0.7176, "step": 40492 }, { "epoch": 0.76, "learning_rate": 6.955726436128351e-07, "loss": 0.96, "step": 40493 }, { "epoch": 0.76, "learning_rate": 6.954669130670441e-07, "loss": 1.0801, "step": 40494 }, { "epoch": 0.76, "learning_rate": 6.953611892593243e-07, "loss": 0.9725, "step": 40495 }, { "epoch": 0.76, "learning_rate": 6.952554721900706e-07, "loss": 0.8893, "step": 40496 }, { "epoch": 0.76, "learning_rate": 6.951497618596783e-07, "loss": 0.8661, "step": 40497 }, { "epoch": 0.76, "learning_rate": 6.9504405826854e-07, "loss": 0.8796, "step": 40498 }, { "epoch": 0.76, "learning_rate": 6.949383614170524e-07, "loss": 0.8882, "step": 40499 }, { "epoch": 0.76, "learning_rate": 6.948326713056106e-07, "loss": 0.934, "step": 40500 }, { "epoch": 0.76, "learning_rate": 6.947269879346072e-07, "loss": 0.8089, "step": 40501 }, { "epoch": 0.76, "learning_rate": 6.946213113044381e-07, "loss": 0.7418, "step": 40502 }, { "epoch": 0.76, "learning_rate": 6.945156414154977e-07, "loss": 0.8503, "step": 40503 }, { "epoch": 0.76, "learning_rate": 6.944099782681804e-07, "loss": 0.8033, "step": 40504 }, { "epoch": 0.76, "learning_rate": 6.943043218628809e-07, "loss": 0.9713, "step": 40505 }, { "epoch": 0.76, "learning_rate": 6.941986721999938e-07, "loss": 1.0811, "step": 40506 }, { "epoch": 0.76, "learning_rate": 6.940930292799142e-07, "loss": 1.0552, "step": 40507 }, { "epoch": 0.76, "learning_rate": 6.939873931030344e-07, "loss": 0.9062, "step": 40508 }, { "epoch": 0.76, "learning_rate": 6.938817636697518e-07, "loss": 0.8826, "step": 40509 }, { "epoch": 0.76, "learning_rate": 6.937761409804586e-07, "loss": 0.8607, "step": 40510 }, { "epoch": 0.76, "learning_rate": 6.936705250355497e-07, "loss": 0.8177, "step": 40511 }, { "epoch": 0.76, "learning_rate": 6.935649158354199e-07, "loss": 1.0198, "step": 40512 }, { "epoch": 0.76, "learning_rate": 6.934593133804632e-07, "loss": 1.0106, "step": 40513 }, { "epoch": 0.76, "learning_rate": 6.933537176710739e-07, "loss": 1.0388, "step": 40514 }, { "epoch": 0.76, "learning_rate": 6.932481287076468e-07, "loss": 0.7833, "step": 40515 }, { "epoch": 0.76, "learning_rate": 6.931425464905761e-07, "loss": 0.9294, "step": 40516 }, { "epoch": 0.76, "learning_rate": 6.930369710202545e-07, "loss": 0.7303, "step": 40517 }, { "epoch": 0.76, "learning_rate": 6.92931402297079e-07, "loss": 1.1042, "step": 40518 }, { "epoch": 0.76, "learning_rate": 6.928258403214414e-07, "loss": 1.0419, "step": 40519 }, { "epoch": 0.76, "learning_rate": 6.927202850937359e-07, "loss": 0.8545, "step": 40520 }, { "epoch": 0.76, "learning_rate": 6.926147366143591e-07, "loss": 0.8422, "step": 40521 }, { "epoch": 0.76, "learning_rate": 6.925091948837026e-07, "loss": 0.9344, "step": 40522 }, { "epoch": 0.76, "learning_rate": 6.924036599021611e-07, "loss": 0.662, "step": 40523 }, { "epoch": 0.76, "learning_rate": 6.922981316701294e-07, "loss": 1.106, "step": 40524 }, { "epoch": 0.76, "learning_rate": 6.921926101880005e-07, "loss": 0.7526, "step": 40525 }, { "epoch": 0.76, "learning_rate": 6.920870954561695e-07, "loss": 0.9891, "step": 40526 }, { "epoch": 0.76, "learning_rate": 6.919815874750296e-07, "loss": 0.8786, "step": 40527 }, { "epoch": 0.76, "learning_rate": 6.918760862449759e-07, "loss": 0.9501, "step": 40528 }, { "epoch": 0.76, "learning_rate": 6.917705917663997e-07, "loss": 0.7151, "step": 40529 }, { "epoch": 0.76, "learning_rate": 6.916651040396982e-07, "loss": 0.7813, "step": 40530 }, { "epoch": 0.76, "learning_rate": 6.915596230652633e-07, "loss": 1.0352, "step": 40531 }, { "epoch": 0.76, "learning_rate": 6.914541488434893e-07, "loss": 0.9569, "step": 40532 }, { "epoch": 0.76, "learning_rate": 6.913486813747697e-07, "loss": 0.9418, "step": 40533 }, { "epoch": 0.76, "learning_rate": 6.912432206594988e-07, "loss": 0.7526, "step": 40534 }, { "epoch": 0.76, "learning_rate": 6.911377666980704e-07, "loss": 0.7522, "step": 40535 }, { "epoch": 0.76, "learning_rate": 6.91032319490878e-07, "loss": 0.9175, "step": 40536 }, { "epoch": 0.76, "learning_rate": 6.909268790383164e-07, "loss": 0.9862, "step": 40537 }, { "epoch": 0.76, "learning_rate": 6.908214453407766e-07, "loss": 1.0826, "step": 40538 }, { "epoch": 0.76, "learning_rate": 6.907160183986555e-07, "loss": 0.8723, "step": 40539 }, { "epoch": 0.76, "learning_rate": 6.906105982123448e-07, "loss": 0.8564, "step": 40540 }, { "epoch": 0.76, "learning_rate": 6.905051847822377e-07, "loss": 0.8371, "step": 40541 }, { "epoch": 0.76, "learning_rate": 6.903997781087307e-07, "loss": 0.6705, "step": 40542 }, { "epoch": 0.76, "learning_rate": 6.902943781922141e-07, "loss": 1.0532, "step": 40543 }, { "epoch": 0.76, "learning_rate": 6.901889850330835e-07, "loss": 1.0299, "step": 40544 }, { "epoch": 0.76, "learning_rate": 6.900835986317311e-07, "loss": 0.9332, "step": 40545 }, { "epoch": 0.76, "learning_rate": 6.899782189885512e-07, "loss": 0.8493, "step": 40546 }, { "epoch": 0.76, "learning_rate": 6.898728461039372e-07, "loss": 0.9647, "step": 40547 }, { "epoch": 0.77, "learning_rate": 6.897674799782824e-07, "loss": 0.7982, "step": 40548 }, { "epoch": 0.77, "learning_rate": 6.896621206119814e-07, "loss": 0.8506, "step": 40549 }, { "epoch": 0.77, "learning_rate": 6.895567680054249e-07, "loss": 0.9584, "step": 40550 }, { "epoch": 0.77, "learning_rate": 6.894514221590093e-07, "loss": 0.8961, "step": 40551 }, { "epoch": 0.77, "learning_rate": 6.893460830731258e-07, "loss": 0.9896, "step": 40552 }, { "epoch": 0.77, "learning_rate": 6.892407507481685e-07, "loss": 1.0375, "step": 40553 }, { "epoch": 0.77, "learning_rate": 6.891354251845309e-07, "loss": 0.5376, "step": 40554 }, { "epoch": 0.77, "learning_rate": 6.89030106382606e-07, "loss": 0.888, "step": 40555 }, { "epoch": 0.77, "learning_rate": 6.889247943427871e-07, "loss": 1.1052, "step": 40556 }, { "epoch": 0.77, "learning_rate": 6.888194890654675e-07, "loss": 0.9785, "step": 40557 }, { "epoch": 0.77, "learning_rate": 6.887141905510414e-07, "loss": 0.8662, "step": 40558 }, { "epoch": 0.77, "learning_rate": 6.88608898799899e-07, "loss": 0.8763, "step": 40559 }, { "epoch": 0.77, "learning_rate": 6.885036138124374e-07, "loss": 0.6968, "step": 40560 }, { "epoch": 0.77, "learning_rate": 6.883983355890467e-07, "loss": 0.7892, "step": 40561 }, { "epoch": 0.77, "learning_rate": 6.882930641301205e-07, "loss": 1.1001, "step": 40562 }, { "epoch": 0.77, "learning_rate": 6.881877994360539e-07, "loss": 1.023, "step": 40563 }, { "epoch": 0.77, "learning_rate": 6.880825415072375e-07, "loss": 0.8599, "step": 40564 }, { "epoch": 0.77, "learning_rate": 6.879772903440656e-07, "loss": 0.821, "step": 40565 }, { "epoch": 0.77, "learning_rate": 6.87872045946931e-07, "loss": 0.7727, "step": 40566 }, { "epoch": 0.77, "learning_rate": 6.877668083162264e-07, "loss": 0.9203, "step": 40567 }, { "epoch": 0.77, "learning_rate": 6.876615774523451e-07, "loss": 1.0136, "step": 40568 }, { "epoch": 0.77, "learning_rate": 6.875563533556801e-07, "loss": 1.1082, "step": 40569 }, { "epoch": 0.77, "learning_rate": 6.874511360266245e-07, "loss": 0.7957, "step": 40570 }, { "epoch": 0.77, "learning_rate": 6.873459254655696e-07, "loss": 0.7, "step": 40571 }, { "epoch": 0.77, "learning_rate": 6.872407216729107e-07, "loss": 0.8351, "step": 40572 }, { "epoch": 0.77, "learning_rate": 6.871355246490389e-07, "loss": 0.8282, "step": 40573 }, { "epoch": 0.77, "learning_rate": 6.870303343943472e-07, "loss": 0.8712, "step": 40574 }, { "epoch": 0.77, "learning_rate": 6.869251509092287e-07, "loss": 1.0345, "step": 40575 }, { "epoch": 0.77, "learning_rate": 6.86819974194076e-07, "loss": 0.7858, "step": 40576 }, { "epoch": 0.77, "learning_rate": 6.867148042492822e-07, "loss": 0.7369, "step": 40577 }, { "epoch": 0.77, "learning_rate": 6.866096410752393e-07, "loss": 0.8889, "step": 40578 }, { "epoch": 0.77, "learning_rate": 6.865044846723415e-07, "loss": 0.9449, "step": 40579 }, { "epoch": 0.77, "learning_rate": 6.863993350409786e-07, "loss": 0.9561, "step": 40580 }, { "epoch": 0.77, "learning_rate": 6.862941921815469e-07, "loss": 1.0563, "step": 40581 }, { "epoch": 0.77, "learning_rate": 6.861890560944359e-07, "loss": 0.7927, "step": 40582 }, { "epoch": 0.77, "learning_rate": 6.860839267800387e-07, "loss": 0.71, "step": 40583 }, { "epoch": 0.77, "learning_rate": 6.859788042387503e-07, "loss": 0.9374, "step": 40584 }, { "epoch": 0.77, "learning_rate": 6.858736884709602e-07, "loss": 0.8218, "step": 40585 }, { "epoch": 0.77, "learning_rate": 6.857685794770624e-07, "loss": 0.9007, "step": 40586 }, { "epoch": 0.77, "learning_rate": 6.856634772574491e-07, "loss": 1.0733, "step": 40587 }, { "epoch": 0.77, "learning_rate": 6.855583818125128e-07, "loss": 1.1188, "step": 40588 }, { "epoch": 0.77, "learning_rate": 6.854532931426458e-07, "loss": 0.7128, "step": 40589 }, { "epoch": 0.77, "learning_rate": 6.853482112482404e-07, "loss": 1.0091, "step": 40590 }, { "epoch": 0.77, "learning_rate": 6.852431361296902e-07, "loss": 0.9547, "step": 40591 }, { "epoch": 0.77, "learning_rate": 6.851380677873848e-07, "loss": 0.7785, "step": 40592 }, { "epoch": 0.77, "learning_rate": 6.850330062217198e-07, "loss": 0.9327, "step": 40593 }, { "epoch": 0.77, "learning_rate": 6.84927951433085e-07, "loss": 1.0157, "step": 40594 }, { "epoch": 0.77, "learning_rate": 6.848229034218737e-07, "loss": 0.9362, "step": 40595 }, { "epoch": 0.77, "learning_rate": 6.847178621884778e-07, "loss": 0.8536, "step": 40596 }, { "epoch": 0.77, "learning_rate": 6.8461282773329e-07, "loss": 1.0099, "step": 40597 }, { "epoch": 0.77, "learning_rate": 6.845078000567024e-07, "loss": 0.705, "step": 40598 }, { "epoch": 0.77, "learning_rate": 6.844027791591065e-07, "loss": 1.1384, "step": 40599 }, { "epoch": 0.77, "learning_rate": 6.84297765040896e-07, "loss": 1.0065, "step": 40600 }, { "epoch": 0.77, "learning_rate": 6.841927577024607e-07, "loss": 0.9241, "step": 40601 }, { "epoch": 0.77, "learning_rate": 6.840877571441951e-07, "loss": 0.8518, "step": 40602 }, { "epoch": 0.77, "learning_rate": 6.839827633664894e-07, "loss": 0.8112, "step": 40603 }, { "epoch": 0.77, "learning_rate": 6.83877776369736e-07, "loss": 0.6883, "step": 40604 }, { "epoch": 0.77, "learning_rate": 6.837727961543286e-07, "loss": 1.0941, "step": 40605 }, { "epoch": 0.77, "learning_rate": 6.83667822720657e-07, "loss": 0.9566, "step": 40606 }, { "epoch": 0.77, "learning_rate": 6.83562856069114e-07, "loss": 0.9414, "step": 40607 }, { "epoch": 0.77, "learning_rate": 6.834578962000918e-07, "loss": 1.0591, "step": 40608 }, { "epoch": 0.77, "learning_rate": 6.833529431139821e-07, "loss": 0.8502, "step": 40609 }, { "epoch": 0.77, "learning_rate": 6.832479968111769e-07, "loss": 0.7981, "step": 40610 }, { "epoch": 0.77, "learning_rate": 6.831430572920677e-07, "loss": 0.8561, "step": 40611 }, { "epoch": 0.77, "learning_rate": 6.830381245570478e-07, "loss": 1.1403, "step": 40612 }, { "epoch": 0.77, "learning_rate": 6.829331986065061e-07, "loss": 1.0614, "step": 40613 }, { "epoch": 0.77, "learning_rate": 6.828282794408375e-07, "loss": 0.9934, "step": 40614 }, { "epoch": 0.77, "learning_rate": 6.827233670604317e-07, "loss": 0.8583, "step": 40615 }, { "epoch": 0.77, "learning_rate": 6.826184614656811e-07, "loss": 0.7516, "step": 40616 }, { "epoch": 0.77, "learning_rate": 6.825135626569776e-07, "loss": 0.7521, "step": 40617 }, { "epoch": 0.77, "learning_rate": 6.824086706347127e-07, "loss": 1.0017, "step": 40618 }, { "epoch": 0.77, "learning_rate": 6.823037853992779e-07, "loss": 1.085, "step": 40619 }, { "epoch": 0.77, "learning_rate": 6.821989069510651e-07, "loss": 0.798, "step": 40620 }, { "epoch": 0.77, "learning_rate": 6.820940352904667e-07, "loss": 0.8367, "step": 40621 }, { "epoch": 0.77, "learning_rate": 6.819891704178718e-07, "loss": 0.9333, "step": 40622 }, { "epoch": 0.77, "learning_rate": 6.818843123336754e-07, "loss": 0.7289, "step": 40623 }, { "epoch": 0.77, "learning_rate": 6.817794610382661e-07, "loss": 0.8902, "step": 40624 }, { "epoch": 0.77, "learning_rate": 6.816746165320362e-07, "loss": 1.0688, "step": 40625 }, { "epoch": 0.77, "learning_rate": 6.815697788153786e-07, "loss": 0.8964, "step": 40626 }, { "epoch": 0.77, "learning_rate": 6.814649478886831e-07, "loss": 0.748, "step": 40627 }, { "epoch": 0.77, "learning_rate": 6.813601237523418e-07, "loss": 0.9706, "step": 40628 }, { "epoch": 0.77, "learning_rate": 6.812553064067462e-07, "loss": 0.7619, "step": 40629 }, { "epoch": 0.77, "learning_rate": 6.811504958522871e-07, "loss": 1.0001, "step": 40630 }, { "epoch": 0.77, "learning_rate": 6.810456920893565e-07, "loss": 0.9679, "step": 40631 }, { "epoch": 0.77, "learning_rate": 6.809408951183458e-07, "loss": 0.6908, "step": 40632 }, { "epoch": 0.77, "learning_rate": 6.808361049396464e-07, "loss": 0.9144, "step": 40633 }, { "epoch": 0.77, "learning_rate": 6.807313215536476e-07, "loss": 0.9028, "step": 40634 }, { "epoch": 0.77, "learning_rate": 6.806265449607441e-07, "loss": 0.9853, "step": 40635 }, { "epoch": 0.77, "learning_rate": 6.805217751613244e-07, "loss": 1.0665, "step": 40636 }, { "epoch": 0.77, "learning_rate": 6.804170121557808e-07, "loss": 1.0685, "step": 40637 }, { "epoch": 0.77, "learning_rate": 6.803122559445042e-07, "loss": 0.7773, "step": 40638 }, { "epoch": 0.77, "learning_rate": 6.802075065278857e-07, "loss": 0.9029, "step": 40639 }, { "epoch": 0.77, "learning_rate": 6.801027639063165e-07, "loss": 0.8166, "step": 40640 }, { "epoch": 0.77, "learning_rate": 6.79998028080188e-07, "loss": 0.8325, "step": 40641 }, { "epoch": 0.77, "learning_rate": 6.798932990498916e-07, "loss": 0.7893, "step": 40642 }, { "epoch": 0.77, "learning_rate": 6.797885768158163e-07, "loss": 1.0424, "step": 40643 }, { "epoch": 0.77, "learning_rate": 6.796838613783565e-07, "loss": 0.9729, "step": 40644 }, { "epoch": 0.77, "learning_rate": 6.795791527379003e-07, "loss": 0.7924, "step": 40645 }, { "epoch": 0.77, "learning_rate": 6.794744508948393e-07, "loss": 0.7135, "step": 40646 }, { "epoch": 0.77, "learning_rate": 6.79369755849566e-07, "loss": 0.7819, "step": 40647 }, { "epoch": 0.77, "learning_rate": 6.792650676024696e-07, "loss": 0.8339, "step": 40648 }, { "epoch": 0.77, "learning_rate": 6.791603861539414e-07, "loss": 1.0386, "step": 40649 }, { "epoch": 0.77, "learning_rate": 6.790557115043728e-07, "loss": 1.1644, "step": 40650 }, { "epoch": 0.77, "learning_rate": 6.789510436541544e-07, "loss": 1.0919, "step": 40651 }, { "epoch": 0.77, "learning_rate": 6.788463826036768e-07, "loss": 0.7347, "step": 40652 }, { "epoch": 0.77, "learning_rate": 6.787417283533309e-07, "loss": 0.8266, "step": 40653 }, { "epoch": 0.77, "learning_rate": 6.786370809035084e-07, "loss": 0.593, "step": 40654 }, { "epoch": 0.77, "learning_rate": 6.785324402545975e-07, "loss": 1.0463, "step": 40655 }, { "epoch": 0.77, "learning_rate": 6.784278064069925e-07, "loss": 0.9364, "step": 40656 }, { "epoch": 0.77, "learning_rate": 6.783231793610812e-07, "loss": 1.1035, "step": 40657 }, { "epoch": 0.77, "learning_rate": 6.782185591172555e-07, "loss": 0.8345, "step": 40658 }, { "epoch": 0.77, "learning_rate": 6.781139456759056e-07, "loss": 0.9454, "step": 40659 }, { "epoch": 0.77, "learning_rate": 6.780093390374223e-07, "loss": 0.7036, "step": 40660 }, { "epoch": 0.77, "learning_rate": 6.779047392021964e-07, "loss": 0.9129, "step": 40661 }, { "epoch": 0.77, "learning_rate": 6.778001461706185e-07, "loss": 1.0214, "step": 40662 }, { "epoch": 0.77, "learning_rate": 6.776955599430796e-07, "loss": 1.1088, "step": 40663 }, { "epoch": 0.77, "learning_rate": 6.775909805199682e-07, "loss": 0.8671, "step": 40664 }, { "epoch": 0.77, "learning_rate": 6.774864079016777e-07, "loss": 0.9329, "step": 40665 }, { "epoch": 0.77, "learning_rate": 6.773818420885961e-07, "loss": 0.7828, "step": 40666 }, { "epoch": 0.77, "learning_rate": 6.772772830811141e-07, "loss": 1.0913, "step": 40667 }, { "epoch": 0.77, "learning_rate": 6.771727308796247e-07, "loss": 1.0092, "step": 40668 }, { "epoch": 0.77, "learning_rate": 6.770681854845154e-07, "loss": 1.0413, "step": 40669 }, { "epoch": 0.77, "learning_rate": 6.769636468961777e-07, "loss": 0.8466, "step": 40670 }, { "epoch": 0.77, "learning_rate": 6.768591151150017e-07, "loss": 0.8535, "step": 40671 }, { "epoch": 0.77, "learning_rate": 6.767545901413777e-07, "loss": 0.7357, "step": 40672 }, { "epoch": 0.77, "learning_rate": 6.766500719756966e-07, "loss": 0.7985, "step": 40673 }, { "epoch": 0.77, "learning_rate": 6.76545560618348e-07, "loss": 0.9124, "step": 40674 }, { "epoch": 0.77, "learning_rate": 6.764410560697233e-07, "loss": 1.0662, "step": 40675 }, { "epoch": 0.77, "learning_rate": 6.7633655833021e-07, "loss": 0.7244, "step": 40676 }, { "epoch": 0.77, "learning_rate": 6.762320674002018e-07, "loss": 0.8379, "step": 40677 }, { "epoch": 0.77, "learning_rate": 6.761275832800862e-07, "loss": 0.9577, "step": 40678 }, { "epoch": 0.77, "learning_rate": 6.760231059702544e-07, "loss": 0.6706, "step": 40679 }, { "epoch": 0.77, "learning_rate": 6.759186354710964e-07, "loss": 0.7679, "step": 40680 }, { "epoch": 0.77, "learning_rate": 6.758141717830021e-07, "loss": 1.0597, "step": 40681 }, { "epoch": 0.77, "learning_rate": 6.757097149063621e-07, "loss": 1.0106, "step": 40682 }, { "epoch": 0.77, "learning_rate": 6.75605264841566e-07, "loss": 0.7884, "step": 40683 }, { "epoch": 0.77, "learning_rate": 6.755008215890044e-07, "loss": 1.025, "step": 40684 }, { "epoch": 0.77, "learning_rate": 6.753963851490656e-07, "loss": 0.8529, "step": 40685 }, { "epoch": 0.77, "learning_rate": 6.752919555221421e-07, "loss": 0.8684, "step": 40686 }, { "epoch": 0.77, "learning_rate": 6.751875327086216e-07, "loss": 0.9075, "step": 40687 }, { "epoch": 0.77, "learning_rate": 6.750831167088945e-07, "loss": 0.9731, "step": 40688 }, { "epoch": 0.77, "learning_rate": 6.749787075233522e-07, "loss": 0.9557, "step": 40689 }, { "epoch": 0.77, "learning_rate": 6.748743051523829e-07, "loss": 0.8586, "step": 40690 }, { "epoch": 0.77, "learning_rate": 6.747699095963769e-07, "loss": 0.86, "step": 40691 }, { "epoch": 0.77, "learning_rate": 6.746655208557243e-07, "loss": 0.7262, "step": 40692 }, { "epoch": 0.77, "learning_rate": 6.745611389308146e-07, "loss": 1.0298, "step": 40693 }, { "epoch": 0.77, "learning_rate": 6.744567638220376e-07, "loss": 1.0106, "step": 40694 }, { "epoch": 0.77, "learning_rate": 6.743523955297832e-07, "loss": 0.9282, "step": 40695 }, { "epoch": 0.77, "learning_rate": 6.742480340544414e-07, "loss": 0.9153, "step": 40696 }, { "epoch": 0.77, "learning_rate": 6.741436793964002e-07, "loss": 0.7963, "step": 40697 }, { "epoch": 0.77, "learning_rate": 6.74039331556052e-07, "loss": 0.8849, "step": 40698 }, { "epoch": 0.77, "learning_rate": 6.739349905337842e-07, "loss": 0.9758, "step": 40699 }, { "epoch": 0.77, "learning_rate": 6.73830656329987e-07, "loss": 0.9813, "step": 40700 }, { "epoch": 0.77, "learning_rate": 6.737263289450504e-07, "loss": 0.8159, "step": 40701 }, { "epoch": 0.77, "learning_rate": 6.736220083793635e-07, "loss": 0.7917, "step": 40702 }, { "epoch": 0.77, "learning_rate": 6.735176946333161e-07, "loss": 0.8106, "step": 40703 }, { "epoch": 0.77, "learning_rate": 6.734133877072977e-07, "loss": 0.9304, "step": 40704 }, { "epoch": 0.77, "learning_rate": 6.733090876016981e-07, "loss": 0.9199, "step": 40705 }, { "epoch": 0.77, "learning_rate": 6.732047943169054e-07, "loss": 1.0482, "step": 40706 }, { "epoch": 0.77, "learning_rate": 6.731005078533113e-07, "loss": 1.1078, "step": 40707 }, { "epoch": 0.77, "learning_rate": 6.729962282113029e-07, "loss": 0.829, "step": 40708 }, { "epoch": 0.77, "learning_rate": 6.728919553912699e-07, "loss": 0.9541, "step": 40709 }, { "epoch": 0.77, "learning_rate": 6.727876893936039e-07, "loss": 0.8204, "step": 40710 }, { "epoch": 0.77, "learning_rate": 6.726834302186919e-07, "loss": 1.0486, "step": 40711 }, { "epoch": 0.77, "learning_rate": 6.725791778669241e-07, "loss": 0.9401, "step": 40712 }, { "epoch": 0.77, "learning_rate": 6.724749323386892e-07, "loss": 1.015, "step": 40713 }, { "epoch": 0.77, "learning_rate": 6.723706936343772e-07, "loss": 0.7632, "step": 40714 }, { "epoch": 0.77, "learning_rate": 6.72266461754377e-07, "loss": 1.0576, "step": 40715 }, { "epoch": 0.77, "learning_rate": 6.721622366990777e-07, "loss": 0.8243, "step": 40716 }, { "epoch": 0.77, "learning_rate": 6.720580184688693e-07, "loss": 0.7914, "step": 40717 }, { "epoch": 0.77, "learning_rate": 6.719538070641387e-07, "loss": 0.8363, "step": 40718 }, { "epoch": 0.77, "learning_rate": 6.71849602485278e-07, "loss": 1.0353, "step": 40719 }, { "epoch": 0.77, "learning_rate": 6.717454047326743e-07, "loss": 0.881, "step": 40720 }, { "epoch": 0.77, "learning_rate": 6.716412138067169e-07, "loss": 0.8368, "step": 40721 }, { "epoch": 0.77, "learning_rate": 6.715370297077952e-07, "loss": 0.8085, "step": 40722 }, { "epoch": 0.77, "learning_rate": 6.714328524362984e-07, "loss": 0.7716, "step": 40723 }, { "epoch": 0.77, "learning_rate": 6.713286819926151e-07, "loss": 1.0223, "step": 40724 }, { "epoch": 0.77, "learning_rate": 6.712245183771346e-07, "loss": 0.9793, "step": 40725 }, { "epoch": 0.77, "learning_rate": 6.711203615902462e-07, "loss": 0.8444, "step": 40726 }, { "epoch": 0.77, "learning_rate": 6.710162116323371e-07, "loss": 0.9305, "step": 40727 }, { "epoch": 0.77, "learning_rate": 6.709120685037987e-07, "loss": 0.9732, "step": 40728 }, { "epoch": 0.77, "learning_rate": 6.708079322050176e-07, "loss": 0.8902, "step": 40729 }, { "epoch": 0.77, "learning_rate": 6.707038027363829e-07, "loss": 1.0491, "step": 40730 }, { "epoch": 0.77, "learning_rate": 6.705996800982859e-07, "loss": 0.8391, "step": 40731 }, { "epoch": 0.77, "learning_rate": 6.704955642911126e-07, "loss": 0.8761, "step": 40732 }, { "epoch": 0.77, "learning_rate": 6.70391455315253e-07, "loss": 0.8167, "step": 40733 }, { "epoch": 0.77, "learning_rate": 6.702873531710954e-07, "loss": 0.8637, "step": 40734 }, { "epoch": 0.77, "learning_rate": 6.701832578590289e-07, "loss": 0.7574, "step": 40735 }, { "epoch": 0.77, "learning_rate": 6.700791693794426e-07, "loss": 0.7817, "step": 40736 }, { "epoch": 0.77, "learning_rate": 6.699750877327232e-07, "loss": 0.9694, "step": 40737 }, { "epoch": 0.77, "learning_rate": 6.69871012919262e-07, "loss": 0.889, "step": 40738 }, { "epoch": 0.77, "learning_rate": 6.697669449394459e-07, "loss": 0.7741, "step": 40739 }, { "epoch": 0.77, "learning_rate": 6.696628837936636e-07, "loss": 1.0154, "step": 40740 }, { "epoch": 0.77, "learning_rate": 6.695588294823041e-07, "loss": 0.9677, "step": 40741 }, { "epoch": 0.77, "learning_rate": 6.694547820057559e-07, "loss": 0.9947, "step": 40742 }, { "epoch": 0.77, "learning_rate": 6.693507413644074e-07, "loss": 1.0832, "step": 40743 }, { "epoch": 0.77, "learning_rate": 6.69246707558647e-07, "loss": 1.0328, "step": 40744 }, { "epoch": 0.77, "learning_rate": 6.69142680588864e-07, "loss": 0.9528, "step": 40745 }, { "epoch": 0.77, "learning_rate": 6.690386604554447e-07, "loss": 0.982, "step": 40746 }, { "epoch": 0.77, "learning_rate": 6.689346471587804e-07, "loss": 1.0033, "step": 40747 }, { "epoch": 0.77, "learning_rate": 6.68830640699257e-07, "loss": 0.7754, "step": 40748 }, { "epoch": 0.77, "learning_rate": 6.687266410772641e-07, "loss": 0.8828, "step": 40749 }, { "epoch": 0.77, "learning_rate": 6.686226482931898e-07, "loss": 1.169, "step": 40750 }, { "epoch": 0.77, "learning_rate": 6.685186623474222e-07, "loss": 0.8928, "step": 40751 }, { "epoch": 0.77, "learning_rate": 6.684146832403499e-07, "loss": 0.9862, "step": 40752 }, { "epoch": 0.77, "learning_rate": 6.683107109723608e-07, "loss": 0.8195, "step": 40753 }, { "epoch": 0.77, "learning_rate": 6.682067455438443e-07, "loss": 0.7719, "step": 40754 }, { "epoch": 0.77, "learning_rate": 6.681027869551862e-07, "loss": 0.8297, "step": 40755 }, { "epoch": 0.77, "learning_rate": 6.679988352067767e-07, "loss": 1.1196, "step": 40756 }, { "epoch": 0.77, "learning_rate": 6.678948902990043e-07, "loss": 0.9263, "step": 40757 }, { "epoch": 0.77, "learning_rate": 6.677909522322545e-07, "loss": 0.8666, "step": 40758 }, { "epoch": 0.77, "learning_rate": 6.676870210069189e-07, "loss": 1.0617, "step": 40759 }, { "epoch": 0.77, "learning_rate": 6.675830966233826e-07, "loss": 0.7784, "step": 40760 }, { "epoch": 0.77, "learning_rate": 6.674791790820351e-07, "loss": 0.9235, "step": 40761 }, { "epoch": 0.77, "learning_rate": 6.673752683832643e-07, "loss": 0.9993, "step": 40762 }, { "epoch": 0.77, "learning_rate": 6.672713645274578e-07, "loss": 0.9388, "step": 40763 }, { "epoch": 0.77, "learning_rate": 6.671674675150038e-07, "loss": 0.6737, "step": 40764 }, { "epoch": 0.77, "learning_rate": 6.670635773462905e-07, "loss": 0.9711, "step": 40765 }, { "epoch": 0.77, "learning_rate": 6.669596940217063e-07, "loss": 0.6702, "step": 40766 }, { "epoch": 0.77, "learning_rate": 6.668558175416371e-07, "loss": 0.8196, "step": 40767 }, { "epoch": 0.77, "learning_rate": 6.667519479064733e-07, "loss": 1.1307, "step": 40768 }, { "epoch": 0.77, "learning_rate": 6.666480851166007e-07, "loss": 1.1055, "step": 40769 }, { "epoch": 0.77, "learning_rate": 6.665442291724072e-07, "loss": 0.877, "step": 40770 }, { "epoch": 0.77, "learning_rate": 6.66440380074283e-07, "loss": 1.0067, "step": 40771 }, { "epoch": 0.77, "learning_rate": 6.663365378226134e-07, "loss": 0.6366, "step": 40772 }, { "epoch": 0.77, "learning_rate": 6.662327024177869e-07, "loss": 1.0457, "step": 40773 }, { "epoch": 0.77, "learning_rate": 6.661288738601912e-07, "loss": 0.9443, "step": 40774 }, { "epoch": 0.77, "learning_rate": 6.660250521502143e-07, "loss": 1.2033, "step": 40775 }, { "epoch": 0.77, "learning_rate": 6.659212372882434e-07, "loss": 0.9199, "step": 40776 }, { "epoch": 0.77, "learning_rate": 6.658174292746664e-07, "loss": 0.7929, "step": 40777 }, { "epoch": 0.77, "learning_rate": 6.657136281098716e-07, "loss": 0.8776, "step": 40778 }, { "epoch": 0.77, "learning_rate": 6.656098337942446e-07, "loss": 0.7714, "step": 40779 }, { "epoch": 0.77, "learning_rate": 6.655060463281756e-07, "loss": 0.8046, "step": 40780 }, { "epoch": 0.77, "learning_rate": 6.654022657120502e-07, "loss": 1.1327, "step": 40781 }, { "epoch": 0.77, "learning_rate": 6.65298491946256e-07, "loss": 0.9547, "step": 40782 }, { "epoch": 0.77, "learning_rate": 6.651947250311813e-07, "loss": 0.8929, "step": 40783 }, { "epoch": 0.77, "learning_rate": 6.650909649672133e-07, "loss": 0.9097, "step": 40784 }, { "epoch": 0.77, "learning_rate": 6.649872117547393e-07, "loss": 0.9156, "step": 40785 }, { "epoch": 0.77, "learning_rate": 6.648834653941469e-07, "loss": 0.8611, "step": 40786 }, { "epoch": 0.77, "learning_rate": 6.647797258858238e-07, "loss": 0.7952, "step": 40787 }, { "epoch": 0.77, "learning_rate": 6.646759932301558e-07, "loss": 0.9838, "step": 40788 }, { "epoch": 0.77, "learning_rate": 6.645722674275326e-07, "loss": 0.8284, "step": 40789 }, { "epoch": 0.77, "learning_rate": 6.644685484783397e-07, "loss": 0.9353, "step": 40790 }, { "epoch": 0.77, "learning_rate": 6.643648363829641e-07, "loss": 0.8514, "step": 40791 }, { "epoch": 0.77, "learning_rate": 6.642611311417954e-07, "loss": 0.7313, "step": 40792 }, { "epoch": 0.77, "learning_rate": 6.641574327552189e-07, "loss": 1.0394, "step": 40793 }, { "epoch": 0.77, "learning_rate": 6.64053741223622e-07, "loss": 1.1258, "step": 40794 }, { "epoch": 0.77, "learning_rate": 6.639500565473922e-07, "loss": 0.8722, "step": 40795 }, { "epoch": 0.77, "learning_rate": 6.638463787269165e-07, "loss": 0.9479, "step": 40796 }, { "epoch": 0.77, "learning_rate": 6.637427077625822e-07, "loss": 0.9603, "step": 40797 }, { "epoch": 0.77, "learning_rate": 6.636390436547763e-07, "loss": 0.904, "step": 40798 }, { "epoch": 0.77, "learning_rate": 6.635353864038865e-07, "loss": 0.8126, "step": 40799 }, { "epoch": 0.77, "learning_rate": 6.634317360102979e-07, "loss": 1.1412, "step": 40800 }, { "epoch": 0.77, "learning_rate": 6.633280924744006e-07, "loss": 0.8175, "step": 40801 }, { "epoch": 0.77, "learning_rate": 6.632244557965789e-07, "loss": 0.9749, "step": 40802 }, { "epoch": 0.77, "learning_rate": 6.63120825977221e-07, "loss": 0.9827, "step": 40803 }, { "epoch": 0.77, "learning_rate": 6.630172030167134e-07, "loss": 0.858, "step": 40804 }, { "epoch": 0.77, "learning_rate": 6.629135869154432e-07, "loss": 1.0064, "step": 40805 }, { "epoch": 0.77, "learning_rate": 6.628099776737973e-07, "loss": 1.1326, "step": 40806 }, { "epoch": 0.77, "learning_rate": 6.627063752921628e-07, "loss": 0.9151, "step": 40807 }, { "epoch": 0.77, "learning_rate": 6.62602779770927e-07, "loss": 0.9605, "step": 40808 }, { "epoch": 0.77, "learning_rate": 6.624991911104747e-07, "loss": 0.7967, "step": 40809 }, { "epoch": 0.77, "learning_rate": 6.623956093111955e-07, "loss": 0.9653, "step": 40810 }, { "epoch": 0.77, "learning_rate": 6.62292034373474e-07, "loss": 0.928, "step": 40811 }, { "epoch": 0.77, "learning_rate": 6.621884662976968e-07, "loss": 0.9541, "step": 40812 }, { "epoch": 0.77, "learning_rate": 6.620849050842535e-07, "loss": 0.9944, "step": 40813 }, { "epoch": 0.77, "learning_rate": 6.619813507335276e-07, "loss": 0.877, "step": 40814 }, { "epoch": 0.77, "learning_rate": 6.618778032459072e-07, "loss": 0.9254, "step": 40815 }, { "epoch": 0.77, "learning_rate": 6.617742626217785e-07, "loss": 0.8102, "step": 40816 }, { "epoch": 0.77, "learning_rate": 6.616707288615284e-07, "loss": 0.8257, "step": 40817 }, { "epoch": 0.77, "learning_rate": 6.615672019655436e-07, "loss": 0.9944, "step": 40818 }, { "epoch": 0.77, "learning_rate": 6.614636819342104e-07, "loss": 0.9978, "step": 40819 }, { "epoch": 0.77, "learning_rate": 6.613601687679163e-07, "loss": 0.6108, "step": 40820 }, { "epoch": 0.77, "learning_rate": 6.612566624670455e-07, "loss": 0.8977, "step": 40821 }, { "epoch": 0.77, "learning_rate": 6.611531630319873e-07, "loss": 0.8164, "step": 40822 }, { "epoch": 0.77, "learning_rate": 6.610496704631261e-07, "loss": 0.8272, "step": 40823 }, { "epoch": 0.77, "learning_rate": 6.60946184760849e-07, "loss": 0.9397, "step": 40824 }, { "epoch": 0.77, "learning_rate": 6.608427059255423e-07, "loss": 1.1176, "step": 40825 }, { "epoch": 0.77, "learning_rate": 6.607392339575927e-07, "loss": 0.8629, "step": 40826 }, { "epoch": 0.77, "learning_rate": 6.606357688573867e-07, "loss": 0.795, "step": 40827 }, { "epoch": 0.77, "learning_rate": 6.605323106253101e-07, "loss": 0.7711, "step": 40828 }, { "epoch": 0.77, "learning_rate": 6.604288592617499e-07, "loss": 0.7404, "step": 40829 }, { "epoch": 0.77, "learning_rate": 6.60325414767091e-07, "loss": 0.8398, "step": 40830 }, { "epoch": 0.77, "learning_rate": 6.602219771417218e-07, "loss": 1.2188, "step": 40831 }, { "epoch": 0.77, "learning_rate": 6.601185463860266e-07, "loss": 1.007, "step": 40832 }, { "epoch": 0.77, "learning_rate": 6.600151225003914e-07, "loss": 0.7392, "step": 40833 }, { "epoch": 0.77, "learning_rate": 6.59911705485205e-07, "loss": 0.6952, "step": 40834 }, { "epoch": 0.77, "learning_rate": 6.598082953408511e-07, "loss": 0.7742, "step": 40835 }, { "epoch": 0.77, "learning_rate": 6.597048920677169e-07, "loss": 1.0649, "step": 40836 }, { "epoch": 0.77, "learning_rate": 6.596014956661878e-07, "loss": 1.2028, "step": 40837 }, { "epoch": 0.77, "learning_rate": 6.594981061366504e-07, "loss": 0.8916, "step": 40838 }, { "epoch": 0.77, "learning_rate": 6.593947234794906e-07, "loss": 0.8712, "step": 40839 }, { "epoch": 0.77, "learning_rate": 6.592913476950947e-07, "loss": 0.9786, "step": 40840 }, { "epoch": 0.77, "learning_rate": 6.59187978783849e-07, "loss": 0.8641, "step": 40841 }, { "epoch": 0.77, "learning_rate": 6.590846167461373e-07, "loss": 0.8286, "step": 40842 }, { "epoch": 0.77, "learning_rate": 6.589812615823491e-07, "loss": 1.0735, "step": 40843 }, { "epoch": 0.77, "learning_rate": 6.588779132928674e-07, "loss": 0.9675, "step": 40844 }, { "epoch": 0.77, "learning_rate": 6.587745718780792e-07, "loss": 0.7393, "step": 40845 }, { "epoch": 0.77, "learning_rate": 6.586712373383703e-07, "loss": 0.8614, "step": 40846 }, { "epoch": 0.77, "learning_rate": 6.585679096741265e-07, "loss": 0.963, "step": 40847 }, { "epoch": 0.77, "learning_rate": 6.584645888857336e-07, "loss": 0.7982, "step": 40848 }, { "epoch": 0.77, "learning_rate": 6.583612749735777e-07, "loss": 0.7978, "step": 40849 }, { "epoch": 0.77, "learning_rate": 6.582579679380449e-07, "loss": 1.256, "step": 40850 }, { "epoch": 0.77, "learning_rate": 6.581546677795189e-07, "loss": 0.9597, "step": 40851 }, { "epoch": 0.77, "learning_rate": 6.580513744983883e-07, "loss": 0.9559, "step": 40852 }, { "epoch": 0.77, "learning_rate": 6.579480880950367e-07, "loss": 0.9261, "step": 40853 }, { "epoch": 0.77, "learning_rate": 6.5784480856985e-07, "loss": 0.7937, "step": 40854 }, { "epoch": 0.77, "learning_rate": 6.577415359232156e-07, "loss": 1.3656, "step": 40855 }, { "epoch": 0.77, "learning_rate": 6.57638270155517e-07, "loss": 0.9705, "step": 40856 }, { "epoch": 0.77, "learning_rate": 6.575350112671405e-07, "loss": 0.9011, "step": 40857 }, { "epoch": 0.77, "learning_rate": 6.57431759258472e-07, "loss": 0.8141, "step": 40858 }, { "epoch": 0.77, "learning_rate": 6.573285141298969e-07, "loss": 0.9456, "step": 40859 }, { "epoch": 0.77, "learning_rate": 6.572252758818004e-07, "loss": 0.8109, "step": 40860 }, { "epoch": 0.77, "learning_rate": 6.571220445145682e-07, "loss": 0.9181, "step": 40861 }, { "epoch": 0.77, "learning_rate": 6.570188200285865e-07, "loss": 1.0564, "step": 40862 }, { "epoch": 0.77, "learning_rate": 6.569156024242387e-07, "loss": 0.8859, "step": 40863 }, { "epoch": 0.77, "learning_rate": 6.568123917019132e-07, "loss": 0.9492, "step": 40864 }, { "epoch": 0.77, "learning_rate": 6.567091878619927e-07, "loss": 0.9088, "step": 40865 }, { "epoch": 0.77, "learning_rate": 6.566059909048636e-07, "loss": 0.6807, "step": 40866 }, { "epoch": 0.77, "learning_rate": 6.565028008309112e-07, "loss": 0.6589, "step": 40867 }, { "epoch": 0.77, "learning_rate": 6.563996176405208e-07, "loss": 0.9721, "step": 40868 }, { "epoch": 0.77, "learning_rate": 6.562964413340778e-07, "loss": 0.9577, "step": 40869 }, { "epoch": 0.77, "learning_rate": 6.561932719119673e-07, "loss": 0.8273, "step": 40870 }, { "epoch": 0.77, "learning_rate": 6.560901093745753e-07, "loss": 0.8853, "step": 40871 }, { "epoch": 0.77, "learning_rate": 6.559869537222848e-07, "loss": 0.89, "step": 40872 }, { "epoch": 0.77, "learning_rate": 6.558838049554841e-07, "loss": 0.7815, "step": 40873 }, { "epoch": 0.77, "learning_rate": 6.557806630745558e-07, "loss": 0.9686, "step": 40874 }, { "epoch": 0.77, "learning_rate": 6.556775280798855e-07, "loss": 1.1066, "step": 40875 }, { "epoch": 0.77, "learning_rate": 6.5557439997186e-07, "loss": 0.9464, "step": 40876 }, { "epoch": 0.77, "learning_rate": 6.554712787508624e-07, "loss": 0.8302, "step": 40877 }, { "epoch": 0.77, "learning_rate": 6.553681644172785e-07, "loss": 0.7902, "step": 40878 }, { "epoch": 0.77, "learning_rate": 6.552650569714936e-07, "loss": 0.9646, "step": 40879 }, { "epoch": 0.77, "learning_rate": 6.55161956413892e-07, "loss": 1.0372, "step": 40880 }, { "epoch": 0.77, "learning_rate": 6.550588627448592e-07, "loss": 1.0552, "step": 40881 }, { "epoch": 0.77, "learning_rate": 6.549557759647801e-07, "loss": 0.9558, "step": 40882 }, { "epoch": 0.77, "learning_rate": 6.548526960740403e-07, "loss": 1.0166, "step": 40883 }, { "epoch": 0.77, "learning_rate": 6.547496230730227e-07, "loss": 0.8033, "step": 40884 }, { "epoch": 0.77, "learning_rate": 6.546465569621146e-07, "loss": 0.958, "step": 40885 }, { "epoch": 0.77, "learning_rate": 6.545434977416993e-07, "loss": 0.9445, "step": 40886 }, { "epoch": 0.77, "learning_rate": 6.544404454121617e-07, "loss": 1.0959, "step": 40887 }, { "epoch": 0.77, "learning_rate": 6.543373999738867e-07, "loss": 0.846, "step": 40888 }, { "epoch": 0.77, "learning_rate": 6.542343614272595e-07, "loss": 0.8501, "step": 40889 }, { "epoch": 0.77, "learning_rate": 6.541313297726648e-07, "loss": 0.7407, "step": 40890 }, { "epoch": 0.77, "learning_rate": 6.540283050104868e-07, "loss": 0.896, "step": 40891 }, { "epoch": 0.77, "learning_rate": 6.539252871411114e-07, "loss": 0.821, "step": 40892 }, { "epoch": 0.77, "learning_rate": 6.538222761649207e-07, "loss": 1.1077, "step": 40893 }, { "epoch": 0.77, "learning_rate": 6.537192720823027e-07, "loss": 1.0165, "step": 40894 }, { "epoch": 0.77, "learning_rate": 6.536162748936395e-07, "loss": 0.7882, "step": 40895 }, { "epoch": 0.77, "learning_rate": 6.535132845993158e-07, "loss": 0.7982, "step": 40896 }, { "epoch": 0.77, "learning_rate": 6.534103011997187e-07, "loss": 1.0528, "step": 40897 }, { "epoch": 0.77, "learning_rate": 6.533073246952296e-07, "loss": 0.8167, "step": 40898 }, { "epoch": 0.77, "learning_rate": 6.532043550862346e-07, "loss": 0.9014, "step": 40899 }, { "epoch": 0.77, "learning_rate": 6.53101392373118e-07, "loss": 1.3339, "step": 40900 }, { "epoch": 0.77, "learning_rate": 6.529984365562642e-07, "loss": 0.9745, "step": 40901 }, { "epoch": 0.77, "learning_rate": 6.528954876360574e-07, "loss": 0.9012, "step": 40902 }, { "epoch": 0.77, "learning_rate": 6.527925456128822e-07, "loss": 0.8595, "step": 40903 }, { "epoch": 0.77, "learning_rate": 6.526896104871239e-07, "loss": 0.9597, "step": 40904 }, { "epoch": 0.77, "learning_rate": 6.525866822591645e-07, "loss": 0.8457, "step": 40905 }, { "epoch": 0.77, "learning_rate": 6.52483760929391e-07, "loss": 1.1158, "step": 40906 }, { "epoch": 0.77, "learning_rate": 6.52380846498186e-07, "loss": 0.8426, "step": 40907 }, { "epoch": 0.77, "learning_rate": 6.522779389659342e-07, "loss": 0.7521, "step": 40908 }, { "epoch": 0.77, "learning_rate": 6.5217503833302e-07, "loss": 0.8274, "step": 40909 }, { "epoch": 0.77, "learning_rate": 6.520721445998274e-07, "loss": 0.7853, "step": 40910 }, { "epoch": 0.77, "learning_rate": 6.519692577667408e-07, "loss": 0.8902, "step": 40911 }, { "epoch": 0.77, "learning_rate": 6.518663778341445e-07, "loss": 0.9104, "step": 40912 }, { "epoch": 0.77, "learning_rate": 6.517635048024229e-07, "loss": 0.8514, "step": 40913 }, { "epoch": 0.77, "learning_rate": 6.516606386719584e-07, "loss": 0.8793, "step": 40914 }, { "epoch": 0.77, "learning_rate": 6.51557779443138e-07, "loss": 1.0099, "step": 40915 }, { "epoch": 0.77, "learning_rate": 6.514549271163434e-07, "loss": 0.7181, "step": 40916 }, { "epoch": 0.77, "learning_rate": 6.513520816919585e-07, "loss": 0.8056, "step": 40917 }, { "epoch": 0.77, "learning_rate": 6.512492431703699e-07, "loss": 0.9053, "step": 40918 }, { "epoch": 0.77, "learning_rate": 6.511464115519592e-07, "loss": 1.1205, "step": 40919 }, { "epoch": 0.77, "learning_rate": 6.510435868371109e-07, "loss": 0.8799, "step": 40920 }, { "epoch": 0.77, "learning_rate": 6.509407690262093e-07, "loss": 0.7509, "step": 40921 }, { "epoch": 0.77, "learning_rate": 6.508379581196383e-07, "loss": 0.7587, "step": 40922 }, { "epoch": 0.77, "learning_rate": 6.507351541177814e-07, "loss": 0.952, "step": 40923 }, { "epoch": 0.77, "learning_rate": 6.50632357021023e-07, "loss": 1.2762, "step": 40924 }, { "epoch": 0.77, "learning_rate": 6.505295668297473e-07, "loss": 0.9593, "step": 40925 }, { "epoch": 0.77, "learning_rate": 6.504267835443359e-07, "loss": 0.92, "step": 40926 }, { "epoch": 0.77, "learning_rate": 6.503240071651759e-07, "loss": 0.8703, "step": 40927 }, { "epoch": 0.77, "learning_rate": 6.502212376926484e-07, "loss": 0.8599, "step": 40928 }, { "epoch": 0.77, "learning_rate": 6.501184751271381e-07, "loss": 0.6556, "step": 40929 }, { "epoch": 0.77, "learning_rate": 6.500157194690288e-07, "loss": 0.6859, "step": 40930 }, { "epoch": 0.77, "learning_rate": 6.499129707187041e-07, "loss": 0.9909, "step": 40931 }, { "epoch": 0.77, "learning_rate": 6.498102288765477e-07, "loss": 1.0793, "step": 40932 }, { "epoch": 0.77, "learning_rate": 6.497074939429429e-07, "loss": 0.7597, "step": 40933 }, { "epoch": 0.77, "learning_rate": 6.496047659182745e-07, "loss": 0.9455, "step": 40934 }, { "epoch": 0.77, "learning_rate": 6.495020448029238e-07, "loss": 0.9016, "step": 40935 }, { "epoch": 0.77, "learning_rate": 6.49399330597277e-07, "loss": 0.8107, "step": 40936 }, { "epoch": 0.77, "learning_rate": 6.492966233017156e-07, "loss": 0.8315, "step": 40937 }, { "epoch": 0.77, "learning_rate": 6.491939229166233e-07, "loss": 0.7375, "step": 40938 }, { "epoch": 0.77, "learning_rate": 6.490912294423854e-07, "loss": 0.8847, "step": 40939 }, { "epoch": 0.77, "learning_rate": 6.489885428793835e-07, "loss": 0.8048, "step": 40940 }, { "epoch": 0.77, "learning_rate": 6.488858632280018e-07, "loss": 0.9618, "step": 40941 }, { "epoch": 0.77, "learning_rate": 6.487831904886233e-07, "loss": 0.9031, "step": 40942 }, { "epoch": 0.77, "learning_rate": 6.486805246616317e-07, "loss": 1.0309, "step": 40943 }, { "epoch": 0.77, "learning_rate": 6.485778657474101e-07, "loss": 0.9689, "step": 40944 }, { "epoch": 0.77, "learning_rate": 6.484752137463423e-07, "loss": 0.9108, "step": 40945 }, { "epoch": 0.77, "learning_rate": 6.483725686588119e-07, "loss": 0.8031, "step": 40946 }, { "epoch": 0.77, "learning_rate": 6.482699304851999e-07, "loss": 1.0268, "step": 40947 }, { "epoch": 0.77, "learning_rate": 6.481672992258927e-07, "loss": 0.8856, "step": 40948 }, { "epoch": 0.77, "learning_rate": 6.480646748812717e-07, "loss": 1.1688, "step": 40949 }, { "epoch": 0.77, "learning_rate": 6.479620574517198e-07, "loss": 1.0211, "step": 40950 }, { "epoch": 0.77, "learning_rate": 6.478594469376212e-07, "loss": 0.7759, "step": 40951 }, { "epoch": 0.77, "learning_rate": 6.477568433393586e-07, "loss": 0.9016, "step": 40952 }, { "epoch": 0.77, "learning_rate": 6.476542466573149e-07, "loss": 0.9631, "step": 40953 }, { "epoch": 0.77, "learning_rate": 6.475516568918738e-07, "loss": 0.9174, "step": 40954 }, { "epoch": 0.77, "learning_rate": 6.474490740434187e-07, "loss": 0.9539, "step": 40955 }, { "epoch": 0.77, "learning_rate": 6.473464981123304e-07, "loss": 1.075, "step": 40956 }, { "epoch": 0.77, "learning_rate": 6.472439290989949e-07, "loss": 1.0356, "step": 40957 }, { "epoch": 0.77, "learning_rate": 6.47141367003793e-07, "loss": 0.7736, "step": 40958 }, { "epoch": 0.77, "learning_rate": 6.470388118271076e-07, "loss": 0.9525, "step": 40959 }, { "epoch": 0.77, "learning_rate": 6.469362635693241e-07, "loss": 0.937, "step": 40960 }, { "epoch": 0.77, "learning_rate": 6.46833722230823e-07, "loss": 0.7881, "step": 40961 }, { "epoch": 0.77, "learning_rate": 6.467311878119881e-07, "loss": 1.0186, "step": 40962 }, { "epoch": 0.77, "learning_rate": 6.466286603132018e-07, "loss": 0.8763, "step": 40963 }, { "epoch": 0.77, "learning_rate": 6.465261397348477e-07, "loss": 1.0548, "step": 40964 }, { "epoch": 0.77, "learning_rate": 6.464236260773077e-07, "loss": 0.84, "step": 40965 }, { "epoch": 0.77, "learning_rate": 6.463211193409655e-07, "loss": 1.0017, "step": 40966 }, { "epoch": 0.77, "learning_rate": 6.462186195262038e-07, "loss": 0.7409, "step": 40967 }, { "epoch": 0.77, "learning_rate": 6.461161266334042e-07, "loss": 1.0563, "step": 40968 }, { "epoch": 0.77, "learning_rate": 6.460136406629502e-07, "loss": 1.1154, "step": 40969 }, { "epoch": 0.77, "learning_rate": 6.459111616152247e-07, "loss": 0.8204, "step": 40970 }, { "epoch": 0.77, "learning_rate": 6.458086894906098e-07, "loss": 1.0022, "step": 40971 }, { "epoch": 0.77, "learning_rate": 6.457062242894885e-07, "loss": 1.0215, "step": 40972 }, { "epoch": 0.77, "learning_rate": 6.456037660122432e-07, "loss": 0.8353, "step": 40973 }, { "epoch": 0.77, "learning_rate": 6.455013146592573e-07, "loss": 1.0446, "step": 40974 }, { "epoch": 0.77, "learning_rate": 6.453988702309114e-07, "loss": 1.0908, "step": 40975 }, { "epoch": 0.77, "learning_rate": 6.452964327275904e-07, "loss": 0.809, "step": 40976 }, { "epoch": 0.77, "learning_rate": 6.451940021496753e-07, "loss": 0.7249, "step": 40977 }, { "epoch": 0.77, "learning_rate": 6.450915784975487e-07, "loss": 0.83, "step": 40978 }, { "epoch": 0.77, "learning_rate": 6.44989161771593e-07, "loss": 0.8231, "step": 40979 }, { "epoch": 0.77, "learning_rate": 6.448867519721913e-07, "loss": 1.0043, "step": 40980 }, { "epoch": 0.77, "learning_rate": 6.447843490997255e-07, "loss": 1.1456, "step": 40981 }, { "epoch": 0.77, "learning_rate": 6.446819531545781e-07, "loss": 0.7533, "step": 40982 }, { "epoch": 0.77, "learning_rate": 6.445795641371319e-07, "loss": 0.8816, "step": 40983 }, { "epoch": 0.77, "learning_rate": 6.444771820477674e-07, "loss": 0.9874, "step": 40984 }, { "epoch": 0.77, "learning_rate": 6.443748068868691e-07, "loss": 0.7904, "step": 40985 }, { "epoch": 0.77, "learning_rate": 6.442724386548188e-07, "loss": 0.731, "step": 40986 }, { "epoch": 0.77, "learning_rate": 6.441700773519971e-07, "loss": 1.119, "step": 40987 }, { "epoch": 0.77, "learning_rate": 6.440677229787886e-07, "loss": 0.8093, "step": 40988 }, { "epoch": 0.77, "learning_rate": 6.43965375535574e-07, "loss": 1.1105, "step": 40989 }, { "epoch": 0.77, "learning_rate": 6.438630350227354e-07, "loss": 0.9169, "step": 40990 }, { "epoch": 0.77, "learning_rate": 6.437607014406555e-07, "loss": 0.8278, "step": 40991 }, { "epoch": 0.77, "learning_rate": 6.436583747897163e-07, "loss": 0.8745, "step": 40992 }, { "epoch": 0.77, "learning_rate": 6.435560550702999e-07, "loss": 0.9469, "step": 40993 }, { "epoch": 0.77, "learning_rate": 6.43453742282788e-07, "loss": 1.1116, "step": 40994 }, { "epoch": 0.77, "learning_rate": 6.433514364275637e-07, "loss": 0.7482, "step": 40995 }, { "epoch": 0.77, "learning_rate": 6.432491375050067e-07, "loss": 0.8274, "step": 40996 }, { "epoch": 0.77, "learning_rate": 6.431468455155021e-07, "loss": 0.8359, "step": 40997 }, { "epoch": 0.77, "learning_rate": 6.430445604594296e-07, "loss": 0.9694, "step": 40998 }, { "epoch": 0.77, "learning_rate": 6.429422823371714e-07, "loss": 0.9514, "step": 40999 }, { "epoch": 0.77, "learning_rate": 6.428400111491101e-07, "loss": 0.9709, "step": 41000 }, { "epoch": 0.77, "learning_rate": 6.427377468956273e-07, "loss": 0.9033, "step": 41001 }, { "epoch": 0.77, "learning_rate": 6.426354895771045e-07, "loss": 0.8224, "step": 41002 }, { "epoch": 0.77, "learning_rate": 6.42533239193924e-07, "loss": 0.9742, "step": 41003 }, { "epoch": 0.77, "learning_rate": 6.424309957464683e-07, "loss": 0.8564, "step": 41004 }, { "epoch": 0.77, "learning_rate": 6.423287592351166e-07, "loss": 1.0373, "step": 41005 }, { "epoch": 0.77, "learning_rate": 6.422265296602531e-07, "loss": 1.0619, "step": 41006 }, { "epoch": 0.77, "learning_rate": 6.421243070222596e-07, "loss": 0.8645, "step": 41007 }, { "epoch": 0.77, "learning_rate": 6.420220913215155e-07, "loss": 1.0906, "step": 41008 }, { "epoch": 0.77, "learning_rate": 6.419198825584056e-07, "loss": 0.933, "step": 41009 }, { "epoch": 0.77, "learning_rate": 6.41817680733309e-07, "loss": 0.8153, "step": 41010 }, { "epoch": 0.77, "learning_rate": 6.417154858466083e-07, "loss": 0.7379, "step": 41011 }, { "epoch": 0.77, "learning_rate": 6.416132978986847e-07, "loss": 0.9332, "step": 41012 }, { "epoch": 0.77, "learning_rate": 6.415111168899201e-07, "loss": 0.9712, "step": 41013 }, { "epoch": 0.77, "learning_rate": 6.414089428206963e-07, "loss": 0.9254, "step": 41014 }, { "epoch": 0.77, "learning_rate": 6.413067756913944e-07, "loss": 0.92, "step": 41015 }, { "epoch": 0.77, "learning_rate": 6.412046155023969e-07, "loss": 0.9183, "step": 41016 }, { "epoch": 0.77, "learning_rate": 6.411024622540826e-07, "loss": 0.891, "step": 41017 }, { "epoch": 0.77, "learning_rate": 6.410003159468365e-07, "loss": 1.1402, "step": 41018 }, { "epoch": 0.77, "learning_rate": 6.408981765810371e-07, "loss": 1.0693, "step": 41019 }, { "epoch": 0.77, "learning_rate": 6.407960441570671e-07, "loss": 1.1291, "step": 41020 }, { "epoch": 0.77, "learning_rate": 6.406939186753077e-07, "loss": 0.9142, "step": 41021 }, { "epoch": 0.77, "learning_rate": 6.405918001361403e-07, "loss": 0.8696, "step": 41022 }, { "epoch": 0.77, "learning_rate": 6.404896885399458e-07, "loss": 0.957, "step": 41023 }, { "epoch": 0.77, "learning_rate": 6.40387583887106e-07, "loss": 0.8022, "step": 41024 }, { "epoch": 0.77, "learning_rate": 6.402854861780028e-07, "loss": 1.1168, "step": 41025 }, { "epoch": 0.77, "learning_rate": 6.401833954130149e-07, "loss": 0.8503, "step": 41026 }, { "epoch": 0.77, "learning_rate": 6.400813115925258e-07, "loss": 0.7719, "step": 41027 }, { "epoch": 0.77, "learning_rate": 6.39979234716917e-07, "loss": 1.0753, "step": 41028 }, { "epoch": 0.77, "learning_rate": 6.398771647865673e-07, "loss": 0.9362, "step": 41029 }, { "epoch": 0.77, "learning_rate": 6.397751018018606e-07, "loss": 0.9288, "step": 41030 }, { "epoch": 0.77, "learning_rate": 6.396730457631759e-07, "loss": 0.9155, "step": 41031 }, { "epoch": 0.77, "learning_rate": 6.395709966708952e-07, "loss": 0.7893, "step": 41032 }, { "epoch": 0.77, "learning_rate": 6.39468954525399e-07, "loss": 0.8873, "step": 41033 }, { "epoch": 0.77, "learning_rate": 6.393669193270688e-07, "loss": 0.8027, "step": 41034 }, { "epoch": 0.77, "learning_rate": 6.392648910762856e-07, "loss": 0.8675, "step": 41035 }, { "epoch": 0.77, "learning_rate": 6.391628697734301e-07, "loss": 0.9102, "step": 41036 }, { "epoch": 0.77, "learning_rate": 6.390608554188843e-07, "loss": 0.781, "step": 41037 }, { "epoch": 0.77, "learning_rate": 6.389588480130266e-07, "loss": 1.0305, "step": 41038 }, { "epoch": 0.77, "learning_rate": 6.388568475562409e-07, "loss": 0.7866, "step": 41039 }, { "epoch": 0.77, "learning_rate": 6.38754854048906e-07, "loss": 0.8556, "step": 41040 }, { "epoch": 0.77, "learning_rate": 6.386528674914036e-07, "loss": 0.7493, "step": 41041 }, { "epoch": 0.77, "learning_rate": 6.38550887884114e-07, "loss": 0.7721, "step": 41042 }, { "epoch": 0.77, "learning_rate": 6.384489152274187e-07, "loss": 1.0455, "step": 41043 }, { "epoch": 0.77, "learning_rate": 6.383469495216979e-07, "loss": 0.9274, "step": 41044 }, { "epoch": 0.77, "learning_rate": 6.382449907673325e-07, "loss": 0.9707, "step": 41045 }, { "epoch": 0.77, "learning_rate": 6.381430389647036e-07, "loss": 0.8618, "step": 41046 }, { "epoch": 0.77, "learning_rate": 6.380410941141904e-07, "loss": 0.9428, "step": 41047 }, { "epoch": 0.77, "learning_rate": 6.379391562161754e-07, "loss": 0.7748, "step": 41048 }, { "epoch": 0.77, "learning_rate": 6.378372252710393e-07, "loss": 0.9501, "step": 41049 }, { "epoch": 0.77, "learning_rate": 6.377353012791603e-07, "loss": 0.8976, "step": 41050 }, { "epoch": 0.77, "learning_rate": 6.376333842409221e-07, "loss": 0.9277, "step": 41051 }, { "epoch": 0.77, "learning_rate": 6.375314741567029e-07, "loss": 0.8766, "step": 41052 }, { "epoch": 0.77, "learning_rate": 6.374295710268841e-07, "loss": 0.9394, "step": 41053 }, { "epoch": 0.77, "learning_rate": 6.373276748518465e-07, "loss": 1.0149, "step": 41054 }, { "epoch": 0.77, "learning_rate": 6.3722578563197e-07, "loss": 0.915, "step": 41055 }, { "epoch": 0.77, "learning_rate": 6.371239033676352e-07, "loss": 0.9333, "step": 41056 }, { "epoch": 0.77, "learning_rate": 6.370220280592226e-07, "loss": 0.9012, "step": 41057 }, { "epoch": 0.77, "learning_rate": 6.369201597071134e-07, "loss": 0.7334, "step": 41058 }, { "epoch": 0.77, "learning_rate": 6.368182983116858e-07, "loss": 1.1136, "step": 41059 }, { "epoch": 0.77, "learning_rate": 6.367164438733231e-07, "loss": 0.7862, "step": 41060 }, { "epoch": 0.77, "learning_rate": 6.366145963924033e-07, "loss": 0.7461, "step": 41061 }, { "epoch": 0.77, "learning_rate": 6.365127558693073e-07, "loss": 0.9036, "step": 41062 }, { "epoch": 0.77, "learning_rate": 6.364109223044157e-07, "loss": 1.1567, "step": 41063 }, { "epoch": 0.77, "learning_rate": 6.363090956981086e-07, "loss": 0.8926, "step": 41064 }, { "epoch": 0.77, "learning_rate": 6.362072760507663e-07, "loss": 0.9491, "step": 41065 }, { "epoch": 0.77, "learning_rate": 6.361054633627686e-07, "loss": 0.7722, "step": 41066 }, { "epoch": 0.77, "learning_rate": 6.360036576344969e-07, "loss": 0.7623, "step": 41067 }, { "epoch": 0.77, "learning_rate": 6.359018588663288e-07, "loss": 1.0655, "step": 41068 }, { "epoch": 0.77, "learning_rate": 6.358000670586467e-07, "loss": 1.0339, "step": 41069 }, { "epoch": 0.77, "learning_rate": 6.356982822118307e-07, "loss": 0.8876, "step": 41070 }, { "epoch": 0.77, "learning_rate": 6.355965043262588e-07, "loss": 0.8195, "step": 41071 }, { "epoch": 0.77, "learning_rate": 6.35494733402314e-07, "loss": 0.8161, "step": 41072 }, { "epoch": 0.77, "learning_rate": 6.353929694403738e-07, "loss": 0.6888, "step": 41073 }, { "epoch": 0.77, "learning_rate": 6.352912124408189e-07, "loss": 1.0443, "step": 41074 }, { "epoch": 0.77, "learning_rate": 6.351894624040297e-07, "loss": 0.942, "step": 41075 }, { "epoch": 0.77, "learning_rate": 6.350877193303858e-07, "loss": 0.9823, "step": 41076 }, { "epoch": 0.77, "learning_rate": 6.34985983220267e-07, "loss": 0.9521, "step": 41077 }, { "epoch": 0.78, "learning_rate": 6.348842540740536e-07, "loss": 0.8802, "step": 41078 }, { "epoch": 0.78, "learning_rate": 6.347825318921258e-07, "loss": 0.8677, "step": 41079 }, { "epoch": 0.78, "learning_rate": 6.346808166748617e-07, "loss": 0.8915, "step": 41080 }, { "epoch": 0.78, "learning_rate": 6.345791084226432e-07, "loss": 0.975, "step": 41081 }, { "epoch": 0.78, "learning_rate": 6.344774071358486e-07, "loss": 0.8428, "step": 41082 }, { "epoch": 0.78, "learning_rate": 6.343757128148584e-07, "loss": 0.9232, "step": 41083 }, { "epoch": 0.78, "learning_rate": 6.342740254600519e-07, "loss": 1.0684, "step": 41084 }, { "epoch": 0.78, "learning_rate": 6.341723450718088e-07, "loss": 0.644, "step": 41085 }, { "epoch": 0.78, "learning_rate": 6.34070671650509e-07, "loss": 0.7845, "step": 41086 }, { "epoch": 0.78, "learning_rate": 6.339690051965325e-07, "loss": 0.9589, "step": 41087 }, { "epoch": 0.78, "learning_rate": 6.338673457102587e-07, "loss": 0.9873, "step": 41088 }, { "epoch": 0.78, "learning_rate": 6.33765693192066e-07, "loss": 1.0352, "step": 41089 }, { "epoch": 0.78, "learning_rate": 6.336640476423356e-07, "loss": 1.0092, "step": 41090 }, { "epoch": 0.78, "learning_rate": 6.33562409061447e-07, "loss": 1.1033, "step": 41091 }, { "epoch": 0.78, "learning_rate": 6.334607774497777e-07, "loss": 0.965, "step": 41092 }, { "epoch": 0.78, "learning_rate": 6.333591528077102e-07, "loss": 1.0393, "step": 41093 }, { "epoch": 0.78, "learning_rate": 6.332575351356216e-07, "loss": 0.9805, "step": 41094 }, { "epoch": 0.78, "learning_rate": 6.331559244338922e-07, "loss": 0.8945, "step": 41095 }, { "epoch": 0.78, "learning_rate": 6.330543207029011e-07, "loss": 0.7906, "step": 41096 }, { "epoch": 0.78, "learning_rate": 6.329527239430283e-07, "loss": 0.9158, "step": 41097 }, { "epoch": 0.78, "learning_rate": 6.328511341546525e-07, "loss": 0.8703, "step": 41098 }, { "epoch": 0.78, "learning_rate": 6.327495513381535e-07, "loss": 0.9243, "step": 41099 }, { "epoch": 0.78, "learning_rate": 6.32647975493911e-07, "loss": 1.0986, "step": 41100 }, { "epoch": 0.78, "learning_rate": 6.325464066223023e-07, "loss": 1.0402, "step": 41101 }, { "epoch": 0.78, "learning_rate": 6.324448447237094e-07, "loss": 0.8735, "step": 41102 }, { "epoch": 0.78, "learning_rate": 6.323432897985096e-07, "loss": 0.9667, "step": 41103 }, { "epoch": 0.78, "learning_rate": 6.322417418470828e-07, "loss": 0.7242, "step": 41104 }, { "epoch": 0.78, "learning_rate": 6.32140200869808e-07, "loss": 0.7788, "step": 41105 }, { "epoch": 0.78, "learning_rate": 6.320386668670641e-07, "loss": 1.0558, "step": 41106 }, { "epoch": 0.78, "learning_rate": 6.31937139839231e-07, "loss": 0.9812, "step": 41107 }, { "epoch": 0.78, "learning_rate": 6.318356197866871e-07, "loss": 0.8283, "step": 41108 }, { "epoch": 0.78, "learning_rate": 6.317341067098126e-07, "loss": 0.8281, "step": 41109 }, { "epoch": 0.78, "learning_rate": 6.31632600608984e-07, "loss": 0.8539, "step": 41110 }, { "epoch": 0.78, "learning_rate": 6.31531101484583e-07, "loss": 0.8851, "step": 41111 }, { "epoch": 0.78, "learning_rate": 6.314296093369879e-07, "loss": 1.1982, "step": 41112 }, { "epoch": 0.78, "learning_rate": 6.313281241665762e-07, "loss": 0.9501, "step": 41113 }, { "epoch": 0.78, "learning_rate": 6.312266459737293e-07, "loss": 0.8677, "step": 41114 }, { "epoch": 0.78, "learning_rate": 6.311251747588242e-07, "loss": 1.0676, "step": 41115 }, { "epoch": 0.78, "learning_rate": 6.310237105222403e-07, "loss": 0.9628, "step": 41116 }, { "epoch": 0.78, "learning_rate": 6.309222532643567e-07, "loss": 0.8564, "step": 41117 }, { "epoch": 0.78, "learning_rate": 6.30820802985552e-07, "loss": 1.116, "step": 41118 }, { "epoch": 0.78, "learning_rate": 6.307193596862049e-07, "loss": 0.9406, "step": 41119 }, { "epoch": 0.78, "learning_rate": 6.306179233666948e-07, "loss": 0.6995, "step": 41120 }, { "epoch": 0.78, "learning_rate": 6.305164940274005e-07, "loss": 0.919, "step": 41121 }, { "epoch": 0.78, "learning_rate": 6.304150716686988e-07, "loss": 0.7259, "step": 41122 }, { "epoch": 0.78, "learning_rate": 6.303136562909717e-07, "loss": 0.7567, "step": 41123 }, { "epoch": 0.78, "learning_rate": 6.302122478945952e-07, "loss": 0.8782, "step": 41124 }, { "epoch": 0.78, "learning_rate": 6.301108464799485e-07, "loss": 1.0111, "step": 41125 }, { "epoch": 0.78, "learning_rate": 6.30009452047411e-07, "loss": 0.7537, "step": 41126 }, { "epoch": 0.78, "learning_rate": 6.299080645973607e-07, "loss": 0.8398, "step": 41127 }, { "epoch": 0.78, "learning_rate": 6.298066841301765e-07, "loss": 1.04, "step": 41128 }, { "epoch": 0.78, "learning_rate": 6.297053106462365e-07, "loss": 0.8408, "step": 41129 }, { "epoch": 0.78, "learning_rate": 6.296039441459204e-07, "loss": 1.0451, "step": 41130 }, { "epoch": 0.78, "learning_rate": 6.295025846296044e-07, "loss": 1.0318, "step": 41131 }, { "epoch": 0.78, "learning_rate": 6.294012320976692e-07, "loss": 0.9446, "step": 41132 }, { "epoch": 0.78, "learning_rate": 6.292998865504929e-07, "loss": 0.9335, "step": 41133 }, { "epoch": 0.78, "learning_rate": 6.291985479884522e-07, "loss": 0.7409, "step": 41134 }, { "epoch": 0.78, "learning_rate": 6.290972164119283e-07, "loss": 0.8087, "step": 41135 }, { "epoch": 0.78, "learning_rate": 6.289958918212971e-07, "loss": 0.711, "step": 41136 }, { "epoch": 0.78, "learning_rate": 6.288945742169381e-07, "loss": 0.9436, "step": 41137 }, { "epoch": 0.78, "learning_rate": 6.287932635992292e-07, "loss": 0.9923, "step": 41138 }, { "epoch": 0.78, "learning_rate": 6.28691959968549e-07, "loss": 0.8889, "step": 41139 }, { "epoch": 0.78, "learning_rate": 6.285906633252756e-07, "loss": 0.9894, "step": 41140 }, { "epoch": 0.78, "learning_rate": 6.284893736697873e-07, "loss": 0.675, "step": 41141 }, { "epoch": 0.78, "learning_rate": 6.283880910024632e-07, "loss": 0.881, "step": 41142 }, { "epoch": 0.78, "learning_rate": 6.282868153236787e-07, "loss": 0.9082, "step": 41143 }, { "epoch": 0.78, "learning_rate": 6.281855466338154e-07, "loss": 1.2106, "step": 41144 }, { "epoch": 0.78, "learning_rate": 6.280842849332494e-07, "loss": 0.8682, "step": 41145 }, { "epoch": 0.78, "learning_rate": 6.279830302223594e-07, "loss": 0.8535, "step": 41146 }, { "epoch": 0.78, "learning_rate": 6.27881782501523e-07, "loss": 1.0086, "step": 41147 }, { "epoch": 0.78, "learning_rate": 6.277805417711189e-07, "loss": 0.8576, "step": 41148 }, { "epoch": 0.78, "learning_rate": 6.276793080315247e-07, "loss": 1.1297, "step": 41149 }, { "epoch": 0.78, "learning_rate": 6.275780812831184e-07, "loss": 0.9608, "step": 41150 }, { "epoch": 0.78, "learning_rate": 6.274768615262791e-07, "loss": 0.8566, "step": 41151 }, { "epoch": 0.78, "learning_rate": 6.273756487613822e-07, "loss": 0.8471, "step": 41152 }, { "epoch": 0.78, "learning_rate": 6.272744429888081e-07, "loss": 0.8408, "step": 41153 }, { "epoch": 0.78, "learning_rate": 6.271732442089346e-07, "loss": 0.7847, "step": 41154 }, { "epoch": 0.78, "learning_rate": 6.270720524221371e-07, "loss": 1.2134, "step": 41155 }, { "epoch": 0.78, "learning_rate": 6.269708676287967e-07, "loss": 0.9092, "step": 41156 }, { "epoch": 0.78, "learning_rate": 6.268696898292889e-07, "loss": 1.0047, "step": 41157 }, { "epoch": 0.78, "learning_rate": 6.267685190239922e-07, "loss": 0.8417, "step": 41158 }, { "epoch": 0.78, "learning_rate": 6.266673552132843e-07, "loss": 0.7658, "step": 41159 }, { "epoch": 0.78, "learning_rate": 6.265661983975432e-07, "loss": 0.8946, "step": 41160 }, { "epoch": 0.78, "learning_rate": 6.264650485771464e-07, "loss": 1.0612, "step": 41161 }, { "epoch": 0.78, "learning_rate": 6.26363905752472e-07, "loss": 0.9206, "step": 41162 }, { "epoch": 0.78, "learning_rate": 6.262627699238977e-07, "loss": 0.8785, "step": 41163 }, { "epoch": 0.78, "learning_rate": 6.261616410917995e-07, "loss": 0.7863, "step": 41164 }, { "epoch": 0.78, "learning_rate": 6.260605192565578e-07, "loss": 0.9651, "step": 41165 }, { "epoch": 0.78, "learning_rate": 6.259594044185477e-07, "loss": 0.8694, "step": 41166 }, { "epoch": 0.78, "learning_rate": 6.258582965781477e-07, "loss": 0.6207, "step": 41167 }, { "epoch": 0.78, "learning_rate": 6.257571957357355e-07, "loss": 0.9759, "step": 41168 }, { "epoch": 0.78, "learning_rate": 6.256561018916884e-07, "loss": 1.0327, "step": 41169 }, { "epoch": 0.78, "learning_rate": 6.25555015046384e-07, "loss": 0.8437, "step": 41170 }, { "epoch": 0.78, "learning_rate": 6.254539352001998e-07, "loss": 0.823, "step": 41171 }, { "epoch": 0.78, "learning_rate": 6.253528623535137e-07, "loss": 0.7139, "step": 41172 }, { "epoch": 0.78, "learning_rate": 6.252517965067012e-07, "loss": 0.9509, "step": 41173 }, { "epoch": 0.78, "learning_rate": 6.251507376601415e-07, "loss": 0.9175, "step": 41174 }, { "epoch": 0.78, "learning_rate": 6.250496858142124e-07, "loss": 1.0203, "step": 41175 }, { "epoch": 0.78, "learning_rate": 6.249486409692887e-07, "loss": 0.9369, "step": 41176 }, { "epoch": 0.78, "learning_rate": 6.248476031257509e-07, "loss": 0.7835, "step": 41177 }, { "epoch": 0.78, "learning_rate": 6.247465722839738e-07, "loss": 0.9533, "step": 41178 }, { "epoch": 0.78, "learning_rate": 6.246455484443357e-07, "loss": 0.9503, "step": 41179 }, { "epoch": 0.78, "learning_rate": 6.245445316072132e-07, "loss": 0.6037, "step": 41180 }, { "epoch": 0.78, "learning_rate": 6.244435217729844e-07, "loss": 1.2884, "step": 41181 }, { "epoch": 0.78, "learning_rate": 6.243425189420258e-07, "loss": 0.972, "step": 41182 }, { "epoch": 0.78, "learning_rate": 6.242415231147148e-07, "loss": 0.8795, "step": 41183 }, { "epoch": 0.78, "learning_rate": 6.241405342914289e-07, "loss": 0.9269, "step": 41184 }, { "epoch": 0.78, "learning_rate": 6.240395524725435e-07, "loss": 0.7015, "step": 41185 }, { "epoch": 0.78, "learning_rate": 6.239385776584383e-07, "loss": 1.1166, "step": 41186 }, { "epoch": 0.78, "learning_rate": 6.238376098494881e-07, "loss": 1.0699, "step": 41187 }, { "epoch": 0.78, "learning_rate": 6.237366490460709e-07, "loss": 0.9234, "step": 41188 }, { "epoch": 0.78, "learning_rate": 6.236356952485633e-07, "loss": 0.9022, "step": 41189 }, { "epoch": 0.78, "learning_rate": 6.235347484573428e-07, "loss": 0.8295, "step": 41190 }, { "epoch": 0.78, "learning_rate": 6.23433808672786e-07, "loss": 0.7034, "step": 41191 }, { "epoch": 0.78, "learning_rate": 6.233328758952695e-07, "loss": 0.9496, "step": 41192 }, { "epoch": 0.78, "learning_rate": 6.232319501251715e-07, "loss": 1.0302, "step": 41193 }, { "epoch": 0.78, "learning_rate": 6.231310313628663e-07, "loss": 1.0929, "step": 41194 }, { "epoch": 0.78, "learning_rate": 6.230301196087329e-07, "loss": 0.9619, "step": 41195 }, { "epoch": 0.78, "learning_rate": 6.229292148631483e-07, "loss": 0.9375, "step": 41196 }, { "epoch": 0.78, "learning_rate": 6.22828317126487e-07, "loss": 0.972, "step": 41197 }, { "epoch": 0.78, "learning_rate": 6.227274263991286e-07, "loss": 0.8587, "step": 41198 }, { "epoch": 0.78, "learning_rate": 6.226265426814479e-07, "loss": 0.8093, "step": 41199 }, { "epoch": 0.78, "learning_rate": 6.225256659738221e-07, "loss": 0.9828, "step": 41200 }, { "epoch": 0.78, "learning_rate": 6.224247962766277e-07, "loss": 0.9274, "step": 41201 }, { "epoch": 0.78, "learning_rate": 6.223239335902417e-07, "loss": 0.8983, "step": 41202 }, { "epoch": 0.78, "learning_rate": 6.222230779150414e-07, "loss": 0.813, "step": 41203 }, { "epoch": 0.78, "learning_rate": 6.22122229251401e-07, "loss": 0.7545, "step": 41204 }, { "epoch": 0.78, "learning_rate": 6.220213875997e-07, "loss": 0.8002, "step": 41205 }, { "epoch": 0.78, "learning_rate": 6.219205529603128e-07, "loss": 1.017, "step": 41206 }, { "epoch": 0.78, "learning_rate": 6.21819725333617e-07, "loss": 0.9312, "step": 41207 }, { "epoch": 0.78, "learning_rate": 6.217189047199885e-07, "loss": 0.7574, "step": 41208 }, { "epoch": 0.78, "learning_rate": 6.216180911198039e-07, "loss": 0.9921, "step": 41209 }, { "epoch": 0.78, "learning_rate": 6.215172845334397e-07, "loss": 0.8327, "step": 41210 }, { "epoch": 0.78, "learning_rate": 6.214164849612728e-07, "loss": 0.8217, "step": 41211 }, { "epoch": 0.78, "learning_rate": 6.213156924036795e-07, "loss": 0.8381, "step": 41212 }, { "epoch": 0.78, "learning_rate": 6.212149068610343e-07, "loss": 0.8192, "step": 41213 }, { "epoch": 0.78, "learning_rate": 6.211141283337169e-07, "loss": 0.9083, "step": 41214 }, { "epoch": 0.78, "learning_rate": 6.210133568221006e-07, "loss": 0.866, "step": 41215 }, { "epoch": 0.78, "learning_rate": 6.209125923265621e-07, "loss": 0.9114, "step": 41216 }, { "epoch": 0.78, "learning_rate": 6.208118348474801e-07, "loss": 0.7756, "step": 41217 }, { "epoch": 0.78, "learning_rate": 6.207110843852282e-07, "loss": 0.8742, "step": 41218 }, { "epoch": 0.78, "learning_rate": 6.206103409401837e-07, "loss": 0.8898, "step": 41219 }, { "epoch": 0.78, "learning_rate": 6.205096045127223e-07, "loss": 0.8814, "step": 41220 }, { "epoch": 0.78, "learning_rate": 6.204088751032205e-07, "loss": 0.8184, "step": 41221 }, { "epoch": 0.78, "learning_rate": 6.203081527120544e-07, "loss": 1.3954, "step": 41222 }, { "epoch": 0.78, "learning_rate": 6.202074373395997e-07, "loss": 0.8398, "step": 41223 }, { "epoch": 0.78, "learning_rate": 6.201067289862339e-07, "loss": 1.075, "step": 41224 }, { "epoch": 0.78, "learning_rate": 6.200060276523304e-07, "loss": 1.0645, "step": 41225 }, { "epoch": 0.78, "learning_rate": 6.199053333382682e-07, "loss": 0.7343, "step": 41226 }, { "epoch": 0.78, "learning_rate": 6.198046460444209e-07, "loss": 0.8647, "step": 41227 }, { "epoch": 0.78, "learning_rate": 6.197039657711656e-07, "loss": 0.702, "step": 41228 }, { "epoch": 0.78, "learning_rate": 6.19603292518878e-07, "loss": 0.5934, "step": 41229 }, { "epoch": 0.78, "learning_rate": 6.195026262879342e-07, "loss": 1.0108, "step": 41230 }, { "epoch": 0.78, "learning_rate": 6.194019670787097e-07, "loss": 1.2533, "step": 41231 }, { "epoch": 0.78, "learning_rate": 6.193013148915808e-07, "loss": 0.9749, "step": 41232 }, { "epoch": 0.78, "learning_rate": 6.192006697269237e-07, "loss": 0.6913, "step": 41233 }, { "epoch": 0.78, "learning_rate": 6.191000315851123e-07, "loss": 0.8126, "step": 41234 }, { "epoch": 0.78, "learning_rate": 6.189994004665251e-07, "loss": 0.6255, "step": 41235 }, { "epoch": 0.78, "learning_rate": 6.188987763715357e-07, "loss": 0.8604, "step": 41236 }, { "epoch": 0.78, "learning_rate": 6.187981593005199e-07, "loss": 1.123, "step": 41237 }, { "epoch": 0.78, "learning_rate": 6.186975492538555e-07, "loss": 0.9664, "step": 41238 }, { "epoch": 0.78, "learning_rate": 6.185969462319161e-07, "loss": 0.8384, "step": 41239 }, { "epoch": 0.78, "learning_rate": 6.18496350235078e-07, "loss": 0.8555, "step": 41240 }, { "epoch": 0.78, "learning_rate": 6.183957612637168e-07, "loss": 0.8858, "step": 41241 }, { "epoch": 0.78, "learning_rate": 6.182951793182082e-07, "loss": 0.707, "step": 41242 }, { "epoch": 0.78, "learning_rate": 6.181946043989276e-07, "loss": 1.0628, "step": 41243 }, { "epoch": 0.78, "learning_rate": 6.180940365062508e-07, "loss": 0.8605, "step": 41244 }, { "epoch": 0.78, "learning_rate": 6.179934756405539e-07, "loss": 0.8421, "step": 41245 }, { "epoch": 0.78, "learning_rate": 6.178929218022101e-07, "loss": 0.8708, "step": 41246 }, { "epoch": 0.78, "learning_rate": 6.177923749915979e-07, "loss": 0.8569, "step": 41247 }, { "epoch": 0.78, "learning_rate": 6.176918352090905e-07, "loss": 0.852, "step": 41248 }, { "epoch": 0.78, "learning_rate": 6.175913024550642e-07, "loss": 1.0753, "step": 41249 }, { "epoch": 0.78, "learning_rate": 6.17490776729894e-07, "loss": 0.9753, "step": 41250 }, { "epoch": 0.78, "learning_rate": 6.173902580339558e-07, "loss": 0.7901, "step": 41251 }, { "epoch": 0.78, "learning_rate": 6.172897463676248e-07, "loss": 0.8892, "step": 41252 }, { "epoch": 0.78, "learning_rate": 6.171892417312758e-07, "loss": 0.7982, "step": 41253 }, { "epoch": 0.78, "learning_rate": 6.170887441252851e-07, "loss": 0.8126, "step": 41254 }, { "epoch": 0.78, "learning_rate": 6.169882535500263e-07, "loss": 0.903, "step": 41255 }, { "epoch": 0.78, "learning_rate": 6.168877700058768e-07, "loss": 1.174, "step": 41256 }, { "epoch": 0.78, "learning_rate": 6.167872934932098e-07, "loss": 0.9378, "step": 41257 }, { "epoch": 0.78, "learning_rate": 6.166868240124008e-07, "loss": 0.8064, "step": 41258 }, { "epoch": 0.78, "learning_rate": 6.165863615638268e-07, "loss": 0.936, "step": 41259 }, { "epoch": 0.78, "learning_rate": 6.164859061478609e-07, "loss": 0.7789, "step": 41260 }, { "epoch": 0.78, "learning_rate": 6.163854577648787e-07, "loss": 1.0615, "step": 41261 }, { "epoch": 0.78, "learning_rate": 6.162850164152557e-07, "loss": 1.0129, "step": 41262 }, { "epoch": 0.78, "learning_rate": 6.161845820993664e-07, "loss": 0.9631, "step": 41263 }, { "epoch": 0.78, "learning_rate": 6.160841548175864e-07, "loss": 1.1061, "step": 41264 }, { "epoch": 0.78, "learning_rate": 6.159837345702901e-07, "loss": 0.9519, "step": 41265 }, { "epoch": 0.78, "learning_rate": 6.158833213578538e-07, "loss": 0.9158, "step": 41266 }, { "epoch": 0.78, "learning_rate": 6.1578291518065e-07, "loss": 0.855, "step": 41267 }, { "epoch": 0.78, "learning_rate": 6.156825160390561e-07, "loss": 1.1146, "step": 41268 }, { "epoch": 0.78, "learning_rate": 6.155821239334456e-07, "loss": 0.9734, "step": 41269 }, { "epoch": 0.78, "learning_rate": 6.154817388641934e-07, "loss": 0.9462, "step": 41270 }, { "epoch": 0.78, "learning_rate": 6.153813608316748e-07, "loss": 0.8801, "step": 41271 }, { "epoch": 0.78, "learning_rate": 6.152809898362641e-07, "loss": 0.8968, "step": 41272 }, { "epoch": 0.78, "learning_rate": 6.151806258783366e-07, "loss": 0.7766, "step": 41273 }, { "epoch": 0.78, "learning_rate": 6.150802689582668e-07, "loss": 0.9944, "step": 41274 }, { "epoch": 0.78, "learning_rate": 6.149799190764305e-07, "loss": 1.1094, "step": 41275 }, { "epoch": 0.78, "learning_rate": 6.148795762331997e-07, "loss": 0.8378, "step": 41276 }, { "epoch": 0.78, "learning_rate": 6.147792404289521e-07, "loss": 0.9868, "step": 41277 }, { "epoch": 0.78, "learning_rate": 6.146789116640603e-07, "loss": 0.9257, "step": 41278 }, { "epoch": 0.78, "learning_rate": 6.145785899388992e-07, "loss": 0.9287, "step": 41279 }, { "epoch": 0.78, "learning_rate": 6.14478275253845e-07, "loss": 0.883, "step": 41280 }, { "epoch": 0.78, "learning_rate": 6.143779676092704e-07, "loss": 1.1198, "step": 41281 }, { "epoch": 0.78, "learning_rate": 6.142776670055509e-07, "loss": 1.0187, "step": 41282 }, { "epoch": 0.78, "learning_rate": 6.141773734430607e-07, "loss": 0.872, "step": 41283 }, { "epoch": 0.78, "learning_rate": 6.140770869221741e-07, "loss": 0.9269, "step": 41284 }, { "epoch": 0.78, "learning_rate": 6.139768074432661e-07, "loss": 0.7567, "step": 41285 }, { "epoch": 0.78, "learning_rate": 6.138765350067108e-07, "loss": 1.0521, "step": 41286 }, { "epoch": 0.78, "learning_rate": 6.137762696128832e-07, "loss": 1.1613, "step": 41287 }, { "epoch": 0.78, "learning_rate": 6.136760112621559e-07, "loss": 1.0468, "step": 41288 }, { "epoch": 0.78, "learning_rate": 6.135757599549061e-07, "loss": 0.9319, "step": 41289 }, { "epoch": 0.78, "learning_rate": 6.134755156915059e-07, "loss": 0.8391, "step": 41290 }, { "epoch": 0.78, "learning_rate": 6.133752784723302e-07, "loss": 0.8954, "step": 41291 }, { "epoch": 0.78, "learning_rate": 6.132750482977532e-07, "loss": 0.7521, "step": 41292 }, { "epoch": 0.78, "learning_rate": 6.131748251681493e-07, "loss": 0.9962, "step": 41293 }, { "epoch": 0.78, "learning_rate": 6.130746090838929e-07, "loss": 0.9502, "step": 41294 }, { "epoch": 0.78, "learning_rate": 6.12974400045358e-07, "loss": 0.8844, "step": 41295 }, { "epoch": 0.78, "learning_rate": 6.128741980529195e-07, "loss": 0.9874, "step": 41296 }, { "epoch": 0.78, "learning_rate": 6.127740031069499e-07, "loss": 0.8793, "step": 41297 }, { "epoch": 0.78, "learning_rate": 6.126738152078251e-07, "loss": 0.6743, "step": 41298 }, { "epoch": 0.78, "learning_rate": 6.12573634355918e-07, "loss": 0.9805, "step": 41299 }, { "epoch": 0.78, "learning_rate": 6.124734605516025e-07, "loss": 1.146, "step": 41300 }, { "epoch": 0.78, "learning_rate": 6.123732937952545e-07, "loss": 0.8123, "step": 41301 }, { "epoch": 0.78, "learning_rate": 6.122731340872459e-07, "loss": 0.9986, "step": 41302 }, { "epoch": 0.78, "learning_rate": 6.121729814279517e-07, "loss": 0.8739, "step": 41303 }, { "epoch": 0.78, "learning_rate": 6.120728358177458e-07, "loss": 0.7781, "step": 41304 }, { "epoch": 0.78, "learning_rate": 6.119726972570017e-07, "loss": 0.9564, "step": 41305 }, { "epoch": 0.78, "learning_rate": 6.118725657460939e-07, "loss": 1.1158, "step": 41306 }, { "epoch": 0.78, "learning_rate": 6.117724412853959e-07, "loss": 0.907, "step": 41307 }, { "epoch": 0.78, "learning_rate": 6.116723238752829e-07, "loss": 0.8584, "step": 41308 }, { "epoch": 0.78, "learning_rate": 6.115722135161257e-07, "loss": 1.0232, "step": 41309 }, { "epoch": 0.78, "learning_rate": 6.114721102083013e-07, "loss": 0.8195, "step": 41310 }, { "epoch": 0.78, "learning_rate": 6.113720139521817e-07, "loss": 0.9853, "step": 41311 }, { "epoch": 0.78, "learning_rate": 6.112719247481408e-07, "loss": 0.8765, "step": 41312 }, { "epoch": 0.78, "learning_rate": 6.111718425965529e-07, "loss": 0.801, "step": 41313 }, { "epoch": 0.78, "learning_rate": 6.110717674977911e-07, "loss": 0.8311, "step": 41314 }, { "epoch": 0.78, "learning_rate": 6.109716994522297e-07, "loss": 0.6991, "step": 41315 }, { "epoch": 0.78, "learning_rate": 6.10871638460242e-07, "loss": 1.2001, "step": 41316 }, { "epoch": 0.78, "learning_rate": 6.107715845222024e-07, "loss": 0.7961, "step": 41317 }, { "epoch": 0.78, "learning_rate": 6.106715376384822e-07, "loss": 1.098, "step": 41318 }, { "epoch": 0.78, "learning_rate": 6.105714978094582e-07, "loss": 1.0007, "step": 41319 }, { "epoch": 0.78, "learning_rate": 6.104714650355014e-07, "loss": 0.7981, "step": 41320 }, { "epoch": 0.78, "learning_rate": 6.103714393169857e-07, "loss": 0.8361, "step": 41321 }, { "epoch": 0.78, "learning_rate": 6.102714206542865e-07, "loss": 0.7697, "step": 41322 }, { "epoch": 0.78, "learning_rate": 6.101714090477748e-07, "loss": 0.9111, "step": 41323 }, { "epoch": 0.78, "learning_rate": 6.100714044978253e-07, "loss": 1.0215, "step": 41324 }, { "epoch": 0.78, "learning_rate": 6.099714070048116e-07, "loss": 0.9594, "step": 41325 }, { "epoch": 0.78, "learning_rate": 6.098714165691063e-07, "loss": 0.8007, "step": 41326 }, { "epoch": 0.78, "learning_rate": 6.097714331910834e-07, "loss": 0.8396, "step": 41327 }, { "epoch": 0.78, "learning_rate": 6.09671456871116e-07, "loss": 1.127, "step": 41328 }, { "epoch": 0.78, "learning_rate": 6.095714876095779e-07, "loss": 0.9548, "step": 41329 }, { "epoch": 0.78, "learning_rate": 6.094715254068406e-07, "loss": 1.2765, "step": 41330 }, { "epoch": 0.78, "learning_rate": 6.093715702632802e-07, "loss": 0.8781, "step": 41331 }, { "epoch": 0.78, "learning_rate": 6.092716221792678e-07, "loss": 0.896, "step": 41332 }, { "epoch": 0.78, "learning_rate": 6.091716811551768e-07, "loss": 0.8104, "step": 41333 }, { "epoch": 0.78, "learning_rate": 6.09071747191381e-07, "loss": 0.9087, "step": 41334 }, { "epoch": 0.78, "learning_rate": 6.089718202882533e-07, "loss": 0.9688, "step": 41335 }, { "epoch": 0.78, "learning_rate": 6.088719004461668e-07, "loss": 0.9579, "step": 41336 }, { "epoch": 0.78, "learning_rate": 6.087719876654946e-07, "loss": 1.1411, "step": 41337 }, { "epoch": 0.78, "learning_rate": 6.086720819466105e-07, "loss": 1.0436, "step": 41338 }, { "epoch": 0.78, "learning_rate": 6.085721832898856e-07, "loss": 1.0325, "step": 41339 }, { "epoch": 0.78, "learning_rate": 6.084722916956956e-07, "loss": 0.7056, "step": 41340 }, { "epoch": 0.78, "learning_rate": 6.083724071644112e-07, "loss": 0.8356, "step": 41341 }, { "epoch": 0.78, "learning_rate": 6.082725296964057e-07, "loss": 0.8275, "step": 41342 }, { "epoch": 0.78, "learning_rate": 6.081726592920537e-07, "loss": 1.0703, "step": 41343 }, { "epoch": 0.78, "learning_rate": 6.080727959517266e-07, "loss": 1.156, "step": 41344 }, { "epoch": 0.78, "learning_rate": 6.079729396757974e-07, "loss": 0.762, "step": 41345 }, { "epoch": 0.78, "learning_rate": 6.078730904646393e-07, "loss": 0.8382, "step": 41346 }, { "epoch": 0.78, "learning_rate": 6.077732483186252e-07, "loss": 0.8785, "step": 41347 }, { "epoch": 0.78, "learning_rate": 6.076734132381276e-07, "loss": 0.7857, "step": 41348 }, { "epoch": 0.78, "learning_rate": 6.075735852235195e-07, "loss": 0.8245, "step": 41349 }, { "epoch": 0.78, "learning_rate": 6.074737642751747e-07, "loss": 0.9688, "step": 41350 }, { "epoch": 0.78, "learning_rate": 6.073739503934631e-07, "loss": 0.834, "step": 41351 }, { "epoch": 0.78, "learning_rate": 6.072741435787605e-07, "loss": 0.7776, "step": 41352 }, { "epoch": 0.78, "learning_rate": 6.071743438314376e-07, "loss": 1.025, "step": 41353 }, { "epoch": 0.78, "learning_rate": 6.070745511518675e-07, "loss": 0.6241, "step": 41354 }, { "epoch": 0.78, "learning_rate": 6.069747655404231e-07, "loss": 0.94, "step": 41355 }, { "epoch": 0.78, "learning_rate": 6.068749869974769e-07, "loss": 0.9439, "step": 41356 }, { "epoch": 0.78, "learning_rate": 6.067752155234016e-07, "loss": 0.98, "step": 41357 }, { "epoch": 0.78, "learning_rate": 6.066754511185693e-07, "loss": 0.8305, "step": 41358 }, { "epoch": 0.78, "learning_rate": 6.065756937833536e-07, "loss": 0.8077, "step": 41359 }, { "epoch": 0.78, "learning_rate": 6.06475943518125e-07, "loss": 0.7386, "step": 41360 }, { "epoch": 0.78, "learning_rate": 6.063762003232585e-07, "loss": 0.8579, "step": 41361 }, { "epoch": 0.78, "learning_rate": 6.062764641991245e-07, "loss": 1.0523, "step": 41362 }, { "epoch": 0.78, "learning_rate": 6.061767351460954e-07, "loss": 1.1655, "step": 41363 }, { "epoch": 0.78, "learning_rate": 6.060770131645455e-07, "loss": 0.7715, "step": 41364 }, { "epoch": 0.78, "learning_rate": 6.059772982548457e-07, "loss": 0.6546, "step": 41365 }, { "epoch": 0.78, "learning_rate": 6.058775904173681e-07, "loss": 0.8334, "step": 41366 }, { "epoch": 0.78, "learning_rate": 6.057778896524857e-07, "loss": 0.8466, "step": 41367 }, { "epoch": 0.78, "learning_rate": 6.056781959605707e-07, "loss": 0.8846, "step": 41368 }, { "epoch": 0.78, "learning_rate": 6.055785093419952e-07, "loss": 0.884, "step": 41369 }, { "epoch": 0.78, "learning_rate": 6.054788297971314e-07, "loss": 0.8144, "step": 41370 }, { "epoch": 0.78, "learning_rate": 6.053791573263523e-07, "loss": 1.0848, "step": 41371 }, { "epoch": 0.78, "learning_rate": 6.052794919300279e-07, "loss": 0.7505, "step": 41372 }, { "epoch": 0.78, "learning_rate": 6.051798336085332e-07, "loss": 0.8978, "step": 41373 }, { "epoch": 0.78, "learning_rate": 6.050801823622382e-07, "loss": 0.9063, "step": 41374 }, { "epoch": 0.78, "learning_rate": 6.049805381915158e-07, "loss": 1.156, "step": 41375 }, { "epoch": 0.78, "learning_rate": 6.048809010967377e-07, "loss": 1.0012, "step": 41376 }, { "epoch": 0.78, "learning_rate": 6.047812710782764e-07, "loss": 0.8743, "step": 41377 }, { "epoch": 0.78, "learning_rate": 6.046816481365036e-07, "loss": 0.7989, "step": 41378 }, { "epoch": 0.78, "learning_rate": 6.045820322717915e-07, "loss": 0.9655, "step": 41379 }, { "epoch": 0.78, "learning_rate": 6.044824234845129e-07, "loss": 0.7396, "step": 41380 }, { "epoch": 0.78, "learning_rate": 6.043828217750372e-07, "loss": 1.0908, "step": 41381 }, { "epoch": 0.78, "learning_rate": 6.042832271437385e-07, "loss": 0.9709, "step": 41382 }, { "epoch": 0.78, "learning_rate": 6.041836395909892e-07, "loss": 0.9853, "step": 41383 }, { "epoch": 0.78, "learning_rate": 6.040840591171582e-07, "loss": 0.8192, "step": 41384 }, { "epoch": 0.78, "learning_rate": 6.03984485722621e-07, "loss": 0.8024, "step": 41385 }, { "epoch": 0.78, "learning_rate": 6.038849194077465e-07, "loss": 0.8325, "step": 41386 }, { "epoch": 0.78, "learning_rate": 6.03785360172908e-07, "loss": 1.171, "step": 41387 }, { "epoch": 0.78, "learning_rate": 6.036858080184766e-07, "loss": 0.9248, "step": 41388 }, { "epoch": 0.78, "learning_rate": 6.035862629448241e-07, "loss": 0.8509, "step": 41389 }, { "epoch": 0.78, "learning_rate": 6.034867249523224e-07, "loss": 0.9766, "step": 41390 }, { "epoch": 0.78, "learning_rate": 6.033871940413433e-07, "loss": 0.7859, "step": 41391 }, { "epoch": 0.78, "learning_rate": 6.032876702122589e-07, "loss": 0.8237, "step": 41392 }, { "epoch": 0.78, "learning_rate": 6.031881534654388e-07, "loss": 1.0476, "step": 41393 }, { "epoch": 0.78, "learning_rate": 6.030886438012574e-07, "loss": 1.1648, "step": 41394 }, { "epoch": 0.78, "learning_rate": 6.029891412200839e-07, "loss": 0.8276, "step": 41395 }, { "epoch": 0.78, "learning_rate": 6.02889645722291e-07, "loss": 0.9271, "step": 41396 }, { "epoch": 0.78, "learning_rate": 6.027901573082501e-07, "loss": 0.8686, "step": 41397 }, { "epoch": 0.78, "learning_rate": 6.026906759783324e-07, "loss": 0.651, "step": 41398 }, { "epoch": 0.78, "learning_rate": 6.025912017329095e-07, "loss": 0.9651, "step": 41399 }, { "epoch": 0.78, "learning_rate": 6.02491734572353e-07, "loss": 1.0503, "step": 41400 }, { "epoch": 0.78, "learning_rate": 6.023922744970348e-07, "loss": 0.8656, "step": 41401 }, { "epoch": 0.78, "learning_rate": 6.022928215073243e-07, "loss": 0.9152, "step": 41402 }, { "epoch": 0.78, "learning_rate": 6.02193375603595e-07, "loss": 0.7966, "step": 41403 }, { "epoch": 0.78, "learning_rate": 6.02093936786218e-07, "loss": 1.0068, "step": 41404 }, { "epoch": 0.78, "learning_rate": 6.019945050555628e-07, "loss": 0.9721, "step": 41405 }, { "epoch": 0.78, "learning_rate": 6.018950804120032e-07, "loss": 1.0771, "step": 41406 }, { "epoch": 0.78, "learning_rate": 6.017956628559085e-07, "loss": 1.0314, "step": 41407 }, { "epoch": 0.78, "learning_rate": 6.016962523876507e-07, "loss": 0.9766, "step": 41408 }, { "epoch": 0.78, "learning_rate": 6.015968490076007e-07, "loss": 0.8826, "step": 41409 }, { "epoch": 0.78, "learning_rate": 6.014974527161302e-07, "loss": 0.7659, "step": 41410 }, { "epoch": 0.78, "learning_rate": 6.013980635136096e-07, "loss": 1.0585, "step": 41411 }, { "epoch": 0.78, "learning_rate": 6.012986814004107e-07, "loss": 1.0891, "step": 41412 }, { "epoch": 0.78, "learning_rate": 6.011993063769051e-07, "loss": 0.9437, "step": 41413 }, { "epoch": 0.78, "learning_rate": 6.010999384434613e-07, "loss": 0.868, "step": 41414 }, { "epoch": 0.78, "learning_rate": 6.010005776004537e-07, "loss": 0.7805, "step": 41415 }, { "epoch": 0.78, "learning_rate": 6.009012238482509e-07, "loss": 0.8689, "step": 41416 }, { "epoch": 0.78, "learning_rate": 6.008018771872248e-07, "loss": 0.775, "step": 41417 }, { "epoch": 0.78, "learning_rate": 6.007025376177463e-07, "loss": 1.1675, "step": 41418 }, { "epoch": 0.78, "learning_rate": 6.006032051401864e-07, "loss": 1.0507, "step": 41419 }, { "epoch": 0.78, "learning_rate": 6.005038797549157e-07, "loss": 0.7565, "step": 41420 }, { "epoch": 0.78, "learning_rate": 6.004045614623052e-07, "loss": 0.8041, "step": 41421 }, { "epoch": 0.78, "learning_rate": 6.003052502627268e-07, "loss": 0.9561, "step": 41422 }, { "epoch": 0.78, "learning_rate": 6.002059461565488e-07, "loss": 0.7997, "step": 41423 }, { "epoch": 0.78, "learning_rate": 6.001066491441443e-07, "loss": 0.9103, "step": 41424 }, { "epoch": 0.78, "learning_rate": 6.00007359225884e-07, "loss": 1.0176, "step": 41425 }, { "epoch": 0.78, "learning_rate": 5.999080764021364e-07, "loss": 0.9596, "step": 41426 }, { "epoch": 0.78, "learning_rate": 5.998088006732753e-07, "loss": 0.7493, "step": 41427 }, { "epoch": 0.78, "learning_rate": 5.997095320396692e-07, "loss": 0.8087, "step": 41428 }, { "epoch": 0.78, "learning_rate": 5.996102705016896e-07, "loss": 0.6908, "step": 41429 }, { "epoch": 0.78, "learning_rate": 5.995110160597067e-07, "loss": 0.9546, "step": 41430 }, { "epoch": 0.78, "learning_rate": 5.994117687140916e-07, "loss": 1.1483, "step": 41431 }, { "epoch": 0.78, "learning_rate": 5.993125284652146e-07, "loss": 0.8463, "step": 41432 }, { "epoch": 0.78, "learning_rate": 5.992132953134461e-07, "loss": 0.7589, "step": 41433 }, { "epoch": 0.78, "learning_rate": 5.991140692591579e-07, "loss": 0.8616, "step": 41434 }, { "epoch": 0.78, "learning_rate": 5.990148503027179e-07, "loss": 0.6546, "step": 41435 }, { "epoch": 0.78, "learning_rate": 5.989156384444997e-07, "loss": 0.8124, "step": 41436 }, { "epoch": 0.78, "learning_rate": 5.988164336848714e-07, "loss": 1.1162, "step": 41437 }, { "epoch": 0.78, "learning_rate": 5.987172360242044e-07, "loss": 1.0536, "step": 41438 }, { "epoch": 0.78, "learning_rate": 5.98618045462869e-07, "loss": 0.7712, "step": 41439 }, { "epoch": 0.78, "learning_rate": 5.985188620012353e-07, "loss": 0.772, "step": 41440 }, { "epoch": 0.78, "learning_rate": 5.984196856396748e-07, "loss": 0.8886, "step": 41441 }, { "epoch": 0.78, "learning_rate": 5.983205163785552e-07, "loss": 0.9036, "step": 41442 }, { "epoch": 0.78, "learning_rate": 5.982213542182502e-07, "loss": 1.0322, "step": 41443 }, { "epoch": 0.78, "learning_rate": 5.981221991591274e-07, "loss": 1.1394, "step": 41444 }, { "epoch": 0.78, "learning_rate": 5.980230512015575e-07, "loss": 1.0079, "step": 41445 }, { "epoch": 0.78, "learning_rate": 5.979239103459125e-07, "loss": 0.7593, "step": 41446 }, { "epoch": 0.78, "learning_rate": 5.978247765925604e-07, "loss": 0.936, "step": 41447 }, { "epoch": 0.78, "learning_rate": 5.977256499418727e-07, "loss": 0.6559, "step": 41448 }, { "epoch": 0.78, "learning_rate": 5.976265303942186e-07, "loss": 0.7946, "step": 41449 }, { "epoch": 0.78, "learning_rate": 5.975274179499691e-07, "loss": 0.9767, "step": 41450 }, { "epoch": 0.78, "learning_rate": 5.974283126094938e-07, "loss": 0.9745, "step": 41451 }, { "epoch": 0.78, "learning_rate": 5.973292143731627e-07, "loss": 0.6456, "step": 41452 }, { "epoch": 0.78, "learning_rate": 5.972301232413469e-07, "loss": 1.0214, "step": 41453 }, { "epoch": 0.78, "learning_rate": 5.971310392144139e-07, "loss": 0.924, "step": 41454 }, { "epoch": 0.78, "learning_rate": 5.970319622927368e-07, "loss": 0.9776, "step": 41455 }, { "epoch": 0.78, "learning_rate": 5.969328924766832e-07, "loss": 1.0173, "step": 41456 }, { "epoch": 0.78, "learning_rate": 5.968338297666237e-07, "loss": 0.7568, "step": 41457 }, { "epoch": 0.78, "learning_rate": 5.967347741629285e-07, "loss": 0.6925, "step": 41458 }, { "epoch": 0.78, "learning_rate": 5.966357256659672e-07, "loss": 0.8115, "step": 41459 }, { "epoch": 0.78, "learning_rate": 5.9653668427611e-07, "loss": 0.8762, "step": 41460 }, { "epoch": 0.78, "learning_rate": 5.96437649993726e-07, "loss": 1.1025, "step": 41461 }, { "epoch": 0.78, "learning_rate": 5.963386228191867e-07, "loss": 1.1342, "step": 41462 }, { "epoch": 0.78, "learning_rate": 5.962396027528589e-07, "loss": 0.9985, "step": 41463 }, { "epoch": 0.78, "learning_rate": 5.961405897951156e-07, "loss": 0.7477, "step": 41464 }, { "epoch": 0.78, "learning_rate": 5.96041583946324e-07, "loss": 0.8774, "step": 41465 }, { "epoch": 0.78, "learning_rate": 5.959425852068543e-07, "loss": 0.7855, "step": 41466 }, { "epoch": 0.78, "learning_rate": 5.958435935770779e-07, "loss": 0.7521, "step": 41467 }, { "epoch": 0.78, "learning_rate": 5.957446090573623e-07, "loss": 0.7821, "step": 41468 }, { "epoch": 0.78, "learning_rate": 5.956456316480782e-07, "loss": 0.8879, "step": 41469 }, { "epoch": 0.78, "learning_rate": 5.955466613495948e-07, "loss": 0.8524, "step": 41470 }, { "epoch": 0.78, "learning_rate": 5.954476981622817e-07, "loss": 0.9446, "step": 41471 }, { "epoch": 0.78, "learning_rate": 5.953487420865087e-07, "loss": 0.7695, "step": 41472 }, { "epoch": 0.78, "learning_rate": 5.95249793122645e-07, "loss": 0.9355, "step": 41473 }, { "epoch": 0.78, "learning_rate": 5.951508512710608e-07, "loss": 1.087, "step": 41474 }, { "epoch": 0.78, "learning_rate": 5.950519165321237e-07, "loss": 1.2035, "step": 41475 }, { "epoch": 0.78, "learning_rate": 5.949529889062056e-07, "loss": 0.9253, "step": 41476 }, { "epoch": 0.78, "learning_rate": 5.948540683936741e-07, "loss": 0.9267, "step": 41477 }, { "epoch": 0.78, "learning_rate": 5.947551549948988e-07, "loss": 0.912, "step": 41478 }, { "epoch": 0.78, "learning_rate": 5.946562487102494e-07, "loss": 0.7513, "step": 41479 }, { "epoch": 0.78, "learning_rate": 5.945573495400953e-07, "loss": 1.0132, "step": 41480 }, { "epoch": 0.78, "learning_rate": 5.944584574848056e-07, "loss": 1.1462, "step": 41481 }, { "epoch": 0.78, "learning_rate": 5.943595725447496e-07, "loss": 0.7528, "step": 41482 }, { "epoch": 0.78, "learning_rate": 5.942606947202969e-07, "loss": 0.9379, "step": 41483 }, { "epoch": 0.78, "learning_rate": 5.941618240118154e-07, "loss": 0.8531, "step": 41484 }, { "epoch": 0.78, "learning_rate": 5.940629604196765e-07, "loss": 0.992, "step": 41485 }, { "epoch": 0.78, "learning_rate": 5.939641039442473e-07, "loss": 0.967, "step": 41486 }, { "epoch": 0.78, "learning_rate": 5.938652545858969e-07, "loss": 0.959, "step": 41487 }, { "epoch": 0.78, "learning_rate": 5.937664123449968e-07, "loss": 1.0667, "step": 41488 }, { "epoch": 0.78, "learning_rate": 5.936675772219136e-07, "loss": 0.9382, "step": 41489 }, { "epoch": 0.78, "learning_rate": 5.935687492170172e-07, "loss": 0.9684, "step": 41490 }, { "epoch": 0.78, "learning_rate": 5.934699283306769e-07, "loss": 0.9141, "step": 41491 }, { "epoch": 0.78, "learning_rate": 5.933711145632612e-07, "loss": 0.8373, "step": 41492 }, { "epoch": 0.78, "learning_rate": 5.932723079151392e-07, "loss": 1.2144, "step": 41493 }, { "epoch": 0.78, "learning_rate": 5.931735083866802e-07, "loss": 1.0741, "step": 41494 }, { "epoch": 0.78, "learning_rate": 5.930747159782536e-07, "loss": 1.0451, "step": 41495 }, { "epoch": 0.78, "learning_rate": 5.929759306902258e-07, "loss": 0.8646, "step": 41496 }, { "epoch": 0.78, "learning_rate": 5.92877152522969e-07, "loss": 0.8984, "step": 41497 }, { "epoch": 0.78, "learning_rate": 5.927783814768498e-07, "loss": 0.7833, "step": 41498 }, { "epoch": 0.78, "learning_rate": 5.926796175522376e-07, "loss": 0.9298, "step": 41499 }, { "epoch": 0.78, "learning_rate": 5.925808607495012e-07, "loss": 0.9039, "step": 41500 }, { "epoch": 0.78, "learning_rate": 5.924821110690093e-07, "loss": 0.8776, "step": 41501 }, { "epoch": 0.78, "learning_rate": 5.923833685111308e-07, "loss": 0.9632, "step": 41502 }, { "epoch": 0.78, "learning_rate": 5.922846330762344e-07, "loss": 0.8996, "step": 41503 }, { "epoch": 0.78, "learning_rate": 5.921859047646894e-07, "loss": 0.8658, "step": 41504 }, { "epoch": 0.78, "learning_rate": 5.920871835768622e-07, "loss": 0.8763, "step": 41505 }, { "epoch": 0.78, "learning_rate": 5.919884695131242e-07, "loss": 1.0126, "step": 41506 }, { "epoch": 0.78, "learning_rate": 5.918897625738423e-07, "loss": 0.8331, "step": 41507 }, { "epoch": 0.78, "learning_rate": 5.917910627593848e-07, "loss": 0.9469, "step": 41508 }, { "epoch": 0.78, "learning_rate": 5.916923700701224e-07, "loss": 0.8332, "step": 41509 }, { "epoch": 0.78, "learning_rate": 5.915936845064213e-07, "loss": 0.735, "step": 41510 }, { "epoch": 0.78, "learning_rate": 5.914950060686511e-07, "loss": 0.7438, "step": 41511 }, { "epoch": 0.78, "learning_rate": 5.913963347571799e-07, "loss": 0.9473, "step": 41512 }, { "epoch": 0.78, "learning_rate": 5.912976705723763e-07, "loss": 0.9587, "step": 41513 }, { "epoch": 0.78, "learning_rate": 5.911990135146087e-07, "loss": 0.9003, "step": 41514 }, { "epoch": 0.78, "learning_rate": 5.911003635842455e-07, "loss": 0.9111, "step": 41515 }, { "epoch": 0.78, "learning_rate": 5.910017207816557e-07, "loss": 0.8694, "step": 41516 }, { "epoch": 0.78, "learning_rate": 5.909030851072054e-07, "loss": 0.9387, "step": 41517 }, { "epoch": 0.78, "learning_rate": 5.908044565612658e-07, "loss": 0.8503, "step": 41518 }, { "epoch": 0.78, "learning_rate": 5.907058351442032e-07, "loss": 0.9229, "step": 41519 }, { "epoch": 0.78, "learning_rate": 5.906072208563865e-07, "loss": 1.0319, "step": 41520 }, { "epoch": 0.78, "learning_rate": 5.905086136981842e-07, "loss": 0.8375, "step": 41521 }, { "epoch": 0.78, "learning_rate": 5.904100136699637e-07, "loss": 0.8107, "step": 41522 }, { "epoch": 0.78, "learning_rate": 5.903114207720939e-07, "loss": 0.7755, "step": 41523 }, { "epoch": 0.78, "learning_rate": 5.902128350049427e-07, "loss": 0.8555, "step": 41524 }, { "epoch": 0.78, "learning_rate": 5.901142563688788e-07, "loss": 1.2198, "step": 41525 }, { "epoch": 0.78, "learning_rate": 5.900156848642685e-07, "loss": 0.9082, "step": 41526 }, { "epoch": 0.78, "learning_rate": 5.899171204914825e-07, "loss": 0.9407, "step": 41527 }, { "epoch": 0.78, "learning_rate": 5.898185632508866e-07, "loss": 0.9029, "step": 41528 }, { "epoch": 0.78, "learning_rate": 5.897200131428487e-07, "loss": 0.8357, "step": 41529 }, { "epoch": 0.78, "learning_rate": 5.896214701677394e-07, "loss": 0.826, "step": 41530 }, { "epoch": 0.78, "learning_rate": 5.89522934325924e-07, "loss": 1.1294, "step": 41531 }, { "epoch": 0.78, "learning_rate": 5.894244056177717e-07, "loss": 0.7694, "step": 41532 }, { "epoch": 0.78, "learning_rate": 5.893258840436497e-07, "loss": 0.923, "step": 41533 }, { "epoch": 0.78, "learning_rate": 5.892273696039266e-07, "loss": 0.8326, "step": 41534 }, { "epoch": 0.78, "learning_rate": 5.891288622989699e-07, "loss": 1.0915, "step": 41535 }, { "epoch": 0.78, "learning_rate": 5.890303621291471e-07, "loss": 0.6465, "step": 41536 }, { "epoch": 0.78, "learning_rate": 5.889318690948273e-07, "loss": 0.9255, "step": 41537 }, { "epoch": 0.78, "learning_rate": 5.888333831963761e-07, "loss": 0.9139, "step": 41538 }, { "epoch": 0.78, "learning_rate": 5.887349044341636e-07, "loss": 0.9377, "step": 41539 }, { "epoch": 0.78, "learning_rate": 5.886364328085556e-07, "loss": 0.9418, "step": 41540 }, { "epoch": 0.78, "learning_rate": 5.885379683199208e-07, "loss": 0.8401, "step": 41541 }, { "epoch": 0.78, "learning_rate": 5.884395109686263e-07, "loss": 0.881, "step": 41542 }, { "epoch": 0.78, "learning_rate": 5.883410607550402e-07, "loss": 1.0419, "step": 41543 }, { "epoch": 0.78, "learning_rate": 5.882426176795303e-07, "loss": 0.7314, "step": 41544 }, { "epoch": 0.78, "learning_rate": 5.881441817424636e-07, "loss": 0.9234, "step": 41545 }, { "epoch": 0.78, "learning_rate": 5.880457529442082e-07, "loss": 0.8522, "step": 41546 }, { "epoch": 0.78, "learning_rate": 5.879473312851305e-07, "loss": 0.8079, "step": 41547 }, { "epoch": 0.78, "learning_rate": 5.878489167656002e-07, "loss": 0.6253, "step": 41548 }, { "epoch": 0.78, "learning_rate": 5.877505093859823e-07, "loss": 0.8449, "step": 41549 }, { "epoch": 0.78, "learning_rate": 5.87652109146645e-07, "loss": 0.9524, "step": 41550 }, { "epoch": 0.78, "learning_rate": 5.875537160479574e-07, "loss": 0.9608, "step": 41551 }, { "epoch": 0.78, "learning_rate": 5.87455330090285e-07, "loss": 0.9379, "step": 41552 }, { "epoch": 0.78, "learning_rate": 5.873569512739955e-07, "loss": 1.1758, "step": 41553 }, { "epoch": 0.78, "learning_rate": 5.872585795994567e-07, "loss": 0.7043, "step": 41554 }, { "epoch": 0.78, "learning_rate": 5.871602150670358e-07, "loss": 0.902, "step": 41555 }, { "epoch": 0.78, "learning_rate": 5.870618576770998e-07, "loss": 1.2565, "step": 41556 }, { "epoch": 0.78, "learning_rate": 5.869635074300162e-07, "loss": 0.9227, "step": 41557 }, { "epoch": 0.78, "learning_rate": 5.86865164326153e-07, "loss": 0.996, "step": 41558 }, { "epoch": 0.78, "learning_rate": 5.86766828365875e-07, "loss": 0.9078, "step": 41559 }, { "epoch": 0.78, "learning_rate": 5.866684995495528e-07, "loss": 0.697, "step": 41560 }, { "epoch": 0.78, "learning_rate": 5.865701778775506e-07, "loss": 0.8812, "step": 41561 }, { "epoch": 0.78, "learning_rate": 5.864718633502372e-07, "loss": 0.9164, "step": 41562 }, { "epoch": 0.78, "learning_rate": 5.86373555967979e-07, "loss": 1.1371, "step": 41563 }, { "epoch": 0.78, "learning_rate": 5.86275255731143e-07, "loss": 0.8902, "step": 41564 }, { "epoch": 0.78, "learning_rate": 5.861769626400967e-07, "loss": 0.9853, "step": 41565 }, { "epoch": 0.78, "learning_rate": 5.86078676695207e-07, "loss": 0.747, "step": 41566 }, { "epoch": 0.78, "learning_rate": 5.859803978968415e-07, "loss": 0.8753, "step": 41567 }, { "epoch": 0.78, "learning_rate": 5.858821262453652e-07, "loss": 1.112, "step": 41568 }, { "epoch": 0.78, "learning_rate": 5.857838617411477e-07, "loss": 0.989, "step": 41569 }, { "epoch": 0.78, "learning_rate": 5.856856043845538e-07, "loss": 0.8268, "step": 41570 }, { "epoch": 0.78, "learning_rate": 5.855873541759505e-07, "loss": 0.7853, "step": 41571 }, { "epoch": 0.78, "learning_rate": 5.854891111157065e-07, "loss": 0.8667, "step": 41572 }, { "epoch": 0.78, "learning_rate": 5.85390875204187e-07, "loss": 0.9153, "step": 41573 }, { "epoch": 0.78, "learning_rate": 5.852926464417594e-07, "loss": 0.6635, "step": 41574 }, { "epoch": 0.78, "learning_rate": 5.8519442482879e-07, "loss": 0.9351, "step": 41575 }, { "epoch": 0.78, "learning_rate": 5.85096210365646e-07, "loss": 1.0409, "step": 41576 }, { "epoch": 0.78, "learning_rate": 5.849980030526942e-07, "loss": 0.9103, "step": 41577 }, { "epoch": 0.78, "learning_rate": 5.848998028903011e-07, "loss": 0.9324, "step": 41578 }, { "epoch": 0.78, "learning_rate": 5.848016098788342e-07, "loss": 0.6862, "step": 41579 }, { "epoch": 0.78, "learning_rate": 5.847034240186577e-07, "loss": 1.0392, "step": 41580 }, { "epoch": 0.78, "learning_rate": 5.846052453101417e-07, "loss": 1.1521, "step": 41581 }, { "epoch": 0.78, "learning_rate": 5.845070737536498e-07, "loss": 0.7593, "step": 41582 }, { "epoch": 0.78, "learning_rate": 5.8440890934955e-07, "loss": 1.0096, "step": 41583 }, { "epoch": 0.78, "learning_rate": 5.843107520982086e-07, "loss": 0.8667, "step": 41584 }, { "epoch": 0.78, "learning_rate": 5.842126019999922e-07, "loss": 0.9413, "step": 41585 }, { "epoch": 0.78, "learning_rate": 5.841144590552672e-07, "loss": 0.8926, "step": 41586 }, { "epoch": 0.78, "learning_rate": 5.840163232644e-07, "loss": 1.0962, "step": 41587 }, { "epoch": 0.78, "learning_rate": 5.839181946277578e-07, "loss": 0.8879, "step": 41588 }, { "epoch": 0.78, "learning_rate": 5.838200731457047e-07, "loss": 0.946, "step": 41589 }, { "epoch": 0.78, "learning_rate": 5.837219588186102e-07, "loss": 0.9743, "step": 41590 }, { "epoch": 0.78, "learning_rate": 5.836238516468387e-07, "loss": 0.8752, "step": 41591 }, { "epoch": 0.78, "learning_rate": 5.83525751630756e-07, "loss": 0.8517, "step": 41592 }, { "epoch": 0.78, "learning_rate": 5.83427658770731e-07, "loss": 1.0659, "step": 41593 }, { "epoch": 0.78, "learning_rate": 5.833295730671276e-07, "loss": 1.0736, "step": 41594 }, { "epoch": 0.78, "learning_rate": 5.832314945203127e-07, "loss": 0.8441, "step": 41595 }, { "epoch": 0.78, "learning_rate": 5.831334231306526e-07, "loss": 0.8772, "step": 41596 }, { "epoch": 0.78, "learning_rate": 5.830353588985138e-07, "loss": 0.8459, "step": 41597 }, { "epoch": 0.78, "learning_rate": 5.82937301824262e-07, "loss": 0.8162, "step": 41598 }, { "epoch": 0.78, "learning_rate": 5.828392519082635e-07, "loss": 0.9863, "step": 41599 }, { "epoch": 0.78, "learning_rate": 5.827412091508852e-07, "loss": 0.9695, "step": 41600 }, { "epoch": 0.78, "learning_rate": 5.826431735524913e-07, "loss": 0.9469, "step": 41601 }, { "epoch": 0.78, "learning_rate": 5.825451451134501e-07, "loss": 1.0034, "step": 41602 }, { "epoch": 0.78, "learning_rate": 5.824471238341258e-07, "loss": 0.9379, "step": 41603 }, { "epoch": 0.78, "learning_rate": 5.823491097148853e-07, "loss": 0.9276, "step": 41604 }, { "epoch": 0.78, "learning_rate": 5.822511027560942e-07, "loss": 1.0298, "step": 41605 }, { "epoch": 0.78, "learning_rate": 5.82153102958119e-07, "loss": 1.0548, "step": 41606 }, { "epoch": 0.78, "learning_rate": 5.820551103213251e-07, "loss": 0.8169, "step": 41607 }, { "epoch": 0.79, "learning_rate": 5.819571248460787e-07, "loss": 0.8407, "step": 41608 }, { "epoch": 0.79, "learning_rate": 5.818591465327462e-07, "loss": 0.9282, "step": 41609 }, { "epoch": 0.79, "learning_rate": 5.817611753816915e-07, "loss": 0.8029, "step": 41610 }, { "epoch": 0.79, "learning_rate": 5.816632113932833e-07, "loss": 0.9962, "step": 41611 }, { "epoch": 0.79, "learning_rate": 5.815652545678849e-07, "loss": 1.0148, "step": 41612 }, { "epoch": 0.79, "learning_rate": 5.814673049058625e-07, "loss": 0.9872, "step": 41613 }, { "epoch": 0.79, "learning_rate": 5.813693624075837e-07, "loss": 0.8786, "step": 41614 }, { "epoch": 0.79, "learning_rate": 5.812714270734121e-07, "loss": 0.9127, "step": 41615 }, { "epoch": 0.79, "learning_rate": 5.81173498903714e-07, "loss": 0.8643, "step": 41616 }, { "epoch": 0.79, "learning_rate": 5.810755778988555e-07, "loss": 0.8817, "step": 41617 }, { "epoch": 0.79, "learning_rate": 5.809776640592019e-07, "loss": 0.8748, "step": 41618 }, { "epoch": 0.79, "learning_rate": 5.808797573851188e-07, "loss": 0.9644, "step": 41619 }, { "epoch": 0.79, "learning_rate": 5.807818578769719e-07, "loss": 0.9553, "step": 41620 }, { "epoch": 0.79, "learning_rate": 5.806839655351276e-07, "loss": 0.9955, "step": 41621 }, { "epoch": 0.79, "learning_rate": 5.805860803599489e-07, "loss": 0.8303, "step": 41622 }, { "epoch": 0.79, "learning_rate": 5.804882023518044e-07, "loss": 0.7212, "step": 41623 }, { "epoch": 0.79, "learning_rate": 5.803903315110574e-07, "loss": 0.942, "step": 41624 }, { "epoch": 0.79, "learning_rate": 5.80292467838074e-07, "loss": 1.1271, "step": 41625 }, { "epoch": 0.79, "learning_rate": 5.801946113332196e-07, "loss": 0.8995, "step": 41626 }, { "epoch": 0.79, "learning_rate": 5.800967619968598e-07, "loss": 0.7478, "step": 41627 }, { "epoch": 0.79, "learning_rate": 5.799989198293596e-07, "loss": 0.7997, "step": 41628 }, { "epoch": 0.79, "learning_rate": 5.799010848310849e-07, "loss": 0.8743, "step": 41629 }, { "epoch": 0.79, "learning_rate": 5.798032570024009e-07, "loss": 0.8604, "step": 41630 }, { "epoch": 0.79, "learning_rate": 5.797054363436716e-07, "loss": 0.8936, "step": 41631 }, { "epoch": 0.79, "learning_rate": 5.796076228552647e-07, "loss": 1.0022, "step": 41632 }, { "epoch": 0.79, "learning_rate": 5.795098165375435e-07, "loss": 0.8608, "step": 41633 }, { "epoch": 0.79, "learning_rate": 5.794120173908727e-07, "loss": 0.9373, "step": 41634 }, { "epoch": 0.79, "learning_rate": 5.793142254156204e-07, "loss": 0.752, "step": 41635 }, { "epoch": 0.79, "learning_rate": 5.792164406121486e-07, "loss": 0.8521, "step": 41636 }, { "epoch": 0.79, "learning_rate": 5.791186629808243e-07, "loss": 1.1835, "step": 41637 }, { "epoch": 0.79, "learning_rate": 5.790208925220118e-07, "loss": 0.9764, "step": 41638 }, { "epoch": 0.79, "learning_rate": 5.789231292360761e-07, "loss": 0.9801, "step": 41639 }, { "epoch": 0.79, "learning_rate": 5.788253731233828e-07, "loss": 0.8704, "step": 41640 }, { "epoch": 0.79, "learning_rate": 5.787276241842968e-07, "loss": 1.045, "step": 41641 }, { "epoch": 0.79, "learning_rate": 5.786298824191835e-07, "loss": 0.9227, "step": 41642 }, { "epoch": 0.79, "learning_rate": 5.785321478284059e-07, "loss": 1.0162, "step": 41643 }, { "epoch": 0.79, "learning_rate": 5.784344204123316e-07, "loss": 0.9663, "step": 41644 }, { "epoch": 0.79, "learning_rate": 5.783367001713239e-07, "loss": 0.9671, "step": 41645 }, { "epoch": 0.79, "learning_rate": 5.782389871057478e-07, "loss": 0.7235, "step": 41646 }, { "epoch": 0.79, "learning_rate": 5.781412812159684e-07, "loss": 0.9211, "step": 41647 }, { "epoch": 0.79, "learning_rate": 5.780435825023506e-07, "loss": 0.9179, "step": 41648 }, { "epoch": 0.79, "learning_rate": 5.779458909652591e-07, "loss": 0.9478, "step": 41649 }, { "epoch": 0.79, "learning_rate": 5.778482066050587e-07, "loss": 1.1528, "step": 41650 }, { "epoch": 0.79, "learning_rate": 5.777505294221147e-07, "loss": 0.7675, "step": 41651 }, { "epoch": 0.79, "learning_rate": 5.776528594167902e-07, "loss": 0.6814, "step": 41652 }, { "epoch": 0.79, "learning_rate": 5.775551965894521e-07, "loss": 0.9179, "step": 41653 }, { "epoch": 0.79, "learning_rate": 5.774575409404634e-07, "loss": 0.9232, "step": 41654 }, { "epoch": 0.79, "learning_rate": 5.773598924701887e-07, "loss": 0.8303, "step": 41655 }, { "epoch": 0.79, "learning_rate": 5.772622511789944e-07, "loss": 1.0214, "step": 41656 }, { "epoch": 0.79, "learning_rate": 5.771646170672434e-07, "loss": 1.0972, "step": 41657 }, { "epoch": 0.79, "learning_rate": 5.770669901353008e-07, "loss": 1.0942, "step": 41658 }, { "epoch": 0.79, "learning_rate": 5.769693703835308e-07, "loss": 0.772, "step": 41659 }, { "epoch": 0.79, "learning_rate": 5.768717578122984e-07, "loss": 0.9025, "step": 41660 }, { "epoch": 0.79, "learning_rate": 5.767741524219677e-07, "loss": 0.8301, "step": 41661 }, { "epoch": 0.79, "learning_rate": 5.766765542129038e-07, "loss": 1.0222, "step": 41662 }, { "epoch": 0.79, "learning_rate": 5.765789631854709e-07, "loss": 0.7913, "step": 41663 }, { "epoch": 0.79, "learning_rate": 5.76481379340032e-07, "loss": 0.9464, "step": 41664 }, { "epoch": 0.79, "learning_rate": 5.763838026769541e-07, "loss": 0.8903, "step": 41665 }, { "epoch": 0.79, "learning_rate": 5.762862331965993e-07, "loss": 0.8419, "step": 41666 }, { "epoch": 0.79, "learning_rate": 5.761886708993328e-07, "loss": 0.8718, "step": 41667 }, { "epoch": 0.79, "learning_rate": 5.760911157855187e-07, "loss": 0.9896, "step": 41668 }, { "epoch": 0.79, "learning_rate": 5.759935678555214e-07, "loss": 0.9578, "step": 41669 }, { "epoch": 0.79, "learning_rate": 5.758960271097061e-07, "loss": 0.9081, "step": 41670 }, { "epoch": 0.79, "learning_rate": 5.757984935484342e-07, "loss": 0.9687, "step": 41671 }, { "epoch": 0.79, "learning_rate": 5.757009671720734e-07, "loss": 0.7029, "step": 41672 }, { "epoch": 0.79, "learning_rate": 5.756034479809855e-07, "loss": 0.8171, "step": 41673 }, { "epoch": 0.79, "learning_rate": 5.755059359755352e-07, "loss": 1.0571, "step": 41674 }, { "epoch": 0.79, "learning_rate": 5.754084311560867e-07, "loss": 1.0258, "step": 41675 }, { "epoch": 0.79, "learning_rate": 5.753109335230045e-07, "loss": 1.0923, "step": 41676 }, { "epoch": 0.79, "learning_rate": 5.752134430766518e-07, "loss": 0.8296, "step": 41677 }, { "epoch": 0.79, "learning_rate": 5.751159598173933e-07, "loss": 0.8488, "step": 41678 }, { "epoch": 0.79, "learning_rate": 5.750184837455933e-07, "loss": 0.8257, "step": 41679 }, { "epoch": 0.79, "learning_rate": 5.749210148616141e-07, "loss": 0.9278, "step": 41680 }, { "epoch": 0.79, "learning_rate": 5.748235531658214e-07, "loss": 0.9695, "step": 41681 }, { "epoch": 0.79, "learning_rate": 5.747260986585792e-07, "loss": 0.9569, "step": 41682 }, { "epoch": 0.79, "learning_rate": 5.746286513402494e-07, "loss": 0.8034, "step": 41683 }, { "epoch": 0.79, "learning_rate": 5.745312112111983e-07, "loss": 1.0189, "step": 41684 }, { "epoch": 0.79, "learning_rate": 5.744337782717885e-07, "loss": 0.8297, "step": 41685 }, { "epoch": 0.79, "learning_rate": 5.743363525223833e-07, "loss": 0.7587, "step": 41686 }, { "epoch": 0.79, "learning_rate": 5.742389339633475e-07, "loss": 1.0181, "step": 41687 }, { "epoch": 0.79, "learning_rate": 5.741415225950445e-07, "loss": 1.0656, "step": 41688 }, { "epoch": 0.79, "learning_rate": 5.740441184178377e-07, "loss": 0.799, "step": 41689 }, { "epoch": 0.79, "learning_rate": 5.739467214320912e-07, "loss": 0.9525, "step": 41690 }, { "epoch": 0.79, "learning_rate": 5.738493316381697e-07, "loss": 0.8632, "step": 41691 }, { "epoch": 0.79, "learning_rate": 5.737519490364337e-07, "loss": 0.6704, "step": 41692 }, { "epoch": 0.79, "learning_rate": 5.736545736272508e-07, "loss": 0.9629, "step": 41693 }, { "epoch": 0.79, "learning_rate": 5.735572054109817e-07, "loss": 0.9219, "step": 41694 }, { "epoch": 0.79, "learning_rate": 5.73459844387991e-07, "loss": 0.8534, "step": 41695 }, { "epoch": 0.79, "learning_rate": 5.733624905586421e-07, "loss": 0.8838, "step": 41696 }, { "epoch": 0.79, "learning_rate": 5.732651439232986e-07, "loss": 0.9409, "step": 41697 }, { "epoch": 0.79, "learning_rate": 5.731678044823241e-07, "loss": 0.8318, "step": 41698 }, { "epoch": 0.79, "learning_rate": 5.73070472236082e-07, "loss": 0.9286, "step": 41699 }, { "epoch": 0.79, "learning_rate": 5.729731471849359e-07, "loss": 1.2014, "step": 41700 }, { "epoch": 0.79, "learning_rate": 5.72875829329248e-07, "loss": 1.032, "step": 41701 }, { "epoch": 0.79, "learning_rate": 5.727785186693832e-07, "loss": 0.912, "step": 41702 }, { "epoch": 0.79, "learning_rate": 5.726812152057051e-07, "loss": 0.9474, "step": 41703 }, { "epoch": 0.79, "learning_rate": 5.725839189385748e-07, "loss": 0.7728, "step": 41704 }, { "epoch": 0.79, "learning_rate": 5.724866298683587e-07, "loss": 0.7721, "step": 41705 }, { "epoch": 0.79, "learning_rate": 5.723893479954174e-07, "loss": 0.9215, "step": 41706 }, { "epoch": 0.79, "learning_rate": 5.722920733201154e-07, "loss": 0.8834, "step": 41707 }, { "epoch": 0.79, "learning_rate": 5.721948058428156e-07, "loss": 0.7062, "step": 41708 }, { "epoch": 0.79, "learning_rate": 5.72097545563881e-07, "loss": 0.868, "step": 41709 }, { "epoch": 0.79, "learning_rate": 5.720002924836754e-07, "loss": 0.787, "step": 41710 }, { "epoch": 0.79, "learning_rate": 5.719030466025616e-07, "loss": 0.9151, "step": 41711 }, { "epoch": 0.79, "learning_rate": 5.718058079209035e-07, "loss": 1.1837, "step": 41712 }, { "epoch": 0.79, "learning_rate": 5.717085764390617e-07, "loss": 1.0081, "step": 41713 }, { "epoch": 0.79, "learning_rate": 5.716113521574024e-07, "loss": 0.8786, "step": 41714 }, { "epoch": 0.79, "learning_rate": 5.715141350762865e-07, "loss": 0.8002, "step": 41715 }, { "epoch": 0.79, "learning_rate": 5.71416925196078e-07, "loss": 0.6951, "step": 41716 }, { "epoch": 0.79, "learning_rate": 5.71319722517139e-07, "loss": 0.861, "step": 41717 }, { "epoch": 0.79, "learning_rate": 5.712225270398336e-07, "loss": 0.9717, "step": 41718 }, { "epoch": 0.79, "learning_rate": 5.711253387645238e-07, "loss": 1.0142, "step": 41719 }, { "epoch": 0.79, "learning_rate": 5.71028157691573e-07, "loss": 0.995, "step": 41720 }, { "epoch": 0.79, "learning_rate": 5.709309838213445e-07, "loss": 0.8777, "step": 41721 }, { "epoch": 0.79, "learning_rate": 5.708338171541991e-07, "loss": 0.9809, "step": 41722 }, { "epoch": 0.79, "learning_rate": 5.707366576905021e-07, "loss": 0.8577, "step": 41723 }, { "epoch": 0.79, "learning_rate": 5.706395054306157e-07, "loss": 0.994, "step": 41724 }, { "epoch": 0.79, "learning_rate": 5.705423603749008e-07, "loss": 0.8542, "step": 41725 }, { "epoch": 0.79, "learning_rate": 5.704452225237231e-07, "loss": 1.0168, "step": 41726 }, { "epoch": 0.79, "learning_rate": 5.703480918774432e-07, "loss": 0.957, "step": 41727 }, { "epoch": 0.79, "learning_rate": 5.702509684364241e-07, "loss": 0.8155, "step": 41728 }, { "epoch": 0.79, "learning_rate": 5.701538522010288e-07, "loss": 0.8359, "step": 41729 }, { "epoch": 0.79, "learning_rate": 5.700567431716197e-07, "loss": 0.728, "step": 41730 }, { "epoch": 0.79, "learning_rate": 5.699596413485597e-07, "loss": 1.0712, "step": 41731 }, { "epoch": 0.79, "learning_rate": 5.698625467322114e-07, "loss": 0.8177, "step": 41732 }, { "epoch": 0.79, "learning_rate": 5.697654593229377e-07, "loss": 1.0168, "step": 41733 }, { "epoch": 0.79, "learning_rate": 5.696683791210991e-07, "loss": 0.9759, "step": 41734 }, { "epoch": 0.79, "learning_rate": 5.695713061270611e-07, "loss": 0.7932, "step": 41735 }, { "epoch": 0.79, "learning_rate": 5.694742403411841e-07, "loss": 0.8837, "step": 41736 }, { "epoch": 0.79, "learning_rate": 5.693771817638307e-07, "loss": 1.1848, "step": 41737 }, { "epoch": 0.79, "learning_rate": 5.692801303953641e-07, "loss": 1.0109, "step": 41738 }, { "epoch": 0.79, "learning_rate": 5.69183086236146e-07, "loss": 1.072, "step": 41739 }, { "epoch": 0.79, "learning_rate": 5.690860492865391e-07, "loss": 0.9394, "step": 41740 }, { "epoch": 0.79, "learning_rate": 5.689890195469058e-07, "loss": 0.8689, "step": 41741 }, { "epoch": 0.79, "learning_rate": 5.68891997017609e-07, "loss": 0.794, "step": 41742 }, { "epoch": 0.79, "learning_rate": 5.687949816990087e-07, "loss": 1.0615, "step": 41743 }, { "epoch": 0.79, "learning_rate": 5.686979735914697e-07, "loss": 1.1813, "step": 41744 }, { "epoch": 0.79, "learning_rate": 5.68600972695354e-07, "loss": 0.8651, "step": 41745 }, { "epoch": 0.79, "learning_rate": 5.685039790110214e-07, "loss": 0.9095, "step": 41746 }, { "epoch": 0.79, "learning_rate": 5.684069925388371e-07, "loss": 0.7562, "step": 41747 }, { "epoch": 0.79, "learning_rate": 5.683100132791613e-07, "loss": 0.865, "step": 41748 }, { "epoch": 0.79, "learning_rate": 5.682130412323567e-07, "loss": 0.9167, "step": 41749 }, { "epoch": 0.79, "learning_rate": 5.681160763987853e-07, "loss": 0.9371, "step": 41750 }, { "epoch": 0.79, "learning_rate": 5.680191187788092e-07, "loss": 0.7989, "step": 41751 }, { "epoch": 0.79, "learning_rate": 5.679221683727906e-07, "loss": 0.7332, "step": 41752 }, { "epoch": 0.79, "learning_rate": 5.678252251810912e-07, "loss": 0.917, "step": 41753 }, { "epoch": 0.79, "learning_rate": 5.67728289204074e-07, "loss": 0.8113, "step": 41754 }, { "epoch": 0.79, "learning_rate": 5.676313604420988e-07, "loss": 1.0275, "step": 41755 }, { "epoch": 0.79, "learning_rate": 5.675344388955301e-07, "loss": 1.0557, "step": 41756 }, { "epoch": 0.79, "learning_rate": 5.674375245647279e-07, "loss": 0.9275, "step": 41757 }, { "epoch": 0.79, "learning_rate": 5.673406174500548e-07, "loss": 0.8992, "step": 41758 }, { "epoch": 0.79, "learning_rate": 5.672437175518725e-07, "loss": 1.0061, "step": 41759 }, { "epoch": 0.79, "learning_rate": 5.671468248705428e-07, "loss": 0.7858, "step": 41760 }, { "epoch": 0.79, "learning_rate": 5.670499394064277e-07, "loss": 0.8579, "step": 41761 }, { "epoch": 0.79, "learning_rate": 5.669530611598889e-07, "loss": 1.0567, "step": 41762 }, { "epoch": 0.79, "learning_rate": 5.668561901312889e-07, "loss": 1.1304, "step": 41763 }, { "epoch": 0.79, "learning_rate": 5.667593263209869e-07, "loss": 0.8679, "step": 41764 }, { "epoch": 0.79, "learning_rate": 5.666624697293474e-07, "loss": 0.8258, "step": 41765 }, { "epoch": 0.79, "learning_rate": 5.665656203567313e-07, "loss": 0.8467, "step": 41766 }, { "epoch": 0.79, "learning_rate": 5.664687782034986e-07, "loss": 0.6826, "step": 41767 }, { "epoch": 0.79, "learning_rate": 5.663719432700137e-07, "loss": 1.0872, "step": 41768 }, { "epoch": 0.79, "learning_rate": 5.66275115556636e-07, "loss": 0.981, "step": 41769 }, { "epoch": 0.79, "learning_rate": 5.661782950637276e-07, "loss": 0.9178, "step": 41770 }, { "epoch": 0.79, "learning_rate": 5.660814817916501e-07, "loss": 0.978, "step": 41771 }, { "epoch": 0.79, "learning_rate": 5.659846757407653e-07, "loss": 0.9442, "step": 41772 }, { "epoch": 0.79, "learning_rate": 5.658878769114343e-07, "loss": 0.6594, "step": 41773 }, { "epoch": 0.79, "learning_rate": 5.657910853040186e-07, "loss": 1.2355, "step": 41774 }, { "epoch": 0.79, "learning_rate": 5.656943009188803e-07, "loss": 1.103, "step": 41775 }, { "epoch": 0.79, "learning_rate": 5.655975237563791e-07, "loss": 0.9031, "step": 41776 }, { "epoch": 0.79, "learning_rate": 5.655007538168786e-07, "loss": 0.9197, "step": 41777 }, { "epoch": 0.79, "learning_rate": 5.654039911007384e-07, "loss": 1.0006, "step": 41778 }, { "epoch": 0.79, "learning_rate": 5.653072356083203e-07, "loss": 0.8719, "step": 41779 }, { "epoch": 0.79, "learning_rate": 5.652104873399855e-07, "loss": 0.9346, "step": 41780 }, { "epoch": 0.79, "learning_rate": 5.651137462960957e-07, "loss": 1.0411, "step": 41781 }, { "epoch": 0.79, "learning_rate": 5.650170124770116e-07, "loss": 0.8537, "step": 41782 }, { "epoch": 0.79, "learning_rate": 5.649202858830949e-07, "loss": 1.1205, "step": 41783 }, { "epoch": 0.79, "learning_rate": 5.64823566514707e-07, "loss": 0.9576, "step": 41784 }, { "epoch": 0.79, "learning_rate": 5.647268543722073e-07, "loss": 0.7162, "step": 41785 }, { "epoch": 0.79, "learning_rate": 5.646301494559588e-07, "loss": 0.9774, "step": 41786 }, { "epoch": 0.79, "learning_rate": 5.645334517663225e-07, "loss": 0.8943, "step": 41787 }, { "epoch": 0.79, "learning_rate": 5.64436761303658e-07, "loss": 1.0502, "step": 41788 }, { "epoch": 0.79, "learning_rate": 5.643400780683284e-07, "loss": 0.7368, "step": 41789 }, { "epoch": 0.79, "learning_rate": 5.642434020606929e-07, "loss": 0.7766, "step": 41790 }, { "epoch": 0.79, "learning_rate": 5.641467332811134e-07, "loss": 0.6391, "step": 41791 }, { "epoch": 0.79, "learning_rate": 5.640500717299505e-07, "loss": 0.8062, "step": 41792 }, { "epoch": 0.79, "learning_rate": 5.639534174075653e-07, "loss": 0.9218, "step": 41793 }, { "epoch": 0.79, "learning_rate": 5.638567703143186e-07, "loss": 0.9832, "step": 41794 }, { "epoch": 0.79, "learning_rate": 5.637601304505713e-07, "loss": 0.7083, "step": 41795 }, { "epoch": 0.79, "learning_rate": 5.636634978166852e-07, "loss": 0.9243, "step": 41796 }, { "epoch": 0.79, "learning_rate": 5.635668724130187e-07, "loss": 0.8652, "step": 41797 }, { "epoch": 0.79, "learning_rate": 5.634702542399356e-07, "loss": 0.8801, "step": 41798 }, { "epoch": 0.79, "learning_rate": 5.633736432977943e-07, "loss": 1.0716, "step": 41799 }, { "epoch": 0.79, "learning_rate": 5.632770395869566e-07, "loss": 0.9562, "step": 41800 }, { "epoch": 0.79, "learning_rate": 5.631804431077831e-07, "loss": 0.8536, "step": 41801 }, { "epoch": 0.79, "learning_rate": 5.630838538606345e-07, "loss": 0.8484, "step": 41802 }, { "epoch": 0.79, "learning_rate": 5.629872718458712e-07, "loss": 0.8882, "step": 41803 }, { "epoch": 0.79, "learning_rate": 5.628906970638543e-07, "loss": 0.8674, "step": 41804 }, { "epoch": 0.79, "learning_rate": 5.627941295149445e-07, "loss": 1.0308, "step": 41805 }, { "epoch": 0.79, "learning_rate": 5.626975691995009e-07, "loss": 1.192, "step": 41806 }, { "epoch": 0.79, "learning_rate": 5.626010161178857e-07, "loss": 0.8268, "step": 41807 }, { "epoch": 0.79, "learning_rate": 5.625044702704597e-07, "loss": 0.8566, "step": 41808 }, { "epoch": 0.79, "learning_rate": 5.624079316575812e-07, "loss": 0.756, "step": 41809 }, { "epoch": 0.79, "learning_rate": 5.623114002796135e-07, "loss": 0.8824, "step": 41810 }, { "epoch": 0.79, "learning_rate": 5.622148761369148e-07, "loss": 1.1464, "step": 41811 }, { "epoch": 0.79, "learning_rate": 5.621183592298465e-07, "loss": 1.0449, "step": 41812 }, { "epoch": 0.79, "learning_rate": 5.620218495587687e-07, "loss": 0.9501, "step": 41813 }, { "epoch": 0.79, "learning_rate": 5.619253471240418e-07, "loss": 0.9, "step": 41814 }, { "epoch": 0.79, "learning_rate": 5.618288519260265e-07, "loss": 0.9023, "step": 41815 }, { "epoch": 0.79, "learning_rate": 5.617323639650826e-07, "loss": 0.7986, "step": 41816 }, { "epoch": 0.79, "learning_rate": 5.616358832415717e-07, "loss": 0.7099, "step": 41817 }, { "epoch": 0.79, "learning_rate": 5.615394097558513e-07, "loss": 1.137, "step": 41818 }, { "epoch": 0.79, "learning_rate": 5.614429435082846e-07, "loss": 1.001, "step": 41819 }, { "epoch": 0.79, "learning_rate": 5.6134648449923e-07, "loss": 0.8906, "step": 41820 }, { "epoch": 0.79, "learning_rate": 5.612500327290482e-07, "loss": 1.1377, "step": 41821 }, { "epoch": 0.79, "learning_rate": 5.611535881980992e-07, "loss": 0.9261, "step": 41822 }, { "epoch": 0.79, "learning_rate": 5.610571509067434e-07, "loss": 0.7164, "step": 41823 }, { "epoch": 0.79, "learning_rate": 5.609607208553406e-07, "loss": 0.916, "step": 41824 }, { "epoch": 0.79, "learning_rate": 5.608642980442511e-07, "loss": 1.1948, "step": 41825 }, { "epoch": 0.79, "learning_rate": 5.607678824738355e-07, "loss": 0.8988, "step": 41826 }, { "epoch": 0.79, "learning_rate": 5.606714741444519e-07, "loss": 0.8225, "step": 41827 }, { "epoch": 0.79, "learning_rate": 5.605750730564621e-07, "loss": 0.6646, "step": 41828 }, { "epoch": 0.79, "learning_rate": 5.604786792102263e-07, "loss": 0.7108, "step": 41829 }, { "epoch": 0.79, "learning_rate": 5.60382292606102e-07, "loss": 0.8068, "step": 41830 }, { "epoch": 0.79, "learning_rate": 5.602859132444524e-07, "loss": 1.1655, "step": 41831 }, { "epoch": 0.79, "learning_rate": 5.60189541125635e-07, "loss": 0.9457, "step": 41832 }, { "epoch": 0.79, "learning_rate": 5.600931762500103e-07, "loss": 0.9483, "step": 41833 }, { "epoch": 0.79, "learning_rate": 5.599968186179383e-07, "loss": 0.9108, "step": 41834 }, { "epoch": 0.79, "learning_rate": 5.599004682297787e-07, "loss": 0.9808, "step": 41835 }, { "epoch": 0.79, "learning_rate": 5.598041250858913e-07, "loss": 0.9216, "step": 41836 }, { "epoch": 0.79, "learning_rate": 5.597077891866357e-07, "loss": 1.1047, "step": 41837 }, { "epoch": 0.79, "learning_rate": 5.596114605323725e-07, "loss": 0.933, "step": 41838 }, { "epoch": 0.79, "learning_rate": 5.595151391234594e-07, "loss": 0.8451, "step": 41839 }, { "epoch": 0.79, "learning_rate": 5.594188249602584e-07, "loss": 0.8895, "step": 41840 }, { "epoch": 0.79, "learning_rate": 5.593225180431272e-07, "loss": 0.7586, "step": 41841 }, { "epoch": 0.79, "learning_rate": 5.592262183724264e-07, "loss": 0.8825, "step": 41842 }, { "epoch": 0.79, "learning_rate": 5.591299259485153e-07, "loss": 0.8615, "step": 41843 }, { "epoch": 0.79, "learning_rate": 5.590336407717537e-07, "loss": 1.0367, "step": 41844 }, { "epoch": 0.79, "learning_rate": 5.58937362842501e-07, "loss": 0.9905, "step": 41845 }, { "epoch": 0.79, "learning_rate": 5.588410921611165e-07, "loss": 0.9424, "step": 41846 }, { "epoch": 0.79, "learning_rate": 5.587448287279607e-07, "loss": 0.9105, "step": 41847 }, { "epoch": 0.79, "learning_rate": 5.586485725433907e-07, "loss": 0.8564, "step": 41848 }, { "epoch": 0.79, "learning_rate": 5.58552323607768e-07, "loss": 0.9052, "step": 41849 }, { "epoch": 0.79, "learning_rate": 5.584560819214524e-07, "loss": 1.1589, "step": 41850 }, { "epoch": 0.79, "learning_rate": 5.583598474848006e-07, "loss": 0.9302, "step": 41851 }, { "epoch": 0.79, "learning_rate": 5.58263620298175e-07, "loss": 0.8621, "step": 41852 }, { "epoch": 0.79, "learning_rate": 5.581674003619328e-07, "loss": 0.9223, "step": 41853 }, { "epoch": 0.79, "learning_rate": 5.580711876764341e-07, "loss": 0.8477, "step": 41854 }, { "epoch": 0.79, "learning_rate": 5.57974982242038e-07, "loss": 0.9534, "step": 41855 }, { "epoch": 0.79, "learning_rate": 5.578787840591037e-07, "loss": 1.1945, "step": 41856 }, { "epoch": 0.79, "learning_rate": 5.577825931279906e-07, "loss": 0.9448, "step": 41857 }, { "epoch": 0.79, "learning_rate": 5.576864094490578e-07, "loss": 0.6349, "step": 41858 }, { "epoch": 0.79, "learning_rate": 5.575902330226651e-07, "loss": 0.9897, "step": 41859 }, { "epoch": 0.79, "learning_rate": 5.574940638491694e-07, "loss": 0.8442, "step": 41860 }, { "epoch": 0.79, "learning_rate": 5.573979019289327e-07, "loss": 0.7779, "step": 41861 }, { "epoch": 0.79, "learning_rate": 5.573017472623118e-07, "loss": 1.1065, "step": 41862 }, { "epoch": 0.79, "learning_rate": 5.57205599849667e-07, "loss": 0.9085, "step": 41863 }, { "epoch": 0.79, "learning_rate": 5.571094596913568e-07, "loss": 0.7738, "step": 41864 }, { "epoch": 0.79, "learning_rate": 5.570133267877401e-07, "loss": 1.0651, "step": 41865 }, { "epoch": 0.79, "learning_rate": 5.569172011391764e-07, "loss": 0.6504, "step": 41866 }, { "epoch": 0.79, "learning_rate": 5.568210827460238e-07, "loss": 0.7455, "step": 41867 }, { "epoch": 0.79, "learning_rate": 5.567249716086429e-07, "loss": 1.0051, "step": 41868 }, { "epoch": 0.79, "learning_rate": 5.566288677273895e-07, "loss": 1.0434, "step": 41869 }, { "epoch": 0.79, "learning_rate": 5.565327711026255e-07, "loss": 1.0356, "step": 41870 }, { "epoch": 0.79, "learning_rate": 5.564366817347089e-07, "loss": 0.7558, "step": 41871 }, { "epoch": 0.79, "learning_rate": 5.563405996239968e-07, "loss": 0.899, "step": 41872 }, { "epoch": 0.79, "learning_rate": 5.562445247708509e-07, "loss": 0.7498, "step": 41873 }, { "epoch": 0.79, "learning_rate": 5.561484571756276e-07, "loss": 0.8254, "step": 41874 }, { "epoch": 0.79, "learning_rate": 5.560523968386864e-07, "loss": 1.2051, "step": 41875 }, { "epoch": 0.79, "learning_rate": 5.559563437603857e-07, "loss": 0.7718, "step": 41876 }, { "epoch": 0.79, "learning_rate": 5.558602979410845e-07, "loss": 0.9446, "step": 41877 }, { "epoch": 0.79, "learning_rate": 5.557642593811413e-07, "loss": 0.9447, "step": 41878 }, { "epoch": 0.79, "learning_rate": 5.55668228080915e-07, "loss": 0.6825, "step": 41879 }, { "epoch": 0.79, "learning_rate": 5.555722040407643e-07, "loss": 0.9089, "step": 41880 }, { "epoch": 0.79, "learning_rate": 5.554761872610462e-07, "loss": 0.9183, "step": 41881 }, { "epoch": 0.79, "learning_rate": 5.553801777421217e-07, "loss": 0.9726, "step": 41882 }, { "epoch": 0.79, "learning_rate": 5.552841754843472e-07, "loss": 0.8651, "step": 41883 }, { "epoch": 0.79, "learning_rate": 5.551881804880821e-07, "loss": 0.9244, "step": 41884 }, { "epoch": 0.79, "learning_rate": 5.550921927536848e-07, "loss": 0.721, "step": 41885 }, { "epoch": 0.79, "learning_rate": 5.549962122815133e-07, "loss": 1.0475, "step": 41886 }, { "epoch": 0.79, "learning_rate": 5.549002390719265e-07, "loss": 1.1808, "step": 41887 }, { "epoch": 0.79, "learning_rate": 5.548042731252825e-07, "loss": 0.983, "step": 41888 }, { "epoch": 0.79, "learning_rate": 5.547083144419408e-07, "loss": 0.8408, "step": 41889 }, { "epoch": 0.79, "learning_rate": 5.546123630222566e-07, "loss": 0.8981, "step": 41890 }, { "epoch": 0.79, "learning_rate": 5.545164188665914e-07, "loss": 0.9741, "step": 41891 }, { "epoch": 0.79, "learning_rate": 5.544204819753026e-07, "loss": 0.7735, "step": 41892 }, { "epoch": 0.79, "learning_rate": 5.543245523487467e-07, "loss": 1.1025, "step": 41893 }, { "epoch": 0.79, "learning_rate": 5.542286299872848e-07, "loss": 0.9333, "step": 41894 }, { "epoch": 0.79, "learning_rate": 5.541327148912728e-07, "loss": 0.8308, "step": 41895 }, { "epoch": 0.79, "learning_rate": 5.540368070610696e-07, "loss": 0.8029, "step": 41896 }, { "epoch": 0.79, "learning_rate": 5.539409064970333e-07, "loss": 0.7596, "step": 41897 }, { "epoch": 0.79, "learning_rate": 5.538450131995221e-07, "loss": 0.9417, "step": 41898 }, { "epoch": 0.79, "learning_rate": 5.537491271688936e-07, "loss": 0.9489, "step": 41899 }, { "epoch": 0.79, "learning_rate": 5.536532484055066e-07, "loss": 0.8957, "step": 41900 }, { "epoch": 0.79, "learning_rate": 5.535573769097192e-07, "loss": 0.8789, "step": 41901 }, { "epoch": 0.79, "learning_rate": 5.534615126818874e-07, "loss": 0.7356, "step": 41902 }, { "epoch": 0.79, "learning_rate": 5.533656557223721e-07, "loss": 0.7624, "step": 41903 }, { "epoch": 0.79, "learning_rate": 5.532698060315289e-07, "loss": 1.0172, "step": 41904 }, { "epoch": 0.79, "learning_rate": 5.531739636097166e-07, "loss": 0.7691, "step": 41905 }, { "epoch": 0.79, "learning_rate": 5.530781284572934e-07, "loss": 0.8865, "step": 41906 }, { "epoch": 0.79, "learning_rate": 5.529823005746162e-07, "loss": 0.9063, "step": 41907 }, { "epoch": 0.79, "learning_rate": 5.528864799620446e-07, "loss": 0.8358, "step": 41908 }, { "epoch": 0.79, "learning_rate": 5.527906666199337e-07, "loss": 1.0755, "step": 41909 }, { "epoch": 0.79, "learning_rate": 5.52694860548644e-07, "loss": 0.8346, "step": 41910 }, { "epoch": 0.79, "learning_rate": 5.525990617485314e-07, "loss": 0.8359, "step": 41911 }, { "epoch": 0.79, "learning_rate": 5.525032702199532e-07, "loss": 0.9775, "step": 41912 }, { "epoch": 0.79, "learning_rate": 5.524074859632697e-07, "loss": 1.0085, "step": 41913 }, { "epoch": 0.79, "learning_rate": 5.523117089788363e-07, "loss": 0.9865, "step": 41914 }, { "epoch": 0.79, "learning_rate": 5.522159392670112e-07, "loss": 0.9968, "step": 41915 }, { "epoch": 0.79, "learning_rate": 5.52120176828152e-07, "loss": 0.8818, "step": 41916 }, { "epoch": 0.79, "learning_rate": 5.520244216626163e-07, "loss": 0.9518, "step": 41917 }, { "epoch": 0.79, "learning_rate": 5.519286737707619e-07, "loss": 1.4474, "step": 41918 }, { "epoch": 0.79, "learning_rate": 5.51832933152946e-07, "loss": 1.1699, "step": 41919 }, { "epoch": 0.79, "learning_rate": 5.517371998095266e-07, "loss": 0.9024, "step": 41920 }, { "epoch": 0.79, "learning_rate": 5.516414737408598e-07, "loss": 0.9291, "step": 41921 }, { "epoch": 0.79, "learning_rate": 5.515457549473052e-07, "loss": 0.871, "step": 41922 }, { "epoch": 0.79, "learning_rate": 5.514500434292184e-07, "loss": 0.9582, "step": 41923 }, { "epoch": 0.79, "learning_rate": 5.513543391869572e-07, "loss": 0.9908, "step": 41924 }, { "epoch": 0.79, "learning_rate": 5.512586422208793e-07, "loss": 0.8985, "step": 41925 }, { "epoch": 0.79, "learning_rate": 5.51162952531342e-07, "loss": 0.967, "step": 41926 }, { "epoch": 0.79, "learning_rate": 5.510672701187022e-07, "loss": 0.9219, "step": 41927 }, { "epoch": 0.79, "learning_rate": 5.509715949833178e-07, "loss": 1.067, "step": 41928 }, { "epoch": 0.79, "learning_rate": 5.50875927125546e-07, "loss": 0.8304, "step": 41929 }, { "epoch": 0.79, "learning_rate": 5.507802665457427e-07, "loss": 0.8246, "step": 41930 }, { "epoch": 0.79, "learning_rate": 5.506846132442672e-07, "loss": 0.8829, "step": 41931 }, { "epoch": 0.79, "learning_rate": 5.50588967221475e-07, "loss": 1.161, "step": 41932 }, { "epoch": 0.79, "learning_rate": 5.504933284777231e-07, "loss": 0.8215, "step": 41933 }, { "epoch": 0.79, "learning_rate": 5.503976970133709e-07, "loss": 1.1016, "step": 41934 }, { "epoch": 0.79, "learning_rate": 5.503020728287731e-07, "loss": 0.6939, "step": 41935 }, { "epoch": 0.79, "learning_rate": 5.502064559242876e-07, "loss": 0.9567, "step": 41936 }, { "epoch": 0.79, "learning_rate": 5.501108463002714e-07, "loss": 1.1918, "step": 41937 }, { "epoch": 0.79, "learning_rate": 5.500152439570816e-07, "loss": 1.0496, "step": 41938 }, { "epoch": 0.79, "learning_rate": 5.49919648895075e-07, "loss": 0.7263, "step": 41939 }, { "epoch": 0.79, "learning_rate": 5.498240611146086e-07, "loss": 0.8459, "step": 41940 }, { "epoch": 0.79, "learning_rate": 5.497284806160403e-07, "loss": 0.864, "step": 41941 }, { "epoch": 0.79, "learning_rate": 5.496329073997244e-07, "loss": 0.8419, "step": 41942 }, { "epoch": 0.79, "learning_rate": 5.49537341466021e-07, "loss": 1.038, "step": 41943 }, { "epoch": 0.79, "learning_rate": 5.494417828152845e-07, "loss": 1.0106, "step": 41944 }, { "epoch": 0.79, "learning_rate": 5.493462314478726e-07, "loss": 0.8708, "step": 41945 }, { "epoch": 0.79, "learning_rate": 5.49250687364142e-07, "loss": 0.9808, "step": 41946 }, { "epoch": 0.79, "learning_rate": 5.491551505644498e-07, "loss": 1.0538, "step": 41947 }, { "epoch": 0.79, "learning_rate": 5.490596210491522e-07, "loss": 0.8535, "step": 41948 }, { "epoch": 0.79, "learning_rate": 5.489640988186063e-07, "loss": 0.788, "step": 41949 }, { "epoch": 0.79, "learning_rate": 5.488685838731691e-07, "loss": 1.1981, "step": 41950 }, { "epoch": 0.79, "learning_rate": 5.487730762131956e-07, "loss": 0.924, "step": 41951 }, { "epoch": 0.79, "learning_rate": 5.48677575839045e-07, "loss": 1.0118, "step": 41952 }, { "epoch": 0.79, "learning_rate": 5.485820827510718e-07, "loss": 0.7796, "step": 41953 }, { "epoch": 0.79, "learning_rate": 5.484865969496328e-07, "loss": 0.8292, "step": 41954 }, { "epoch": 0.79, "learning_rate": 5.48391118435086e-07, "loss": 1.0606, "step": 41955 }, { "epoch": 0.79, "learning_rate": 5.482956472077863e-07, "loss": 0.9034, "step": 41956 }, { "epoch": 0.79, "learning_rate": 5.482001832680911e-07, "loss": 0.949, "step": 41957 }, { "epoch": 0.79, "learning_rate": 5.481047266163564e-07, "loss": 0.8663, "step": 41958 }, { "epoch": 0.79, "learning_rate": 5.480092772529386e-07, "loss": 0.8012, "step": 41959 }, { "epoch": 0.79, "learning_rate": 5.479138351781945e-07, "loss": 0.8477, "step": 41960 }, { "epoch": 0.79, "learning_rate": 5.478184003924802e-07, "loss": 0.9498, "step": 41961 }, { "epoch": 0.79, "learning_rate": 5.477229728961531e-07, "loss": 0.9405, "step": 41962 }, { "epoch": 0.79, "learning_rate": 5.476275526895669e-07, "loss": 0.9239, "step": 41963 }, { "epoch": 0.79, "learning_rate": 5.47532139773081e-07, "loss": 0.8296, "step": 41964 }, { "epoch": 0.79, "learning_rate": 5.474367341470496e-07, "loss": 0.8588, "step": 41965 }, { "epoch": 0.79, "learning_rate": 5.473413358118296e-07, "loss": 0.863, "step": 41966 }, { "epoch": 0.79, "learning_rate": 5.47245944767777e-07, "loss": 0.7841, "step": 41967 }, { "epoch": 0.79, "learning_rate": 5.471505610152483e-07, "loss": 0.9803, "step": 41968 }, { "epoch": 0.79, "learning_rate": 5.470551845545996e-07, "loss": 1.2607, "step": 41969 }, { "epoch": 0.79, "learning_rate": 5.469598153861868e-07, "loss": 0.9045, "step": 41970 }, { "epoch": 0.79, "learning_rate": 5.468644535103668e-07, "loss": 0.9693, "step": 41971 }, { "epoch": 0.79, "learning_rate": 5.467690989274937e-07, "loss": 0.8647, "step": 41972 }, { "epoch": 0.79, "learning_rate": 5.466737516379267e-07, "loss": 0.8669, "step": 41973 }, { "epoch": 0.79, "learning_rate": 5.465784116420189e-07, "loss": 1.0481, "step": 41974 }, { "epoch": 0.79, "learning_rate": 5.464830789401268e-07, "loss": 0.9967, "step": 41975 }, { "epoch": 0.79, "learning_rate": 5.463877535326084e-07, "loss": 0.8654, "step": 41976 }, { "epoch": 0.79, "learning_rate": 5.462924354198176e-07, "loss": 0.9957, "step": 41977 }, { "epoch": 0.79, "learning_rate": 5.461971246021108e-07, "loss": 0.7293, "step": 41978 }, { "epoch": 0.79, "learning_rate": 5.461018210798441e-07, "loss": 0.8781, "step": 41979 }, { "epoch": 0.79, "learning_rate": 5.460065248533733e-07, "loss": 0.8791, "step": 41980 }, { "epoch": 0.79, "learning_rate": 5.459112359230542e-07, "loss": 0.9229, "step": 41981 }, { "epoch": 0.79, "learning_rate": 5.458159542892427e-07, "loss": 1.0969, "step": 41982 }, { "epoch": 0.79, "learning_rate": 5.457206799522952e-07, "loss": 0.8503, "step": 41983 }, { "epoch": 0.79, "learning_rate": 5.456254129125651e-07, "loss": 0.5754, "step": 41984 }, { "epoch": 0.79, "learning_rate": 5.455301531704116e-07, "loss": 0.9076, "step": 41985 }, { "epoch": 0.79, "learning_rate": 5.454349007261878e-07, "loss": 0.9449, "step": 41986 }, { "epoch": 0.79, "learning_rate": 5.453396555802498e-07, "loss": 1.0123, "step": 41987 }, { "epoch": 0.79, "learning_rate": 5.452444177329541e-07, "loss": 0.878, "step": 41988 }, { "epoch": 0.79, "learning_rate": 5.451491871846554e-07, "loss": 0.8278, "step": 41989 }, { "epoch": 0.79, "learning_rate": 5.450539639357099e-07, "loss": 0.8218, "step": 41990 }, { "epoch": 0.79, "learning_rate": 5.449587479864729e-07, "loss": 0.9457, "step": 41991 }, { "epoch": 0.79, "learning_rate": 5.448635393373005e-07, "loss": 0.948, "step": 41992 }, { "epoch": 0.79, "learning_rate": 5.447683379885468e-07, "loss": 0.8529, "step": 41993 }, { "epoch": 0.79, "learning_rate": 5.446731439405686e-07, "loss": 1.0708, "step": 41994 }, { "epoch": 0.79, "learning_rate": 5.445779571937215e-07, "loss": 0.9478, "step": 41995 }, { "epoch": 0.79, "learning_rate": 5.444827777483591e-07, "loss": 0.8037, "step": 41996 }, { "epoch": 0.79, "learning_rate": 5.443876056048394e-07, "loss": 0.9739, "step": 41997 }, { "epoch": 0.79, "learning_rate": 5.442924407635158e-07, "loss": 0.827, "step": 41998 }, { "epoch": 0.79, "learning_rate": 5.441972832247441e-07, "loss": 1.131, "step": 41999 }, { "epoch": 0.79, "learning_rate": 5.441021329888799e-07, "loss": 0.9527, "step": 42000 }, { "epoch": 0.79, "learning_rate": 5.440069900562783e-07, "loss": 0.9718, "step": 42001 }, { "epoch": 0.79, "learning_rate": 5.439118544272948e-07, "loss": 1.0591, "step": 42002 }, { "epoch": 0.79, "learning_rate": 5.438167261022842e-07, "loss": 0.92, "step": 42003 }, { "epoch": 0.79, "learning_rate": 5.437216050816027e-07, "loss": 0.671, "step": 42004 }, { "epoch": 0.79, "learning_rate": 5.436264913656036e-07, "loss": 0.944, "step": 42005 }, { "epoch": 0.79, "learning_rate": 5.435313849546444e-07, "loss": 0.9741, "step": 42006 }, { "epoch": 0.79, "learning_rate": 5.434362858490783e-07, "loss": 0.9884, "step": 42007 }, { "epoch": 0.79, "learning_rate": 5.433411940492611e-07, "loss": 0.9419, "step": 42008 }, { "epoch": 0.79, "learning_rate": 5.432461095555481e-07, "loss": 0.9027, "step": 42009 }, { "epoch": 0.79, "learning_rate": 5.431510323682939e-07, "loss": 0.9258, "step": 42010 }, { "epoch": 0.79, "learning_rate": 5.43055962487854e-07, "loss": 0.7542, "step": 42011 }, { "epoch": 0.79, "learning_rate": 5.42960899914583e-07, "loss": 0.9896, "step": 42012 }, { "epoch": 0.79, "learning_rate": 5.428658446488367e-07, "loss": 1.01, "step": 42013 }, { "epoch": 0.79, "learning_rate": 5.427707966909679e-07, "loss": 1.0652, "step": 42014 }, { "epoch": 0.79, "learning_rate": 5.426757560413335e-07, "loss": 0.951, "step": 42015 }, { "epoch": 0.79, "learning_rate": 5.425807227002888e-07, "loss": 0.6711, "step": 42016 }, { "epoch": 0.79, "learning_rate": 5.424856966681861e-07, "loss": 0.9795, "step": 42017 }, { "epoch": 0.79, "learning_rate": 5.42390677945383e-07, "loss": 0.8077, "step": 42018 }, { "epoch": 0.79, "learning_rate": 5.422956665322327e-07, "loss": 1.0685, "step": 42019 }, { "epoch": 0.79, "learning_rate": 5.422006624290904e-07, "loss": 0.9954, "step": 42020 }, { "epoch": 0.79, "learning_rate": 5.421056656363105e-07, "loss": 1.0716, "step": 42021 }, { "epoch": 0.79, "learning_rate": 5.420106761542482e-07, "loss": 0.8734, "step": 42022 }, { "epoch": 0.79, "learning_rate": 5.419156939832579e-07, "loss": 0.877, "step": 42023 }, { "epoch": 0.79, "learning_rate": 5.418207191236946e-07, "loss": 0.9722, "step": 42024 }, { "epoch": 0.79, "learning_rate": 5.41725751575913e-07, "loss": 1.0936, "step": 42025 }, { "epoch": 0.79, "learning_rate": 5.416307913402663e-07, "loss": 0.8913, "step": 42026 }, { "epoch": 0.79, "learning_rate": 5.415358384171115e-07, "loss": 0.9921, "step": 42027 }, { "epoch": 0.79, "learning_rate": 5.414408928068013e-07, "loss": 0.8239, "step": 42028 }, { "epoch": 0.79, "learning_rate": 5.413459545096905e-07, "loss": 0.9299, "step": 42029 }, { "epoch": 0.79, "learning_rate": 5.41251023526134e-07, "loss": 0.8454, "step": 42030 }, { "epoch": 0.79, "learning_rate": 5.41156099856486e-07, "loss": 1.0986, "step": 42031 }, { "epoch": 0.79, "learning_rate": 5.410611835011012e-07, "loss": 1.0017, "step": 42032 }, { "epoch": 0.79, "learning_rate": 5.409662744603339e-07, "loss": 0.93, "step": 42033 }, { "epoch": 0.79, "learning_rate": 5.408713727345391e-07, "loss": 0.9878, "step": 42034 }, { "epoch": 0.79, "learning_rate": 5.407764783240691e-07, "loss": 0.7603, "step": 42035 }, { "epoch": 0.79, "learning_rate": 5.406815912292804e-07, "loss": 0.7267, "step": 42036 }, { "epoch": 0.79, "learning_rate": 5.40586711450527e-07, "loss": 0.9335, "step": 42037 }, { "epoch": 0.79, "learning_rate": 5.404918389881616e-07, "loss": 0.9277, "step": 42038 }, { "epoch": 0.79, "learning_rate": 5.40396973842541e-07, "loss": 0.8775, "step": 42039 }, { "epoch": 0.79, "learning_rate": 5.403021160140173e-07, "loss": 1.0264, "step": 42040 }, { "epoch": 0.79, "learning_rate": 5.402072655029453e-07, "loss": 0.8432, "step": 42041 }, { "epoch": 0.79, "learning_rate": 5.401124223096796e-07, "loss": 0.8841, "step": 42042 }, { "epoch": 0.79, "learning_rate": 5.400175864345736e-07, "loss": 1.0452, "step": 42043 }, { "epoch": 0.79, "learning_rate": 5.39922757877982e-07, "loss": 0.8568, "step": 42044 }, { "epoch": 0.79, "learning_rate": 5.39827936640259e-07, "loss": 0.8531, "step": 42045 }, { "epoch": 0.79, "learning_rate": 5.397331227217587e-07, "loss": 0.7995, "step": 42046 }, { "epoch": 0.79, "learning_rate": 5.396383161228336e-07, "loss": 0.8513, "step": 42047 }, { "epoch": 0.79, "learning_rate": 5.395435168438403e-07, "loss": 0.8702, "step": 42048 }, { "epoch": 0.79, "learning_rate": 5.394487248851307e-07, "loss": 0.9518, "step": 42049 }, { "epoch": 0.79, "learning_rate": 5.393539402470594e-07, "loss": 1.1898, "step": 42050 }, { "epoch": 0.79, "learning_rate": 5.392591629299804e-07, "loss": 0.9784, "step": 42051 }, { "epoch": 0.79, "learning_rate": 5.391643929342474e-07, "loss": 0.7387, "step": 42052 }, { "epoch": 0.79, "learning_rate": 5.390696302602147e-07, "loss": 0.9697, "step": 42053 }, { "epoch": 0.79, "learning_rate": 5.389748749082357e-07, "loss": 0.6437, "step": 42054 }, { "epoch": 0.79, "learning_rate": 5.388801268786653e-07, "loss": 1.0767, "step": 42055 }, { "epoch": 0.79, "learning_rate": 5.387853861718548e-07, "loss": 1.1486, "step": 42056 }, { "epoch": 0.79, "learning_rate": 5.386906527881606e-07, "loss": 1.0028, "step": 42057 }, { "epoch": 0.79, "learning_rate": 5.385959267279356e-07, "loss": 0.9077, "step": 42058 }, { "epoch": 0.79, "learning_rate": 5.385012079915319e-07, "loss": 0.9745, "step": 42059 }, { "epoch": 0.79, "learning_rate": 5.384064965793062e-07, "loss": 0.7252, "step": 42060 }, { "epoch": 0.79, "learning_rate": 5.383117924916096e-07, "loss": 0.7891, "step": 42061 }, { "epoch": 0.79, "learning_rate": 5.382170957287966e-07, "loss": 0.9521, "step": 42062 }, { "epoch": 0.79, "learning_rate": 5.38122406291221e-07, "loss": 1.1547, "step": 42063 }, { "epoch": 0.79, "learning_rate": 5.380277241792362e-07, "loss": 0.6458, "step": 42064 }, { "epoch": 0.79, "learning_rate": 5.379330493931955e-07, "loss": 0.895, "step": 42065 }, { "epoch": 0.79, "learning_rate": 5.378383819334529e-07, "loss": 0.7031, "step": 42066 }, { "epoch": 0.79, "learning_rate": 5.37743721800362e-07, "loss": 0.9077, "step": 42067 }, { "epoch": 0.79, "learning_rate": 5.376490689942749e-07, "loss": 0.8786, "step": 42068 }, { "epoch": 0.79, "learning_rate": 5.375544235155469e-07, "loss": 1.12, "step": 42069 }, { "epoch": 0.79, "learning_rate": 5.374597853645302e-07, "loss": 0.9487, "step": 42070 }, { "epoch": 0.79, "learning_rate": 5.373651545415784e-07, "loss": 0.9414, "step": 42071 }, { "epoch": 0.79, "learning_rate": 5.372705310470449e-07, "loss": 0.8996, "step": 42072 }, { "epoch": 0.79, "learning_rate": 5.37175914881283e-07, "loss": 0.716, "step": 42073 }, { "epoch": 0.79, "learning_rate": 5.370813060446461e-07, "loss": 1.0195, "step": 42074 }, { "epoch": 0.79, "learning_rate": 5.369867045374875e-07, "loss": 0.9646, "step": 42075 }, { "epoch": 0.79, "learning_rate": 5.36892110360161e-07, "loss": 0.8403, "step": 42076 }, { "epoch": 0.79, "learning_rate": 5.367975235130177e-07, "loss": 0.7409, "step": 42077 }, { "epoch": 0.79, "learning_rate": 5.36702943996413e-07, "loss": 0.913, "step": 42078 }, { "epoch": 0.79, "learning_rate": 5.366083718107002e-07, "loss": 0.6754, "step": 42079 }, { "epoch": 0.79, "learning_rate": 5.365138069562298e-07, "loss": 0.9806, "step": 42080 }, { "epoch": 0.79, "learning_rate": 5.364192494333581e-07, "loss": 1.1244, "step": 42081 }, { "epoch": 0.79, "learning_rate": 5.363246992424362e-07, "loss": 0.8561, "step": 42082 }, { "epoch": 0.79, "learning_rate": 5.362301563838177e-07, "loss": 0.9747, "step": 42083 }, { "epoch": 0.79, "learning_rate": 5.361356208578553e-07, "loss": 0.9202, "step": 42084 }, { "epoch": 0.79, "learning_rate": 5.360410926649027e-07, "loss": 0.6485, "step": 42085 }, { "epoch": 0.79, "learning_rate": 5.35946571805312e-07, "loss": 0.9444, "step": 42086 }, { "epoch": 0.79, "learning_rate": 5.358520582794369e-07, "loss": 1.1255, "step": 42087 }, { "epoch": 0.79, "learning_rate": 5.357575520876304e-07, "loss": 0.9761, "step": 42088 }, { "epoch": 0.79, "learning_rate": 5.356630532302437e-07, "loss": 0.7912, "step": 42089 }, { "epoch": 0.79, "learning_rate": 5.355685617076326e-07, "loss": 0.8234, "step": 42090 }, { "epoch": 0.79, "learning_rate": 5.354740775201472e-07, "loss": 0.8542, "step": 42091 }, { "epoch": 0.79, "learning_rate": 5.353796006681417e-07, "loss": 0.7954, "step": 42092 }, { "epoch": 0.79, "learning_rate": 5.352851311519682e-07, "loss": 0.8754, "step": 42093 }, { "epoch": 0.79, "learning_rate": 5.351906689719799e-07, "loss": 1.201, "step": 42094 }, { "epoch": 0.79, "learning_rate": 5.350962141285293e-07, "loss": 0.9056, "step": 42095 }, { "epoch": 0.79, "learning_rate": 5.350017666219695e-07, "loss": 0.6931, "step": 42096 }, { "epoch": 0.79, "learning_rate": 5.349073264526533e-07, "loss": 0.6966, "step": 42097 }, { "epoch": 0.79, "learning_rate": 5.348128936209315e-07, "loss": 0.7316, "step": 42098 }, { "epoch": 0.79, "learning_rate": 5.347184681271589e-07, "loss": 0.9525, "step": 42099 }, { "epoch": 0.79, "learning_rate": 5.346240499716879e-07, "loss": 1.0812, "step": 42100 }, { "epoch": 0.79, "learning_rate": 5.34529639154869e-07, "loss": 0.9856, "step": 42101 }, { "epoch": 0.79, "learning_rate": 5.344352356770577e-07, "loss": 0.7164, "step": 42102 }, { "epoch": 0.79, "learning_rate": 5.343408395386044e-07, "loss": 0.9132, "step": 42103 }, { "epoch": 0.79, "learning_rate": 5.342464507398617e-07, "loss": 0.8324, "step": 42104 }, { "epoch": 0.79, "learning_rate": 5.341520692811827e-07, "loss": 0.8936, "step": 42105 }, { "epoch": 0.79, "learning_rate": 5.340576951629198e-07, "loss": 1.1269, "step": 42106 }, { "epoch": 0.79, "learning_rate": 5.339633283854248e-07, "loss": 0.7794, "step": 42107 }, { "epoch": 0.79, "learning_rate": 5.338689689490508e-07, "loss": 0.9164, "step": 42108 }, { "epoch": 0.79, "learning_rate": 5.337746168541503e-07, "loss": 0.8119, "step": 42109 }, { "epoch": 0.79, "learning_rate": 5.336802721010737e-07, "loss": 0.8228, "step": 42110 }, { "epoch": 0.79, "learning_rate": 5.335859346901762e-07, "loss": 0.7437, "step": 42111 }, { "epoch": 0.79, "learning_rate": 5.334916046218077e-07, "loss": 1.0713, "step": 42112 }, { "epoch": 0.79, "learning_rate": 5.333972818963212e-07, "loss": 0.8212, "step": 42113 }, { "epoch": 0.79, "learning_rate": 5.333029665140693e-07, "loss": 0.9448, "step": 42114 }, { "epoch": 0.79, "learning_rate": 5.332086584754034e-07, "loss": 0.9265, "step": 42115 }, { "epoch": 0.79, "learning_rate": 5.331143577806763e-07, "loss": 0.7067, "step": 42116 }, { "epoch": 0.79, "learning_rate": 5.3302006443024e-07, "loss": 0.8655, "step": 42117 }, { "epoch": 0.79, "learning_rate": 5.329257784244469e-07, "loss": 1.0336, "step": 42118 }, { "epoch": 0.79, "learning_rate": 5.328314997636471e-07, "loss": 1.0466, "step": 42119 }, { "epoch": 0.79, "learning_rate": 5.327372284481952e-07, "loss": 0.938, "step": 42120 }, { "epoch": 0.79, "learning_rate": 5.326429644784428e-07, "loss": 0.8737, "step": 42121 }, { "epoch": 0.79, "learning_rate": 5.325487078547397e-07, "loss": 0.8405, "step": 42122 }, { "epoch": 0.79, "learning_rate": 5.32454458577441e-07, "loss": 0.7834, "step": 42123 }, { "epoch": 0.79, "learning_rate": 5.323602166468964e-07, "loss": 0.9832, "step": 42124 }, { "epoch": 0.79, "learning_rate": 5.322659820634582e-07, "loss": 0.9131, "step": 42125 }, { "epoch": 0.79, "learning_rate": 5.321717548274785e-07, "loss": 0.9236, "step": 42126 }, { "epoch": 0.79, "learning_rate": 5.320775349393092e-07, "loss": 0.7414, "step": 42127 }, { "epoch": 0.79, "learning_rate": 5.31983322399302e-07, "loss": 0.665, "step": 42128 }, { "epoch": 0.79, "learning_rate": 5.318891172078089e-07, "loss": 0.6909, "step": 42129 }, { "epoch": 0.79, "learning_rate": 5.31794919365182e-07, "loss": 0.8574, "step": 42130 }, { "epoch": 0.79, "learning_rate": 5.31700728871771e-07, "loss": 1.2287, "step": 42131 }, { "epoch": 0.79, "learning_rate": 5.316065457279307e-07, "loss": 0.9952, "step": 42132 }, { "epoch": 0.79, "learning_rate": 5.315123699340105e-07, "loss": 0.8045, "step": 42133 }, { "epoch": 0.79, "learning_rate": 5.314182014903629e-07, "loss": 0.8224, "step": 42134 }, { "epoch": 0.79, "learning_rate": 5.313240403973394e-07, "loss": 0.9838, "step": 42135 }, { "epoch": 0.79, "learning_rate": 5.312298866552911e-07, "loss": 0.7977, "step": 42136 }, { "epoch": 0.79, "learning_rate": 5.311357402645712e-07, "loss": 1.1173, "step": 42137 }, { "epoch": 0.8, "learning_rate": 5.310416012255288e-07, "loss": 0.9729, "step": 42138 }, { "epoch": 0.8, "learning_rate": 5.309474695385175e-07, "loss": 0.9434, "step": 42139 }, { "epoch": 0.8, "learning_rate": 5.308533452038877e-07, "loss": 0.7079, "step": 42140 }, { "epoch": 0.8, "learning_rate": 5.307592282219904e-07, "loss": 0.9418, "step": 42141 }, { "epoch": 0.8, "learning_rate": 5.306651185931791e-07, "loss": 0.8039, "step": 42142 }, { "epoch": 0.8, "learning_rate": 5.305710163178032e-07, "loss": 1.0197, "step": 42143 }, { "epoch": 0.8, "learning_rate": 5.304769213962147e-07, "loss": 1.1076, "step": 42144 }, { "epoch": 0.8, "learning_rate": 5.30382833828765e-07, "loss": 0.7631, "step": 42145 }, { "epoch": 0.8, "learning_rate": 5.302887536158055e-07, "loss": 0.8721, "step": 42146 }, { "epoch": 0.8, "learning_rate": 5.301946807576872e-07, "loss": 0.9796, "step": 42147 }, { "epoch": 0.8, "learning_rate": 5.301006152547616e-07, "loss": 0.8123, "step": 42148 }, { "epoch": 0.8, "learning_rate": 5.300065571073807e-07, "loss": 1.0515, "step": 42149 }, { "epoch": 0.8, "learning_rate": 5.299125063158936e-07, "loss": 1.1082, "step": 42150 }, { "epoch": 0.8, "learning_rate": 5.298184628806541e-07, "loss": 0.8018, "step": 42151 }, { "epoch": 0.8, "learning_rate": 5.297244268020113e-07, "loss": 0.9388, "step": 42152 }, { "epoch": 0.8, "learning_rate": 5.296303980803172e-07, "loss": 1.0225, "step": 42153 }, { "epoch": 0.8, "learning_rate": 5.295363767159225e-07, "loss": 0.7371, "step": 42154 }, { "epoch": 0.8, "learning_rate": 5.294423627091789e-07, "loss": 0.9068, "step": 42155 }, { "epoch": 0.8, "learning_rate": 5.293483560604371e-07, "loss": 1.1783, "step": 42156 }, { "epoch": 0.8, "learning_rate": 5.292543567700478e-07, "loss": 0.9731, "step": 42157 }, { "epoch": 0.8, "learning_rate": 5.291603648383634e-07, "loss": 0.9272, "step": 42158 }, { "epoch": 0.8, "learning_rate": 5.29066380265732e-07, "loss": 0.872, "step": 42159 }, { "epoch": 0.8, "learning_rate": 5.289724030525079e-07, "loss": 0.8309, "step": 42160 }, { "epoch": 0.8, "learning_rate": 5.288784331990395e-07, "loss": 0.9852, "step": 42161 }, { "epoch": 0.8, "learning_rate": 5.287844707056783e-07, "loss": 1.1745, "step": 42162 }, { "epoch": 0.8, "learning_rate": 5.286905155727764e-07, "loss": 0.6817, "step": 42163 }, { "epoch": 0.8, "learning_rate": 5.285965678006832e-07, "loss": 0.8297, "step": 42164 }, { "epoch": 0.8, "learning_rate": 5.2850262738975e-07, "loss": 0.8951, "step": 42165 }, { "epoch": 0.8, "learning_rate": 5.284086943403278e-07, "loss": 1.1871, "step": 42166 }, { "epoch": 0.8, "learning_rate": 5.283147686527665e-07, "loss": 0.8727, "step": 42167 }, { "epoch": 0.8, "learning_rate": 5.282208503274177e-07, "loss": 0.9568, "step": 42168 }, { "epoch": 0.8, "learning_rate": 5.281269393646319e-07, "loss": 0.915, "step": 42169 }, { "epoch": 0.8, "learning_rate": 5.2803303576476e-07, "loss": 1.1178, "step": 42170 }, { "epoch": 0.8, "learning_rate": 5.279391395281514e-07, "loss": 0.8721, "step": 42171 }, { "epoch": 0.8, "learning_rate": 5.278452506551585e-07, "loss": 0.7631, "step": 42172 }, { "epoch": 0.8, "learning_rate": 5.277513691461306e-07, "loss": 0.7932, "step": 42173 }, { "epoch": 0.8, "learning_rate": 5.276574950014185e-07, "loss": 0.9366, "step": 42174 }, { "epoch": 0.8, "learning_rate": 5.275636282213728e-07, "loss": 0.9305, "step": 42175 }, { "epoch": 0.8, "learning_rate": 5.274697688063441e-07, "loss": 0.9539, "step": 42176 }, { "epoch": 0.8, "learning_rate": 5.273759167566828e-07, "loss": 0.8282, "step": 42177 }, { "epoch": 0.8, "learning_rate": 5.272820720727393e-07, "loss": 0.7645, "step": 42178 }, { "epoch": 0.8, "learning_rate": 5.271882347548645e-07, "loss": 0.7422, "step": 42179 }, { "epoch": 0.8, "learning_rate": 5.270944048034074e-07, "loss": 0.8774, "step": 42180 }, { "epoch": 0.8, "learning_rate": 5.270005822187205e-07, "loss": 0.9666, "step": 42181 }, { "epoch": 0.8, "learning_rate": 5.269067670011521e-07, "loss": 0.8184, "step": 42182 }, { "epoch": 0.8, "learning_rate": 5.26812959151053e-07, "loss": 0.9463, "step": 42183 }, { "epoch": 0.8, "learning_rate": 5.267191586687748e-07, "loss": 0.9092, "step": 42184 }, { "epoch": 0.8, "learning_rate": 5.266253655546664e-07, "loss": 0.7917, "step": 42185 }, { "epoch": 0.8, "learning_rate": 5.265315798090781e-07, "loss": 0.9752, "step": 42186 }, { "epoch": 0.8, "learning_rate": 5.264378014323606e-07, "loss": 1.0532, "step": 42187 }, { "epoch": 0.8, "learning_rate": 5.263440304248638e-07, "loss": 1.0176, "step": 42188 }, { "epoch": 0.8, "learning_rate": 5.262502667869376e-07, "loss": 1.0457, "step": 42189 }, { "epoch": 0.8, "learning_rate": 5.261565105189329e-07, "loss": 1.0409, "step": 42190 }, { "epoch": 0.8, "learning_rate": 5.260627616211994e-07, "loss": 0.778, "step": 42191 }, { "epoch": 0.8, "learning_rate": 5.259690200940862e-07, "loss": 0.8506, "step": 42192 }, { "epoch": 0.8, "learning_rate": 5.258752859379451e-07, "loss": 1.156, "step": 42193 }, { "epoch": 0.8, "learning_rate": 5.257815591531245e-07, "loss": 0.9563, "step": 42194 }, { "epoch": 0.8, "learning_rate": 5.256878397399753e-07, "loss": 0.832, "step": 42195 }, { "epoch": 0.8, "learning_rate": 5.255941276988468e-07, "loss": 0.9551, "step": 42196 }, { "epoch": 0.8, "learning_rate": 5.255004230300897e-07, "loss": 0.7127, "step": 42197 }, { "epoch": 0.8, "learning_rate": 5.254067257340534e-07, "loss": 0.8487, "step": 42198 }, { "epoch": 0.8, "learning_rate": 5.253130358110876e-07, "loss": 0.8311, "step": 42199 }, { "epoch": 0.8, "learning_rate": 5.252193532615432e-07, "loss": 1.0796, "step": 42200 }, { "epoch": 0.8, "learning_rate": 5.251256780857677e-07, "loss": 0.8697, "step": 42201 }, { "epoch": 0.8, "learning_rate": 5.250320102841139e-07, "loss": 0.821, "step": 42202 }, { "epoch": 0.8, "learning_rate": 5.249383498569294e-07, "loss": 0.8629, "step": 42203 }, { "epoch": 0.8, "learning_rate": 5.248446968045636e-07, "loss": 0.6111, "step": 42204 }, { "epoch": 0.8, "learning_rate": 5.247510511273687e-07, "loss": 0.8788, "step": 42205 }, { "epoch": 0.8, "learning_rate": 5.246574128256921e-07, "loss": 1.0902, "step": 42206 }, { "epoch": 0.8, "learning_rate": 5.245637818998841e-07, "loss": 0.9386, "step": 42207 }, { "epoch": 0.8, "learning_rate": 5.244701583502945e-07, "loss": 0.8759, "step": 42208 }, { "epoch": 0.8, "learning_rate": 5.243765421772726e-07, "loss": 0.9483, "step": 42209 }, { "epoch": 0.8, "learning_rate": 5.242829333811684e-07, "loss": 0.9096, "step": 42210 }, { "epoch": 0.8, "learning_rate": 5.241893319623306e-07, "loss": 0.7467, "step": 42211 }, { "epoch": 0.8, "learning_rate": 5.240957379211103e-07, "loss": 0.8162, "step": 42212 }, { "epoch": 0.8, "learning_rate": 5.240021512578547e-07, "loss": 0.7273, "step": 42213 }, { "epoch": 0.8, "learning_rate": 5.239085719729156e-07, "loss": 0.9459, "step": 42214 }, { "epoch": 0.8, "learning_rate": 5.238150000666406e-07, "loss": 0.8724, "step": 42215 }, { "epoch": 0.8, "learning_rate": 5.237214355393799e-07, "loss": 0.9832, "step": 42216 }, { "epoch": 0.8, "learning_rate": 5.236278783914828e-07, "loss": 0.8548, "step": 42217 }, { "epoch": 0.8, "learning_rate": 5.235343286232986e-07, "loss": 1.0464, "step": 42218 }, { "epoch": 0.8, "learning_rate": 5.234407862351768e-07, "loss": 0.981, "step": 42219 }, { "epoch": 0.8, "learning_rate": 5.233472512274662e-07, "loss": 0.9666, "step": 42220 }, { "epoch": 0.8, "learning_rate": 5.232537236005169e-07, "loss": 1.0315, "step": 42221 }, { "epoch": 0.8, "learning_rate": 5.231602033546768e-07, "loss": 0.8884, "step": 42222 }, { "epoch": 0.8, "learning_rate": 5.230666904902968e-07, "loss": 1.0154, "step": 42223 }, { "epoch": 0.8, "learning_rate": 5.229731850077247e-07, "loss": 1.0011, "step": 42224 }, { "epoch": 0.8, "learning_rate": 5.228796869073091e-07, "loss": 1.006, "step": 42225 }, { "epoch": 0.8, "learning_rate": 5.227861961894018e-07, "loss": 1.0114, "step": 42226 }, { "epoch": 0.8, "learning_rate": 5.226927128543493e-07, "loss": 0.911, "step": 42227 }, { "epoch": 0.8, "learning_rate": 5.225992369025018e-07, "loss": 0.9645, "step": 42228 }, { "epoch": 0.8, "learning_rate": 5.22505768334208e-07, "loss": 0.7337, "step": 42229 }, { "epoch": 0.8, "learning_rate": 5.224123071498172e-07, "loss": 0.7413, "step": 42230 }, { "epoch": 0.8, "learning_rate": 5.223188533496781e-07, "loss": 1.1816, "step": 42231 }, { "epoch": 0.8, "learning_rate": 5.222254069341398e-07, "loss": 0.6902, "step": 42232 }, { "epoch": 0.8, "learning_rate": 5.221319679035519e-07, "loss": 0.8317, "step": 42233 }, { "epoch": 0.8, "learning_rate": 5.220385362582612e-07, "loss": 0.7793, "step": 42234 }, { "epoch": 0.8, "learning_rate": 5.219451119986191e-07, "loss": 0.89, "step": 42235 }, { "epoch": 0.8, "learning_rate": 5.218516951249728e-07, "loss": 0.8787, "step": 42236 }, { "epoch": 0.8, "learning_rate": 5.217582856376716e-07, "loss": 0.8952, "step": 42237 }, { "epoch": 0.8, "learning_rate": 5.216648835370644e-07, "loss": 0.9787, "step": 42238 }, { "epoch": 0.8, "learning_rate": 5.215714888234999e-07, "loss": 0.9957, "step": 42239 }, { "epoch": 0.8, "learning_rate": 5.214781014973267e-07, "loss": 0.8212, "step": 42240 }, { "epoch": 0.8, "learning_rate": 5.213847215588936e-07, "loss": 0.7566, "step": 42241 }, { "epoch": 0.8, "learning_rate": 5.2129134900855e-07, "loss": 1.0115, "step": 42242 }, { "epoch": 0.8, "learning_rate": 5.211979838466424e-07, "loss": 1.0496, "step": 42243 }, { "epoch": 0.8, "learning_rate": 5.211046260735223e-07, "loss": 1.1731, "step": 42244 }, { "epoch": 0.8, "learning_rate": 5.210112756895361e-07, "loss": 0.8694, "step": 42245 }, { "epoch": 0.8, "learning_rate": 5.209179326950326e-07, "loss": 0.7712, "step": 42246 }, { "epoch": 0.8, "learning_rate": 5.208245970903619e-07, "loss": 0.7819, "step": 42247 }, { "epoch": 0.8, "learning_rate": 5.207312688758709e-07, "loss": 0.7182, "step": 42248 }, { "epoch": 0.8, "learning_rate": 5.206379480519089e-07, "loss": 0.8272, "step": 42249 }, { "epoch": 0.8, "learning_rate": 5.205446346188239e-07, "loss": 1.2014, "step": 42250 }, { "epoch": 0.8, "learning_rate": 5.204513285769647e-07, "loss": 0.7637, "step": 42251 }, { "epoch": 0.8, "learning_rate": 5.203580299266795e-07, "loss": 0.8923, "step": 42252 }, { "epoch": 0.8, "learning_rate": 5.202647386683165e-07, "loss": 0.7049, "step": 42253 }, { "epoch": 0.8, "learning_rate": 5.201714548022252e-07, "loss": 0.6192, "step": 42254 }, { "epoch": 0.8, "learning_rate": 5.200781783287514e-07, "loss": 0.8821, "step": 42255 }, { "epoch": 0.8, "learning_rate": 5.199849092482465e-07, "loss": 1.121, "step": 42256 }, { "epoch": 0.8, "learning_rate": 5.198916475610566e-07, "loss": 0.8976, "step": 42257 }, { "epoch": 0.8, "learning_rate": 5.197983932675305e-07, "loss": 0.8494, "step": 42258 }, { "epoch": 0.8, "learning_rate": 5.197051463680163e-07, "loss": 0.7828, "step": 42259 }, { "epoch": 0.8, "learning_rate": 5.196119068628627e-07, "loss": 0.7796, "step": 42260 }, { "epoch": 0.8, "learning_rate": 5.195186747524173e-07, "loss": 0.7404, "step": 42261 }, { "epoch": 0.8, "learning_rate": 5.194254500370285e-07, "loss": 1.0647, "step": 42262 }, { "epoch": 0.8, "learning_rate": 5.193322327170452e-07, "loss": 0.8711, "step": 42263 }, { "epoch": 0.8, "learning_rate": 5.192390227928129e-07, "loss": 1.0499, "step": 42264 }, { "epoch": 0.8, "learning_rate": 5.191458202646832e-07, "loss": 0.9301, "step": 42265 }, { "epoch": 0.8, "learning_rate": 5.190526251330011e-07, "loss": 0.8413, "step": 42266 }, { "epoch": 0.8, "learning_rate": 5.189594373981155e-07, "loss": 0.8643, "step": 42267 }, { "epoch": 0.8, "learning_rate": 5.188662570603756e-07, "loss": 0.9631, "step": 42268 }, { "epoch": 0.8, "learning_rate": 5.18773084120128e-07, "loss": 1.0984, "step": 42269 }, { "epoch": 0.8, "learning_rate": 5.186799185777208e-07, "loss": 0.7612, "step": 42270 }, { "epoch": 0.8, "learning_rate": 5.185867604335018e-07, "loss": 0.8796, "step": 42271 }, { "epoch": 0.8, "learning_rate": 5.184936096878195e-07, "loss": 0.7418, "step": 42272 }, { "epoch": 0.8, "learning_rate": 5.184004663410211e-07, "loss": 0.9738, "step": 42273 }, { "epoch": 0.8, "learning_rate": 5.183073303934546e-07, "loss": 1.0051, "step": 42274 }, { "epoch": 0.8, "learning_rate": 5.182142018454686e-07, "loss": 1.1794, "step": 42275 }, { "epoch": 0.8, "learning_rate": 5.181210806974085e-07, "loss": 0.7868, "step": 42276 }, { "epoch": 0.8, "learning_rate": 5.180279669496249e-07, "loss": 1.0068, "step": 42277 }, { "epoch": 0.8, "learning_rate": 5.179348606024634e-07, "loss": 0.7387, "step": 42278 }, { "epoch": 0.8, "learning_rate": 5.178417616562723e-07, "loss": 0.9009, "step": 42279 }, { "epoch": 0.8, "learning_rate": 5.177486701113995e-07, "loss": 1.0605, "step": 42280 }, { "epoch": 0.8, "learning_rate": 5.176555859681923e-07, "loss": 1.1119, "step": 42281 }, { "epoch": 0.8, "learning_rate": 5.175625092269981e-07, "loss": 0.855, "step": 42282 }, { "epoch": 0.8, "learning_rate": 5.17469439888165e-07, "loss": 0.7858, "step": 42283 }, { "epoch": 0.8, "learning_rate": 5.173763779520411e-07, "loss": 0.9489, "step": 42284 }, { "epoch": 0.8, "learning_rate": 5.172833234189712e-07, "loss": 0.807, "step": 42285 }, { "epoch": 0.8, "learning_rate": 5.171902762893061e-07, "loss": 1.0391, "step": 42286 }, { "epoch": 0.8, "learning_rate": 5.170972365633911e-07, "loss": 0.9465, "step": 42287 }, { "epoch": 0.8, "learning_rate": 5.170042042415735e-07, "loss": 0.9881, "step": 42288 }, { "epoch": 0.8, "learning_rate": 5.169111793242029e-07, "loss": 1.1146, "step": 42289 }, { "epoch": 0.8, "learning_rate": 5.168181618116241e-07, "loss": 0.7995, "step": 42290 }, { "epoch": 0.8, "learning_rate": 5.167251517041857e-07, "loss": 0.8055, "step": 42291 }, { "epoch": 0.8, "learning_rate": 5.16632149002235e-07, "loss": 0.7244, "step": 42292 }, { "epoch": 0.8, "learning_rate": 5.165391537061187e-07, "loss": 0.8806, "step": 42293 }, { "epoch": 0.8, "learning_rate": 5.164461658161845e-07, "loss": 0.9741, "step": 42294 }, { "epoch": 0.8, "learning_rate": 5.163531853327797e-07, "loss": 1.0418, "step": 42295 }, { "epoch": 0.8, "learning_rate": 5.162602122562518e-07, "loss": 0.7005, "step": 42296 }, { "epoch": 0.8, "learning_rate": 5.161672465869461e-07, "loss": 0.7366, "step": 42297 }, { "epoch": 0.8, "learning_rate": 5.160742883252123e-07, "loss": 0.7888, "step": 42298 }, { "epoch": 0.8, "learning_rate": 5.159813374713957e-07, "loss": 0.8495, "step": 42299 }, { "epoch": 0.8, "learning_rate": 5.158883940258441e-07, "loss": 0.8472, "step": 42300 }, { "epoch": 0.8, "learning_rate": 5.157954579889043e-07, "loss": 0.8432, "step": 42301 }, { "epoch": 0.8, "learning_rate": 5.157025293609233e-07, "loss": 1.0121, "step": 42302 }, { "epoch": 0.8, "learning_rate": 5.156096081422485e-07, "loss": 0.793, "step": 42303 }, { "epoch": 0.8, "learning_rate": 5.155166943332262e-07, "loss": 0.8512, "step": 42304 }, { "epoch": 0.8, "learning_rate": 5.154237879342047e-07, "loss": 0.7769, "step": 42305 }, { "epoch": 0.8, "learning_rate": 5.153308889455283e-07, "loss": 1.0793, "step": 42306 }, { "epoch": 0.8, "learning_rate": 5.15237997367547e-07, "loss": 1.0055, "step": 42307 }, { "epoch": 0.8, "learning_rate": 5.151451132006055e-07, "loss": 0.9173, "step": 42308 }, { "epoch": 0.8, "learning_rate": 5.150522364450508e-07, "loss": 0.8442, "step": 42309 }, { "epoch": 0.8, "learning_rate": 5.149593671012313e-07, "loss": 0.9079, "step": 42310 }, { "epoch": 0.8, "learning_rate": 5.14866505169492e-07, "loss": 0.6929, "step": 42311 }, { "epoch": 0.8, "learning_rate": 5.147736506501804e-07, "loss": 1.0529, "step": 42312 }, { "epoch": 0.8, "learning_rate": 5.146808035436432e-07, "loss": 1.0856, "step": 42313 }, { "epoch": 0.8, "learning_rate": 5.145879638502269e-07, "loss": 0.8492, "step": 42314 }, { "epoch": 0.8, "learning_rate": 5.144951315702781e-07, "loss": 0.8693, "step": 42315 }, { "epoch": 0.8, "learning_rate": 5.144023067041437e-07, "loss": 0.7471, "step": 42316 }, { "epoch": 0.8, "learning_rate": 5.14309489252171e-07, "loss": 0.7641, "step": 42317 }, { "epoch": 0.8, "learning_rate": 5.142166792147044e-07, "loss": 0.8633, "step": 42318 }, { "epoch": 0.8, "learning_rate": 5.141238765920931e-07, "loss": 1.1765, "step": 42319 }, { "epoch": 0.8, "learning_rate": 5.140310813846819e-07, "loss": 0.9471, "step": 42320 }, { "epoch": 0.8, "learning_rate": 5.139382935928175e-07, "loss": 0.8595, "step": 42321 }, { "epoch": 0.8, "learning_rate": 5.138455132168466e-07, "loss": 0.8815, "step": 42322 }, { "epoch": 0.8, "learning_rate": 5.137527402571157e-07, "loss": 1.0349, "step": 42323 }, { "epoch": 0.8, "learning_rate": 5.136599747139714e-07, "loss": 1.0517, "step": 42324 }, { "epoch": 0.8, "learning_rate": 5.135672165877598e-07, "loss": 0.8257, "step": 42325 }, { "epoch": 0.8, "learning_rate": 5.134744658788277e-07, "loss": 0.8528, "step": 42326 }, { "epoch": 0.8, "learning_rate": 5.133817225875198e-07, "loss": 0.5891, "step": 42327 }, { "epoch": 0.8, "learning_rate": 5.132889867141852e-07, "loss": 0.8357, "step": 42328 }, { "epoch": 0.8, "learning_rate": 5.131962582591676e-07, "loss": 0.6754, "step": 42329 }, { "epoch": 0.8, "learning_rate": 5.131035372228138e-07, "loss": 1.1547, "step": 42330 }, { "epoch": 0.8, "learning_rate": 5.130108236054717e-07, "loss": 0.8832, "step": 42331 }, { "epoch": 0.8, "learning_rate": 5.129181174074857e-07, "loss": 1.0204, "step": 42332 }, { "epoch": 0.8, "learning_rate": 5.128254186292025e-07, "loss": 0.8315, "step": 42333 }, { "epoch": 0.8, "learning_rate": 5.127327272709684e-07, "loss": 0.8163, "step": 42334 }, { "epoch": 0.8, "learning_rate": 5.126400433331291e-07, "loss": 0.7166, "step": 42335 }, { "epoch": 0.8, "learning_rate": 5.125473668160311e-07, "loss": 0.9318, "step": 42336 }, { "epoch": 0.8, "learning_rate": 5.124546977200201e-07, "loss": 1.1652, "step": 42337 }, { "epoch": 0.8, "learning_rate": 5.123620360454432e-07, "loss": 0.821, "step": 42338 }, { "epoch": 0.8, "learning_rate": 5.122693817926442e-07, "loss": 0.9288, "step": 42339 }, { "epoch": 0.8, "learning_rate": 5.121767349619716e-07, "loss": 0.8144, "step": 42340 }, { "epoch": 0.8, "learning_rate": 5.120840955537695e-07, "loss": 0.8595, "step": 42341 }, { "epoch": 0.8, "learning_rate": 5.119914635683845e-07, "loss": 0.876, "step": 42342 }, { "epoch": 0.8, "learning_rate": 5.118988390061622e-07, "loss": 0.9921, "step": 42343 }, { "epoch": 0.8, "learning_rate": 5.118062218674488e-07, "loss": 1.0846, "step": 42344 }, { "epoch": 0.8, "learning_rate": 5.117136121525901e-07, "loss": 1.0403, "step": 42345 }, { "epoch": 0.8, "learning_rate": 5.116210098619317e-07, "loss": 0.8117, "step": 42346 }, { "epoch": 0.8, "learning_rate": 5.115284149958203e-07, "loss": 0.9518, "step": 42347 }, { "epoch": 0.8, "learning_rate": 5.114358275545994e-07, "loss": 0.8435, "step": 42348 }, { "epoch": 0.8, "learning_rate": 5.113432475386174e-07, "loss": 0.8988, "step": 42349 }, { "epoch": 0.8, "learning_rate": 5.112506749482182e-07, "loss": 1.0862, "step": 42350 }, { "epoch": 0.8, "learning_rate": 5.111581097837473e-07, "loss": 0.8949, "step": 42351 }, { "epoch": 0.8, "learning_rate": 5.110655520455523e-07, "loss": 1.0677, "step": 42352 }, { "epoch": 0.8, "learning_rate": 5.10973001733977e-07, "loss": 1.0195, "step": 42353 }, { "epoch": 0.8, "learning_rate": 5.108804588493674e-07, "loss": 0.8721, "step": 42354 }, { "epoch": 0.8, "learning_rate": 5.107879233920693e-07, "loss": 0.9946, "step": 42355 }, { "epoch": 0.8, "learning_rate": 5.10695395362428e-07, "loss": 1.0975, "step": 42356 }, { "epoch": 0.8, "learning_rate": 5.106028747607891e-07, "loss": 1.0972, "step": 42357 }, { "epoch": 0.8, "learning_rate": 5.105103615874982e-07, "loss": 1.1099, "step": 42358 }, { "epoch": 0.8, "learning_rate": 5.104178558429012e-07, "loss": 0.9816, "step": 42359 }, { "epoch": 0.8, "learning_rate": 5.103253575273417e-07, "loss": 0.8715, "step": 42360 }, { "epoch": 0.8, "learning_rate": 5.102328666411674e-07, "loss": 0.9567, "step": 42361 }, { "epoch": 0.8, "learning_rate": 5.101403831847221e-07, "loss": 1.1755, "step": 42362 }, { "epoch": 0.8, "learning_rate": 5.100479071583517e-07, "loss": 0.9775, "step": 42363 }, { "epoch": 0.8, "learning_rate": 5.099554385624012e-07, "loss": 1.0713, "step": 42364 }, { "epoch": 0.8, "learning_rate": 5.09862977397216e-07, "loss": 0.8316, "step": 42365 }, { "epoch": 0.8, "learning_rate": 5.097705236631414e-07, "loss": 0.7292, "step": 42366 }, { "epoch": 0.8, "learning_rate": 5.096780773605228e-07, "loss": 1.0561, "step": 42367 }, { "epoch": 0.8, "learning_rate": 5.09585638489706e-07, "loss": 1.0261, "step": 42368 }, { "epoch": 0.8, "learning_rate": 5.094932070510339e-07, "loss": 1.0281, "step": 42369 }, { "epoch": 0.8, "learning_rate": 5.094007830448544e-07, "loss": 1.0579, "step": 42370 }, { "epoch": 0.8, "learning_rate": 5.09308366471511e-07, "loss": 0.9205, "step": 42371 }, { "epoch": 0.8, "learning_rate": 5.092159573313488e-07, "loss": 1.0372, "step": 42372 }, { "epoch": 0.8, "learning_rate": 5.091235556247134e-07, "loss": 0.8681, "step": 42373 }, { "epoch": 0.8, "learning_rate": 5.090311613519494e-07, "loss": 1.0426, "step": 42374 }, { "epoch": 0.8, "learning_rate": 5.089387745134028e-07, "loss": 1.0919, "step": 42375 }, { "epoch": 0.8, "learning_rate": 5.088463951094164e-07, "loss": 0.8189, "step": 42376 }, { "epoch": 0.8, "learning_rate": 5.08754023140337e-07, "loss": 0.8752, "step": 42377 }, { "epoch": 0.8, "learning_rate": 5.086616586065099e-07, "loss": 0.9268, "step": 42378 }, { "epoch": 0.8, "learning_rate": 5.085693015082779e-07, "loss": 0.8772, "step": 42379 }, { "epoch": 0.8, "learning_rate": 5.084769518459881e-07, "loss": 0.8725, "step": 42380 }, { "epoch": 0.8, "learning_rate": 5.083846096199838e-07, "loss": 1.0834, "step": 42381 }, { "epoch": 0.8, "learning_rate": 5.082922748306101e-07, "loss": 0.9727, "step": 42382 }, { "epoch": 0.8, "learning_rate": 5.081999474782123e-07, "loss": 0.7778, "step": 42383 }, { "epoch": 0.8, "learning_rate": 5.081076275631347e-07, "loss": 0.8638, "step": 42384 }, { "epoch": 0.8, "learning_rate": 5.080153150857223e-07, "loss": 0.8452, "step": 42385 }, { "epoch": 0.8, "learning_rate": 5.079230100463192e-07, "loss": 0.8046, "step": 42386 }, { "epoch": 0.8, "learning_rate": 5.078307124452716e-07, "loss": 0.9927, "step": 42387 }, { "epoch": 0.8, "learning_rate": 5.077384222829216e-07, "loss": 0.9371, "step": 42388 }, { "epoch": 0.8, "learning_rate": 5.076461395596163e-07, "loss": 0.8248, "step": 42389 }, { "epoch": 0.8, "learning_rate": 5.075538642756989e-07, "loss": 0.895, "step": 42390 }, { "epoch": 0.8, "learning_rate": 5.074615964315141e-07, "loss": 0.8347, "step": 42391 }, { "epoch": 0.8, "learning_rate": 5.073693360274068e-07, "loss": 0.9481, "step": 42392 }, { "epoch": 0.8, "learning_rate": 5.072770830637211e-07, "loss": 1.0388, "step": 42393 }, { "epoch": 0.8, "learning_rate": 5.071848375408017e-07, "loss": 1.0772, "step": 42394 }, { "epoch": 0.8, "learning_rate": 5.070925994589931e-07, "loss": 0.9644, "step": 42395 }, { "epoch": 0.8, "learning_rate": 5.070003688186403e-07, "loss": 0.7733, "step": 42396 }, { "epoch": 0.8, "learning_rate": 5.069081456200856e-07, "loss": 0.6959, "step": 42397 }, { "epoch": 0.8, "learning_rate": 5.068159298636755e-07, "loss": 0.9755, "step": 42398 }, { "epoch": 0.8, "learning_rate": 5.067237215497542e-07, "loss": 0.7857, "step": 42399 }, { "epoch": 0.8, "learning_rate": 5.066315206786643e-07, "loss": 0.9894, "step": 42400 }, { "epoch": 0.8, "learning_rate": 5.065393272507521e-07, "loss": 0.8549, "step": 42401 }, { "epoch": 0.8, "learning_rate": 5.064471412663608e-07, "loss": 0.7795, "step": 42402 }, { "epoch": 0.8, "learning_rate": 5.063549627258343e-07, "loss": 0.8283, "step": 42403 }, { "epoch": 0.8, "learning_rate": 5.062627916295174e-07, "loss": 0.8889, "step": 42404 }, { "epoch": 0.8, "learning_rate": 5.061706279777543e-07, "loss": 0.9684, "step": 42405 }, { "epoch": 0.8, "learning_rate": 5.060784717708886e-07, "loss": 1.1289, "step": 42406 }, { "epoch": 0.8, "learning_rate": 5.059863230092649e-07, "loss": 1.0493, "step": 42407 }, { "epoch": 0.8, "learning_rate": 5.058941816932278e-07, "loss": 0.8274, "step": 42408 }, { "epoch": 0.8, "learning_rate": 5.058020478231193e-07, "loss": 0.9119, "step": 42409 }, { "epoch": 0.8, "learning_rate": 5.057099213992861e-07, "loss": 0.7634, "step": 42410 }, { "epoch": 0.8, "learning_rate": 5.056178024220703e-07, "loss": 0.8011, "step": 42411 }, { "epoch": 0.8, "learning_rate": 5.055256908918166e-07, "loss": 1.0217, "step": 42412 }, { "epoch": 0.8, "learning_rate": 5.054335868088689e-07, "loss": 1.1038, "step": 42413 }, { "epoch": 0.8, "learning_rate": 5.053414901735706e-07, "loss": 0.908, "step": 42414 }, { "epoch": 0.8, "learning_rate": 5.052494009862665e-07, "loss": 0.9985, "step": 42415 }, { "epoch": 0.8, "learning_rate": 5.051573192472998e-07, "loss": 0.727, "step": 42416 }, { "epoch": 0.8, "learning_rate": 5.050652449570151e-07, "loss": 0.755, "step": 42417 }, { "epoch": 0.8, "learning_rate": 5.049731781157544e-07, "loss": 1.0581, "step": 42418 }, { "epoch": 0.8, "learning_rate": 5.048811187238631e-07, "loss": 0.9615, "step": 42419 }, { "epoch": 0.8, "learning_rate": 5.047890667816855e-07, "loss": 0.8167, "step": 42420 }, { "epoch": 0.8, "learning_rate": 5.046970222895628e-07, "loss": 0.9593, "step": 42421 }, { "epoch": 0.8, "learning_rate": 5.046049852478416e-07, "loss": 0.7139, "step": 42422 }, { "epoch": 0.8, "learning_rate": 5.045129556568637e-07, "loss": 0.6804, "step": 42423 }, { "epoch": 0.8, "learning_rate": 5.044209335169731e-07, "loss": 1.2261, "step": 42424 }, { "epoch": 0.8, "learning_rate": 5.043289188285136e-07, "loss": 1.1235, "step": 42425 }, { "epoch": 0.8, "learning_rate": 5.042369115918286e-07, "loss": 1.0135, "step": 42426 }, { "epoch": 0.8, "learning_rate": 5.041449118072619e-07, "loss": 0.8879, "step": 42427 }, { "epoch": 0.8, "learning_rate": 5.04052919475157e-07, "loss": 0.7113, "step": 42428 }, { "epoch": 0.8, "learning_rate": 5.039609345958576e-07, "loss": 0.7737, "step": 42429 }, { "epoch": 0.8, "learning_rate": 5.038689571697058e-07, "loss": 1.0252, "step": 42430 }, { "epoch": 0.8, "learning_rate": 5.037769871970477e-07, "loss": 1.2255, "step": 42431 }, { "epoch": 0.8, "learning_rate": 5.036850246782241e-07, "loss": 0.9158, "step": 42432 }, { "epoch": 0.8, "learning_rate": 5.035930696135796e-07, "loss": 0.9365, "step": 42433 }, { "epoch": 0.8, "learning_rate": 5.035011220034572e-07, "loss": 0.9411, "step": 42434 }, { "epoch": 0.8, "learning_rate": 5.034091818482003e-07, "loss": 0.7266, "step": 42435 }, { "epoch": 0.8, "learning_rate": 5.033172491481525e-07, "loss": 0.8417, "step": 42436 }, { "epoch": 0.8, "learning_rate": 5.03225323903657e-07, "loss": 0.9523, "step": 42437 }, { "epoch": 0.8, "learning_rate": 5.031334061150575e-07, "loss": 0.9746, "step": 42438 }, { "epoch": 0.8, "learning_rate": 5.030414957826951e-07, "loss": 0.9724, "step": 42439 }, { "epoch": 0.8, "learning_rate": 5.029495929069153e-07, "loss": 0.9151, "step": 42440 }, { "epoch": 0.8, "learning_rate": 5.028576974880611e-07, "loss": 0.7574, "step": 42441 }, { "epoch": 0.8, "learning_rate": 5.02765809526474e-07, "loss": 0.9553, "step": 42442 }, { "epoch": 0.8, "learning_rate": 5.026739290224992e-07, "loss": 1.0383, "step": 42443 }, { "epoch": 0.8, "learning_rate": 5.02582055976478e-07, "loss": 1.1409, "step": 42444 }, { "epoch": 0.8, "learning_rate": 5.024901903887541e-07, "loss": 0.901, "step": 42445 }, { "epoch": 0.8, "learning_rate": 5.023983322596709e-07, "loss": 1.0236, "step": 42446 }, { "epoch": 0.8, "learning_rate": 5.023064815895709e-07, "loss": 0.8564, "step": 42447 }, { "epoch": 0.8, "learning_rate": 5.022146383787974e-07, "loss": 0.8821, "step": 42448 }, { "epoch": 0.8, "learning_rate": 5.021228026276928e-07, "loss": 0.7736, "step": 42449 }, { "epoch": 0.8, "learning_rate": 5.020309743366014e-07, "loss": 1.1906, "step": 42450 }, { "epoch": 0.8, "learning_rate": 5.019391535058638e-07, "loss": 0.9562, "step": 42451 }, { "epoch": 0.8, "learning_rate": 5.018473401358251e-07, "loss": 0.9948, "step": 42452 }, { "epoch": 0.8, "learning_rate": 5.017555342268268e-07, "loss": 0.7002, "step": 42453 }, { "epoch": 0.8, "learning_rate": 5.01663735779212e-07, "loss": 0.8722, "step": 42454 }, { "epoch": 0.8, "learning_rate": 5.015719447933234e-07, "loss": 0.7823, "step": 42455 }, { "epoch": 0.8, "learning_rate": 5.014801612695042e-07, "loss": 0.9491, "step": 42456 }, { "epoch": 0.8, "learning_rate": 5.013883852080964e-07, "loss": 0.9703, "step": 42457 }, { "epoch": 0.8, "learning_rate": 5.012966166094435e-07, "loss": 0.9985, "step": 42458 }, { "epoch": 0.8, "learning_rate": 5.012048554738882e-07, "loss": 0.9012, "step": 42459 }, { "epoch": 0.8, "learning_rate": 5.011131018017715e-07, "loss": 0.8545, "step": 42460 }, { "epoch": 0.8, "learning_rate": 5.010213555934376e-07, "loss": 0.9453, "step": 42461 }, { "epoch": 0.8, "learning_rate": 5.009296168492294e-07, "loss": 1.1166, "step": 42462 }, { "epoch": 0.8, "learning_rate": 5.008378855694876e-07, "loss": 1.0885, "step": 42463 }, { "epoch": 0.8, "learning_rate": 5.007461617545569e-07, "loss": 0.8228, "step": 42464 }, { "epoch": 0.8, "learning_rate": 5.006544454047781e-07, "loss": 0.9697, "step": 42465 }, { "epoch": 0.8, "learning_rate": 5.005627365204946e-07, "loss": 0.883, "step": 42466 }, { "epoch": 0.8, "learning_rate": 5.004710351020484e-07, "loss": 0.913, "step": 42467 }, { "epoch": 0.8, "learning_rate": 5.003793411497817e-07, "loss": 0.907, "step": 42468 }, { "epoch": 0.8, "learning_rate": 5.002876546640375e-07, "loss": 1.0497, "step": 42469 }, { "epoch": 0.8, "learning_rate": 5.00195975645158e-07, "loss": 1.0112, "step": 42470 }, { "epoch": 0.8, "learning_rate": 5.001043040934861e-07, "loss": 0.9686, "step": 42471 }, { "epoch": 0.8, "learning_rate": 5.000126400093619e-07, "loss": 0.7696, "step": 42472 }, { "epoch": 0.8, "learning_rate": 4.999209833931307e-07, "loss": 0.8734, "step": 42473 }, { "epoch": 0.8, "learning_rate": 4.998293342451325e-07, "loss": 0.9619, "step": 42474 }, { "epoch": 0.8, "learning_rate": 4.997376925657099e-07, "loss": 1.1253, "step": 42475 }, { "epoch": 0.8, "learning_rate": 4.996460583552056e-07, "loss": 0.9316, "step": 42476 }, { "epoch": 0.8, "learning_rate": 4.995544316139619e-07, "loss": 0.8759, "step": 42477 }, { "epoch": 0.8, "learning_rate": 4.994628123423204e-07, "loss": 0.9316, "step": 42478 }, { "epoch": 0.8, "learning_rate": 4.993712005406234e-07, "loss": 0.8281, "step": 42479 }, { "epoch": 0.8, "learning_rate": 4.992795962092137e-07, "loss": 0.7968, "step": 42480 }, { "epoch": 0.8, "learning_rate": 4.991879993484311e-07, "loss": 1.0097, "step": 42481 }, { "epoch": 0.8, "learning_rate": 4.990964099586201e-07, "loss": 1.0426, "step": 42482 }, { "epoch": 0.8, "learning_rate": 4.990048280401224e-07, "loss": 0.8424, "step": 42483 }, { "epoch": 0.8, "learning_rate": 4.989132535932778e-07, "loss": 0.7498, "step": 42484 }, { "epoch": 0.8, "learning_rate": 4.988216866184311e-07, "loss": 0.8514, "step": 42485 }, { "epoch": 0.8, "learning_rate": 4.987301271159226e-07, "loss": 0.921, "step": 42486 }, { "epoch": 0.8, "learning_rate": 4.986385750860942e-07, "loss": 1.2466, "step": 42487 }, { "epoch": 0.8, "learning_rate": 4.985470305292878e-07, "loss": 0.8973, "step": 42488 }, { "epoch": 0.8, "learning_rate": 4.984554934458457e-07, "loss": 0.691, "step": 42489 }, { "epoch": 0.8, "learning_rate": 4.983639638361093e-07, "loss": 0.8949, "step": 42490 }, { "epoch": 0.8, "learning_rate": 4.982724417004204e-07, "loss": 0.9315, "step": 42491 }, { "epoch": 0.8, "learning_rate": 4.981809270391216e-07, "loss": 0.9026, "step": 42492 }, { "epoch": 0.8, "learning_rate": 4.980894198525524e-07, "loss": 1.0259, "step": 42493 }, { "epoch": 0.8, "learning_rate": 4.979979201410576e-07, "loss": 0.9508, "step": 42494 }, { "epoch": 0.8, "learning_rate": 4.979064279049761e-07, "loss": 0.8149, "step": 42495 }, { "epoch": 0.8, "learning_rate": 4.978149431446508e-07, "loss": 1.0363, "step": 42496 }, { "epoch": 0.8, "learning_rate": 4.97723465860423e-07, "loss": 0.8511, "step": 42497 }, { "epoch": 0.8, "learning_rate": 4.976319960526347e-07, "loss": 0.9807, "step": 42498 }, { "epoch": 0.8, "learning_rate": 4.975405337216268e-07, "loss": 0.8521, "step": 42499 }, { "epoch": 0.8, "learning_rate": 4.974490788677414e-07, "loss": 1.102, "step": 42500 }, { "epoch": 0.8, "learning_rate": 4.9735763149132e-07, "loss": 0.9211, "step": 42501 }, { "epoch": 0.8, "learning_rate": 4.97266191592703e-07, "loss": 0.7199, "step": 42502 }, { "epoch": 0.8, "learning_rate": 4.971747591722328e-07, "loss": 0.8801, "step": 42503 }, { "epoch": 0.8, "learning_rate": 4.970833342302517e-07, "loss": 0.8576, "step": 42504 }, { "epoch": 0.8, "learning_rate": 4.969919167670986e-07, "loss": 0.9205, "step": 42505 }, { "epoch": 0.8, "learning_rate": 4.969005067831175e-07, "loss": 1.2133, "step": 42506 }, { "epoch": 0.8, "learning_rate": 4.968091042786477e-07, "loss": 0.6949, "step": 42507 }, { "epoch": 0.8, "learning_rate": 4.967177092540316e-07, "loss": 0.783, "step": 42508 }, { "epoch": 0.8, "learning_rate": 4.966263217096098e-07, "loss": 0.8782, "step": 42509 }, { "epoch": 0.8, "learning_rate": 4.965349416457244e-07, "loss": 0.666, "step": 42510 }, { "epoch": 0.8, "learning_rate": 4.964435690627156e-07, "loss": 0.793, "step": 42511 }, { "epoch": 0.8, "learning_rate": 4.963522039609253e-07, "loss": 1.0426, "step": 42512 }, { "epoch": 0.8, "learning_rate": 4.962608463406952e-07, "loss": 1.05, "step": 42513 }, { "epoch": 0.8, "learning_rate": 4.961694962023641e-07, "loss": 0.7064, "step": 42514 }, { "epoch": 0.8, "learning_rate": 4.960781535462761e-07, "loss": 0.8649, "step": 42515 }, { "epoch": 0.8, "learning_rate": 4.9598681837277e-07, "loss": 0.8, "step": 42516 }, { "epoch": 0.8, "learning_rate": 4.958954906821881e-07, "loss": 1.0218, "step": 42517 }, { "epoch": 0.8, "learning_rate": 4.958041704748706e-07, "loss": 1.0168, "step": 42518 }, { "epoch": 0.8, "learning_rate": 4.957128577511591e-07, "loss": 1.105, "step": 42519 }, { "epoch": 0.8, "learning_rate": 4.956215525113941e-07, "loss": 1.0234, "step": 42520 }, { "epoch": 0.8, "learning_rate": 4.955302547559171e-07, "loss": 0.8658, "step": 42521 }, { "epoch": 0.8, "learning_rate": 4.95438964485069e-07, "loss": 0.8876, "step": 42522 }, { "epoch": 0.8, "learning_rate": 4.953476816991893e-07, "loss": 0.8904, "step": 42523 }, { "epoch": 0.8, "learning_rate": 4.952564063986204e-07, "loss": 0.8038, "step": 42524 }, { "epoch": 0.8, "learning_rate": 4.951651385837033e-07, "loss": 1.1594, "step": 42525 }, { "epoch": 0.8, "learning_rate": 4.950738782547767e-07, "loss": 1.0798, "step": 42526 }, { "epoch": 0.8, "learning_rate": 4.949826254121842e-07, "loss": 0.761, "step": 42527 }, { "epoch": 0.8, "learning_rate": 4.948913800562644e-07, "loss": 1.0533, "step": 42528 }, { "epoch": 0.8, "learning_rate": 4.948001421873588e-07, "loss": 0.9919, "step": 42529 }, { "epoch": 0.8, "learning_rate": 4.947089118058079e-07, "loss": 0.8461, "step": 42530 }, { "epoch": 0.8, "learning_rate": 4.946176889119525e-07, "loss": 1.14, "step": 42531 }, { "epoch": 0.8, "learning_rate": 4.945264735061331e-07, "loss": 1.1395, "step": 42532 }, { "epoch": 0.8, "learning_rate": 4.944352655886902e-07, "loss": 0.8179, "step": 42533 }, { "epoch": 0.8, "learning_rate": 4.943440651599654e-07, "loss": 0.7957, "step": 42534 }, { "epoch": 0.8, "learning_rate": 4.942528722202972e-07, "loss": 0.8277, "step": 42535 }, { "epoch": 0.8, "learning_rate": 4.941616867700283e-07, "loss": 0.9356, "step": 42536 }, { "epoch": 0.8, "learning_rate": 4.940705088094974e-07, "loss": 0.8704, "step": 42537 }, { "epoch": 0.8, "learning_rate": 4.93979338339046e-07, "loss": 1.0315, "step": 42538 }, { "epoch": 0.8, "learning_rate": 4.938881753590141e-07, "loss": 0.7524, "step": 42539 }, { "epoch": 0.8, "learning_rate": 4.937970198697426e-07, "loss": 0.939, "step": 42540 }, { "epoch": 0.8, "learning_rate": 4.937058718715709e-07, "loss": 0.9816, "step": 42541 }, { "epoch": 0.8, "learning_rate": 4.936147313648404e-07, "loss": 0.9749, "step": 42542 }, { "epoch": 0.8, "learning_rate": 4.935235983498915e-07, "loss": 1.0473, "step": 42543 }, { "epoch": 0.8, "learning_rate": 4.934324728270628e-07, "loss": 1.0769, "step": 42544 }, { "epoch": 0.8, "learning_rate": 4.933413547966962e-07, "loss": 0.9014, "step": 42545 }, { "epoch": 0.8, "learning_rate": 4.932502442591322e-07, "loss": 1.1151, "step": 42546 }, { "epoch": 0.8, "learning_rate": 4.931591412147088e-07, "loss": 0.8646, "step": 42547 }, { "epoch": 0.8, "learning_rate": 4.93068045663769e-07, "loss": 0.8058, "step": 42548 }, { "epoch": 0.8, "learning_rate": 4.92976957606651e-07, "loss": 0.915, "step": 42549 }, { "epoch": 0.8, "learning_rate": 4.928858770436957e-07, "loss": 0.7612, "step": 42550 }, { "epoch": 0.8, "learning_rate": 4.927948039752426e-07, "loss": 0.7929, "step": 42551 }, { "epoch": 0.8, "learning_rate": 4.927037384016323e-07, "loss": 0.8122, "step": 42552 }, { "epoch": 0.8, "learning_rate": 4.926126803232048e-07, "loss": 0.879, "step": 42553 }, { "epoch": 0.8, "learning_rate": 4.925216297402999e-07, "loss": 0.7409, "step": 42554 }, { "epoch": 0.8, "learning_rate": 4.924305866532583e-07, "loss": 1.0627, "step": 42555 }, { "epoch": 0.8, "learning_rate": 4.923395510624182e-07, "loss": 1.0585, "step": 42556 }, { "epoch": 0.8, "learning_rate": 4.92248522968122e-07, "loss": 0.9439, "step": 42557 }, { "epoch": 0.8, "learning_rate": 4.921575023707073e-07, "loss": 0.935, "step": 42558 }, { "epoch": 0.8, "learning_rate": 4.920664892705151e-07, "loss": 0.7507, "step": 42559 }, { "epoch": 0.8, "learning_rate": 4.919754836678853e-07, "loss": 0.9337, "step": 42560 }, { "epoch": 0.8, "learning_rate": 4.918844855631571e-07, "loss": 0.7912, "step": 42561 }, { "epoch": 0.8, "learning_rate": 4.917934949566708e-07, "loss": 0.952, "step": 42562 }, { "epoch": 0.8, "learning_rate": 4.917025118487659e-07, "loss": 0.8927, "step": 42563 }, { "epoch": 0.8, "learning_rate": 4.916115362397831e-07, "loss": 0.8994, "step": 42564 }, { "epoch": 0.8, "learning_rate": 4.915205681300599e-07, "loss": 0.5815, "step": 42565 }, { "epoch": 0.8, "learning_rate": 4.914296075199379e-07, "loss": 0.7919, "step": 42566 }, { "epoch": 0.8, "learning_rate": 4.913386544097567e-07, "loss": 0.8203, "step": 42567 }, { "epoch": 0.8, "learning_rate": 4.912477087998544e-07, "loss": 1.1263, "step": 42568 }, { "epoch": 0.8, "learning_rate": 4.911567706905726e-07, "loss": 1.1628, "step": 42569 }, { "epoch": 0.8, "learning_rate": 4.910658400822493e-07, "loss": 0.8399, "step": 42570 }, { "epoch": 0.8, "learning_rate": 4.909749169752245e-07, "loss": 0.9406, "step": 42571 }, { "epoch": 0.8, "learning_rate": 4.908840013698377e-07, "loss": 0.8622, "step": 42572 }, { "epoch": 0.8, "learning_rate": 4.907930932664287e-07, "loss": 0.8174, "step": 42573 }, { "epoch": 0.8, "learning_rate": 4.907021926653363e-07, "loss": 0.9912, "step": 42574 }, { "epoch": 0.8, "learning_rate": 4.906112995669008e-07, "loss": 0.932, "step": 42575 }, { "epoch": 0.8, "learning_rate": 4.905204139714612e-07, "loss": 0.8044, "step": 42576 }, { "epoch": 0.8, "learning_rate": 4.904295358793556e-07, "loss": 0.891, "step": 42577 }, { "epoch": 0.8, "learning_rate": 4.903386652909261e-07, "loss": 0.9407, "step": 42578 }, { "epoch": 0.8, "learning_rate": 4.902478022065097e-07, "loss": 0.6958, "step": 42579 }, { "epoch": 0.8, "learning_rate": 4.901569466264461e-07, "loss": 0.7909, "step": 42580 }, { "epoch": 0.8, "learning_rate": 4.90066098551075e-07, "loss": 1.0557, "step": 42581 }, { "epoch": 0.8, "learning_rate": 4.899752579807354e-07, "loss": 0.9885, "step": 42582 }, { "epoch": 0.8, "learning_rate": 4.898844249157667e-07, "loss": 0.7147, "step": 42583 }, { "epoch": 0.8, "learning_rate": 4.897935993565078e-07, "loss": 0.7542, "step": 42584 }, { "epoch": 0.8, "learning_rate": 4.897027813032986e-07, "loss": 0.7322, "step": 42585 }, { "epoch": 0.8, "learning_rate": 4.896119707564764e-07, "loss": 0.8918, "step": 42586 }, { "epoch": 0.8, "learning_rate": 4.895211677163822e-07, "loss": 0.8732, "step": 42587 }, { "epoch": 0.8, "learning_rate": 4.894303721833546e-07, "loss": 0.8404, "step": 42588 }, { "epoch": 0.8, "learning_rate": 4.893395841577314e-07, "loss": 0.9193, "step": 42589 }, { "epoch": 0.8, "learning_rate": 4.892488036398538e-07, "loss": 0.9767, "step": 42590 }, { "epoch": 0.8, "learning_rate": 4.891580306300586e-07, "loss": 0.9569, "step": 42591 }, { "epoch": 0.8, "learning_rate": 4.89067265128686e-07, "loss": 0.8373, "step": 42592 }, { "epoch": 0.8, "learning_rate": 4.889765071360744e-07, "loss": 0.9359, "step": 42593 }, { "epoch": 0.8, "learning_rate": 4.888857566525629e-07, "loss": 0.9481, "step": 42594 }, { "epoch": 0.8, "learning_rate": 4.887950136784902e-07, "loss": 1.0565, "step": 42595 }, { "epoch": 0.8, "learning_rate": 4.887042782141954e-07, "loss": 1.1105, "step": 42596 }, { "epoch": 0.8, "learning_rate": 4.886135502600175e-07, "loss": 1.0057, "step": 42597 }, { "epoch": 0.8, "learning_rate": 4.885228298162939e-07, "loss": 0.8085, "step": 42598 }, { "epoch": 0.8, "learning_rate": 4.884321168833659e-07, "loss": 0.927, "step": 42599 }, { "epoch": 0.8, "learning_rate": 4.883414114615698e-07, "loss": 0.7608, "step": 42600 }, { "epoch": 0.8, "learning_rate": 4.882507135512446e-07, "loss": 0.7292, "step": 42601 }, { "epoch": 0.8, "learning_rate": 4.881600231527306e-07, "loss": 0.6856, "step": 42602 }, { "epoch": 0.8, "learning_rate": 4.88069340266365e-07, "loss": 0.8269, "step": 42603 }, { "epoch": 0.8, "learning_rate": 4.879786648924875e-07, "loss": 0.9549, "step": 42604 }, { "epoch": 0.8, "learning_rate": 4.878879970314346e-07, "loss": 0.9794, "step": 42605 }, { "epoch": 0.8, "learning_rate": 4.877973366835467e-07, "loss": 1.1263, "step": 42606 }, { "epoch": 0.8, "learning_rate": 4.877066838491626e-07, "loss": 0.8693, "step": 42607 }, { "epoch": 0.8, "learning_rate": 4.876160385286188e-07, "loss": 0.947, "step": 42608 }, { "epoch": 0.8, "learning_rate": 4.875254007222563e-07, "loss": 0.7369, "step": 42609 }, { "epoch": 0.8, "learning_rate": 4.874347704304116e-07, "loss": 0.9971, "step": 42610 }, { "epoch": 0.8, "learning_rate": 4.873441476534238e-07, "loss": 0.9424, "step": 42611 }, { "epoch": 0.8, "learning_rate": 4.872535323916314e-07, "loss": 0.9851, "step": 42612 }, { "epoch": 0.8, "learning_rate": 4.871629246453721e-07, "loss": 1.0032, "step": 42613 }, { "epoch": 0.8, "learning_rate": 4.870723244149852e-07, "loss": 0.9581, "step": 42614 }, { "epoch": 0.8, "learning_rate": 4.869817317008082e-07, "loss": 0.9942, "step": 42615 }, { "epoch": 0.8, "learning_rate": 4.868911465031806e-07, "loss": 0.8081, "step": 42616 }, { "epoch": 0.8, "learning_rate": 4.868005688224384e-07, "loss": 0.8407, "step": 42617 }, { "epoch": 0.8, "learning_rate": 4.867099986589225e-07, "loss": 1.0523, "step": 42618 }, { "epoch": 0.8, "learning_rate": 4.866194360129689e-07, "loss": 1.0877, "step": 42619 }, { "epoch": 0.8, "learning_rate": 4.865288808849167e-07, "loss": 0.7978, "step": 42620 }, { "epoch": 0.8, "learning_rate": 4.864383332751039e-07, "loss": 0.9132, "step": 42621 }, { "epoch": 0.8, "learning_rate": 4.863477931838684e-07, "loss": 0.8798, "step": 42622 }, { "epoch": 0.8, "learning_rate": 4.862572606115487e-07, "loss": 0.8056, "step": 42623 }, { "epoch": 0.8, "learning_rate": 4.861667355584828e-07, "loss": 0.6469, "step": 42624 }, { "epoch": 0.8, "learning_rate": 4.86076218025009e-07, "loss": 0.9378, "step": 42625 }, { "epoch": 0.8, "learning_rate": 4.859857080114636e-07, "loss": 1.1238, "step": 42626 }, { "epoch": 0.8, "learning_rate": 4.858952055181864e-07, "loss": 0.8568, "step": 42627 }, { "epoch": 0.8, "learning_rate": 4.858047105455158e-07, "loss": 0.808, "step": 42628 }, { "epoch": 0.8, "learning_rate": 4.85714223093787e-07, "loss": 1.0591, "step": 42629 }, { "epoch": 0.8, "learning_rate": 4.856237431633407e-07, "loss": 0.7782, "step": 42630 }, { "epoch": 0.8, "learning_rate": 4.855332707545133e-07, "loss": 0.8853, "step": 42631 }, { "epoch": 0.8, "learning_rate": 4.854428058676425e-07, "loss": 0.9242, "step": 42632 }, { "epoch": 0.8, "learning_rate": 4.853523485030667e-07, "loss": 0.7885, "step": 42633 }, { "epoch": 0.8, "learning_rate": 4.852618986611235e-07, "loss": 0.792, "step": 42634 }, { "epoch": 0.8, "learning_rate": 4.851714563421505e-07, "loss": 0.8792, "step": 42635 }, { "epoch": 0.8, "learning_rate": 4.850810215464858e-07, "loss": 1.0422, "step": 42636 }, { "epoch": 0.8, "learning_rate": 4.84990594274467e-07, "loss": 1.0399, "step": 42637 }, { "epoch": 0.8, "learning_rate": 4.849001745264307e-07, "loss": 1.0151, "step": 42638 }, { "epoch": 0.8, "learning_rate": 4.848097623027162e-07, "loss": 0.9106, "step": 42639 }, { "epoch": 0.8, "learning_rate": 4.847193576036599e-07, "loss": 0.7875, "step": 42640 }, { "epoch": 0.8, "learning_rate": 4.846289604295996e-07, "loss": 1.0286, "step": 42641 }, { "epoch": 0.8, "learning_rate": 4.84538570780873e-07, "loss": 0.7419, "step": 42642 }, { "epoch": 0.8, "learning_rate": 4.844481886578176e-07, "loss": 1.0677, "step": 42643 }, { "epoch": 0.8, "learning_rate": 4.843578140607707e-07, "loss": 0.8405, "step": 42644 }, { "epoch": 0.8, "learning_rate": 4.842674469900702e-07, "loss": 0.8224, "step": 42645 }, { "epoch": 0.8, "learning_rate": 4.841770874460539e-07, "loss": 0.905, "step": 42646 }, { "epoch": 0.8, "learning_rate": 4.840867354290571e-07, "loss": 0.9078, "step": 42647 }, { "epoch": 0.8, "learning_rate": 4.839963909394193e-07, "loss": 0.8006, "step": 42648 }, { "epoch": 0.8, "learning_rate": 4.839060539774779e-07, "loss": 0.9283, "step": 42649 }, { "epoch": 0.8, "learning_rate": 4.838157245435679e-07, "loss": 1.0249, "step": 42650 }, { "epoch": 0.8, "learning_rate": 4.837254026380297e-07, "loss": 0.8332, "step": 42651 }, { "epoch": 0.8, "learning_rate": 4.836350882611984e-07, "loss": 0.9573, "step": 42652 }, { "epoch": 0.8, "learning_rate": 4.835447814134117e-07, "loss": 0.8076, "step": 42653 }, { "epoch": 0.8, "learning_rate": 4.834544820950071e-07, "loss": 0.9593, "step": 42654 }, { "epoch": 0.8, "learning_rate": 4.833641903063215e-07, "loss": 1.0787, "step": 42655 }, { "epoch": 0.8, "learning_rate": 4.832739060476924e-07, "loss": 1.0789, "step": 42656 }, { "epoch": 0.8, "learning_rate": 4.831836293194567e-07, "loss": 0.8631, "step": 42657 }, { "epoch": 0.8, "learning_rate": 4.83093360121952e-07, "loss": 0.8132, "step": 42658 }, { "epoch": 0.8, "learning_rate": 4.830030984555134e-07, "loss": 0.7747, "step": 42659 }, { "epoch": 0.8, "learning_rate": 4.829128443204808e-07, "loss": 0.736, "step": 42660 }, { "epoch": 0.8, "learning_rate": 4.828225977171893e-07, "loss": 0.9873, "step": 42661 }, { "epoch": 0.8, "learning_rate": 4.827323586459765e-07, "loss": 1.0617, "step": 42662 }, { "epoch": 0.8, "learning_rate": 4.826421271071788e-07, "loss": 1.1277, "step": 42663 }, { "epoch": 0.8, "learning_rate": 4.825519031011339e-07, "loss": 0.8234, "step": 42664 }, { "epoch": 0.8, "learning_rate": 4.824616866281781e-07, "loss": 0.7975, "step": 42665 }, { "epoch": 0.8, "learning_rate": 4.823714776886485e-07, "loss": 0.915, "step": 42666 }, { "epoch": 0.8, "learning_rate": 4.822812762828827e-07, "loss": 0.8573, "step": 42667 }, { "epoch": 0.81, "learning_rate": 4.821910824112155e-07, "loss": 0.8374, "step": 42668 }, { "epoch": 0.81, "learning_rate": 4.821008960739853e-07, "loss": 1.0015, "step": 42669 }, { "epoch": 0.81, "learning_rate": 4.820107172715293e-07, "loss": 0.9726, "step": 42670 }, { "epoch": 0.81, "learning_rate": 4.819205460041823e-07, "loss": 0.8231, "step": 42671 }, { "epoch": 0.81, "learning_rate": 4.818303822722834e-07, "loss": 0.7652, "step": 42672 }, { "epoch": 0.81, "learning_rate": 4.817402260761669e-07, "loss": 0.8099, "step": 42673 }, { "epoch": 0.81, "learning_rate": 4.816500774161708e-07, "loss": 0.8255, "step": 42674 }, { "epoch": 0.81, "learning_rate": 4.815599362926316e-07, "loss": 0.833, "step": 42675 }, { "epoch": 0.81, "learning_rate": 4.814698027058853e-07, "loss": 0.8846, "step": 42676 }, { "epoch": 0.81, "learning_rate": 4.813796766562692e-07, "loss": 0.8876, "step": 42677 }, { "epoch": 0.81, "learning_rate": 4.812895581441193e-07, "loss": 0.9359, "step": 42678 }, { "epoch": 0.81, "learning_rate": 4.811994471697731e-07, "loss": 0.8079, "step": 42679 }, { "epoch": 0.81, "learning_rate": 4.811093437335651e-07, "loss": 0.8381, "step": 42680 }, { "epoch": 0.81, "learning_rate": 4.810192478358339e-07, "loss": 1.1038, "step": 42681 }, { "epoch": 0.81, "learning_rate": 4.809291594769144e-07, "loss": 0.9753, "step": 42682 }, { "epoch": 0.81, "learning_rate": 4.808390786571435e-07, "loss": 0.8097, "step": 42683 }, { "epoch": 0.81, "learning_rate": 4.807490053768577e-07, "loss": 0.8963, "step": 42684 }, { "epoch": 0.81, "learning_rate": 4.806589396363928e-07, "loss": 0.7463, "step": 42685 }, { "epoch": 0.81, "learning_rate": 4.805688814360859e-07, "loss": 1.1638, "step": 42686 }, { "epoch": 0.81, "learning_rate": 4.804788307762728e-07, "loss": 0.9482, "step": 42687 }, { "epoch": 0.81, "learning_rate": 4.803887876572904e-07, "loss": 1.0305, "step": 42688 }, { "epoch": 0.81, "learning_rate": 4.80298752079473e-07, "loss": 1.0693, "step": 42689 }, { "epoch": 0.81, "learning_rate": 4.802087240431588e-07, "loss": 1.0742, "step": 42690 }, { "epoch": 0.81, "learning_rate": 4.80118703548684e-07, "loss": 0.8947, "step": 42691 }, { "epoch": 0.81, "learning_rate": 4.800286905963827e-07, "loss": 0.8707, "step": 42692 }, { "epoch": 0.81, "learning_rate": 4.799386851865939e-07, "loss": 1.0435, "step": 42693 }, { "epoch": 0.81, "learning_rate": 4.798486873196511e-07, "loss": 0.987, "step": 42694 }, { "epoch": 0.81, "learning_rate": 4.797586969958914e-07, "loss": 0.7961, "step": 42695 }, { "epoch": 0.81, "learning_rate": 4.796687142156511e-07, "loss": 0.868, "step": 42696 }, { "epoch": 0.81, "learning_rate": 4.795787389792656e-07, "loss": 0.8229, "step": 42697 }, { "epoch": 0.81, "learning_rate": 4.794887712870714e-07, "loss": 0.8015, "step": 42698 }, { "epoch": 0.81, "learning_rate": 4.793988111394038e-07, "loss": 0.9883, "step": 42699 }, { "epoch": 0.81, "learning_rate": 4.793088585365999e-07, "loss": 1.0519, "step": 42700 }, { "epoch": 0.81, "learning_rate": 4.792189134789934e-07, "loss": 0.9649, "step": 42701 }, { "epoch": 0.81, "learning_rate": 4.791289759669229e-07, "loss": 0.7394, "step": 42702 }, { "epoch": 0.81, "learning_rate": 4.790390460007225e-07, "loss": 0.6738, "step": 42703 }, { "epoch": 0.81, "learning_rate": 4.789491235807278e-07, "loss": 0.8007, "step": 42704 }, { "epoch": 0.81, "learning_rate": 4.788592087072755e-07, "loss": 0.7594, "step": 42705 }, { "epoch": 0.81, "learning_rate": 4.787693013807008e-07, "loss": 1.1682, "step": 42706 }, { "epoch": 0.81, "learning_rate": 4.786794016013394e-07, "loss": 1.1226, "step": 42707 }, { "epoch": 0.81, "learning_rate": 4.785895093695272e-07, "loss": 0.873, "step": 42708 }, { "epoch": 0.81, "learning_rate": 4.784996246856005e-07, "loss": 0.7467, "step": 42709 }, { "epoch": 0.81, "learning_rate": 4.784097475498931e-07, "loss": 0.7613, "step": 42710 }, { "epoch": 0.81, "learning_rate": 4.783198779627421e-07, "loss": 0.88, "step": 42711 }, { "epoch": 0.81, "learning_rate": 4.782300159244835e-07, "loss": 1.1412, "step": 42712 }, { "epoch": 0.81, "learning_rate": 4.781401614354506e-07, "loss": 0.9164, "step": 42713 }, { "epoch": 0.81, "learning_rate": 4.780503144959819e-07, "loss": 0.8924, "step": 42714 }, { "epoch": 0.81, "learning_rate": 4.779604751064104e-07, "loss": 0.8566, "step": 42715 }, { "epoch": 0.81, "learning_rate": 4.778706432670727e-07, "loss": 0.8637, "step": 42716 }, { "epoch": 0.81, "learning_rate": 4.777808189783037e-07, "loss": 1.0152, "step": 42717 }, { "epoch": 0.81, "learning_rate": 4.776910022404394e-07, "loss": 1.0536, "step": 42718 }, { "epoch": 0.81, "learning_rate": 4.776011930538149e-07, "loss": 0.9237, "step": 42719 }, { "epoch": 0.81, "learning_rate": 4.775113914187654e-07, "loss": 0.9874, "step": 42720 }, { "epoch": 0.81, "learning_rate": 4.774215973356272e-07, "loss": 0.78, "step": 42721 }, { "epoch": 0.81, "learning_rate": 4.773318108047331e-07, "loss": 0.8979, "step": 42722 }, { "epoch": 0.81, "learning_rate": 4.772420318264217e-07, "loss": 0.8055, "step": 42723 }, { "epoch": 0.81, "learning_rate": 4.771522604010256e-07, "loss": 0.7543, "step": 42724 }, { "epoch": 0.81, "learning_rate": 4.770624965288812e-07, "loss": 0.8021, "step": 42725 }, { "epoch": 0.81, "learning_rate": 4.76972740210323e-07, "loss": 1.0688, "step": 42726 }, { "epoch": 0.81, "learning_rate": 4.768829914456869e-07, "loss": 0.8824, "step": 42727 }, { "epoch": 0.81, "learning_rate": 4.767932502353076e-07, "loss": 0.8417, "step": 42728 }, { "epoch": 0.81, "learning_rate": 4.7670351657952027e-07, "loss": 0.7014, "step": 42729 }, { "epoch": 0.81, "learning_rate": 4.766137904786605e-07, "loss": 0.7989, "step": 42730 }, { "epoch": 0.81, "learning_rate": 4.765240719330619e-07, "loss": 0.9161, "step": 42731 }, { "epoch": 0.81, "learning_rate": 4.764343609430605e-07, "loss": 0.926, "step": 42732 }, { "epoch": 0.81, "learning_rate": 4.763446575089922e-07, "loss": 0.8034, "step": 42733 }, { "epoch": 0.81, "learning_rate": 4.762549616311893e-07, "loss": 0.8857, "step": 42734 }, { "epoch": 0.81, "learning_rate": 4.761652733099897e-07, "loss": 0.8417, "step": 42735 }, { "epoch": 0.81, "learning_rate": 4.760755925457264e-07, "loss": 1.0276, "step": 42736 }, { "epoch": 0.81, "learning_rate": 4.7598591933873476e-07, "loss": 0.9947, "step": 42737 }, { "epoch": 0.81, "learning_rate": 4.7589625368934964e-07, "loss": 0.7082, "step": 42738 }, { "epoch": 0.81, "learning_rate": 4.7580659559790574e-07, "loss": 0.7693, "step": 42739 }, { "epoch": 0.81, "learning_rate": 4.757169450647381e-07, "loss": 0.833, "step": 42740 }, { "epoch": 0.81, "learning_rate": 4.756273020901811e-07, "loss": 0.9196, "step": 42741 }, { "epoch": 0.81, "learning_rate": 4.755376666745706e-07, "loss": 0.9729, "step": 42742 }, { "epoch": 0.81, "learning_rate": 4.754480388182389e-07, "loss": 1.0851, "step": 42743 }, { "epoch": 0.81, "learning_rate": 4.753584185215235e-07, "loss": 0.9102, "step": 42744 }, { "epoch": 0.81, "learning_rate": 4.7526880578475707e-07, "loss": 0.9327, "step": 42745 }, { "epoch": 0.81, "learning_rate": 4.7517920060827475e-07, "loss": 0.8802, "step": 42746 }, { "epoch": 0.81, "learning_rate": 4.7508960299241126e-07, "loss": 1.0214, "step": 42747 }, { "epoch": 0.81, "learning_rate": 4.7500001293750125e-07, "loss": 0.8014, "step": 42748 }, { "epoch": 0.81, "learning_rate": 4.7491043044387897e-07, "loss": 0.9581, "step": 42749 }, { "epoch": 0.81, "learning_rate": 4.7482085551187884e-07, "loss": 1.062, "step": 42750 }, { "epoch": 0.81, "learning_rate": 4.7473128814183644e-07, "loss": 0.8799, "step": 42751 }, { "epoch": 0.81, "learning_rate": 4.74641728334084e-07, "loss": 0.8929, "step": 42752 }, { "epoch": 0.81, "learning_rate": 4.745521760889579e-07, "loss": 0.7792, "step": 42753 }, { "epoch": 0.81, "learning_rate": 4.7446263140679264e-07, "loss": 0.8149, "step": 42754 }, { "epoch": 0.81, "learning_rate": 4.743730942879202e-07, "loss": 0.9807, "step": 42755 }, { "epoch": 0.81, "learning_rate": 4.7428356473267793e-07, "loss": 1.0865, "step": 42756 }, { "epoch": 0.81, "learning_rate": 4.7419404274139824e-07, "loss": 1.0888, "step": 42757 }, { "epoch": 0.81, "learning_rate": 4.741045283144158e-07, "loss": 0.9435, "step": 42758 }, { "epoch": 0.81, "learning_rate": 4.7401502145206476e-07, "loss": 0.8849, "step": 42759 }, { "epoch": 0.81, "learning_rate": 4.7392552215467983e-07, "loss": 0.7239, "step": 42760 }, { "epoch": 0.81, "learning_rate": 4.7383603042259475e-07, "loss": 0.7404, "step": 42761 }, { "epoch": 0.81, "learning_rate": 4.737465462561436e-07, "loss": 1.0948, "step": 42762 }, { "epoch": 0.81, "learning_rate": 4.7365706965566166e-07, "loss": 0.8672, "step": 42763 }, { "epoch": 0.81, "learning_rate": 4.735676006214807e-07, "loss": 0.9273, "step": 42764 }, { "epoch": 0.81, "learning_rate": 4.734781391539373e-07, "loss": 0.9185, "step": 42765 }, { "epoch": 0.81, "learning_rate": 4.7338868525336394e-07, "loss": 0.8702, "step": 42766 }, { "epoch": 0.81, "learning_rate": 4.7329923892009496e-07, "loss": 0.9294, "step": 42767 }, { "epoch": 0.81, "learning_rate": 4.7320980015446467e-07, "loss": 1.022, "step": 42768 }, { "epoch": 0.81, "learning_rate": 4.731203689568067e-07, "loss": 1.1074, "step": 42769 }, { "epoch": 0.81, "learning_rate": 4.7303094532745535e-07, "loss": 1.0045, "step": 42770 }, { "epoch": 0.81, "learning_rate": 4.7294152926674416e-07, "loss": 0.7927, "step": 42771 }, { "epoch": 0.81, "learning_rate": 4.7285212077500753e-07, "loss": 0.8755, "step": 42772 }, { "epoch": 0.81, "learning_rate": 4.7276271985257807e-07, "loss": 0.7597, "step": 42773 }, { "epoch": 0.81, "learning_rate": 4.726733264997907e-07, "loss": 0.876, "step": 42774 }, { "epoch": 0.81, "learning_rate": 4.7258394071697994e-07, "loss": 1.2198, "step": 42775 }, { "epoch": 0.81, "learning_rate": 4.7249456250447715e-07, "loss": 0.7515, "step": 42776 }, { "epoch": 0.81, "learning_rate": 4.724051918626188e-07, "loss": 0.9991, "step": 42777 }, { "epoch": 0.81, "learning_rate": 4.723158287917368e-07, "loss": 0.8318, "step": 42778 }, { "epoch": 0.81, "learning_rate": 4.7222647329216496e-07, "loss": 0.6252, "step": 42779 }, { "epoch": 0.81, "learning_rate": 4.721371253642376e-07, "loss": 1.0172, "step": 42780 }, { "epoch": 0.81, "learning_rate": 4.72047785008288e-07, "loss": 0.8537, "step": 42781 }, { "epoch": 0.81, "learning_rate": 4.719584522246498e-07, "loss": 0.8965, "step": 42782 }, { "epoch": 0.81, "learning_rate": 4.7186912701365635e-07, "loss": 0.9213, "step": 42783 }, { "epoch": 0.81, "learning_rate": 4.7177980937564233e-07, "loss": 1.0022, "step": 42784 }, { "epoch": 0.81, "learning_rate": 4.7169049931093893e-07, "loss": 0.8684, "step": 42785 }, { "epoch": 0.81, "learning_rate": 4.716011968198822e-07, "loss": 0.8405, "step": 42786 }, { "epoch": 0.81, "learning_rate": 4.715119019028039e-07, "loss": 0.9554, "step": 42787 }, { "epoch": 0.81, "learning_rate": 4.7142261456003783e-07, "loss": 0.7923, "step": 42788 }, { "epoch": 0.81, "learning_rate": 4.7133333479191746e-07, "loss": 0.9993, "step": 42789 }, { "epoch": 0.81, "learning_rate": 4.712440625987763e-07, "loss": 0.806, "step": 42790 }, { "epoch": 0.81, "learning_rate": 4.7115479798094776e-07, "loss": 0.8237, "step": 42791 }, { "epoch": 0.81, "learning_rate": 4.710655409387649e-07, "loss": 0.8696, "step": 42792 }, { "epoch": 0.81, "learning_rate": 4.7097629147256184e-07, "loss": 0.9939, "step": 42793 }, { "epoch": 0.81, "learning_rate": 4.708870495826695e-07, "loss": 0.9537, "step": 42794 }, { "epoch": 0.81, "learning_rate": 4.707978152694237e-07, "loss": 0.908, "step": 42795 }, { "epoch": 0.81, "learning_rate": 4.707085885331572e-07, "loss": 0.899, "step": 42796 }, { "epoch": 0.81, "learning_rate": 4.7061936937420116e-07, "loss": 0.8882, "step": 42797 }, { "epoch": 0.81, "learning_rate": 4.7053015779289167e-07, "loss": 0.9791, "step": 42798 }, { "epoch": 0.81, "learning_rate": 4.7044095378955936e-07, "loss": 0.9648, "step": 42799 }, { "epoch": 0.81, "learning_rate": 4.7035175736453857e-07, "loss": 1.1463, "step": 42800 }, { "epoch": 0.81, "learning_rate": 4.702625685181622e-07, "loss": 0.9585, "step": 42801 }, { "epoch": 0.81, "learning_rate": 4.70173387250763e-07, "loss": 0.8573, "step": 42802 }, { "epoch": 0.81, "learning_rate": 4.7008421356267406e-07, "loss": 0.8183, "step": 42803 }, { "epoch": 0.81, "learning_rate": 4.6999504745422865e-07, "loss": 0.7612, "step": 42804 }, { "epoch": 0.81, "learning_rate": 4.699058889257599e-07, "loss": 0.8957, "step": 42805 }, { "epoch": 0.81, "learning_rate": 4.698167379775992e-07, "loss": 1.1437, "step": 42806 }, { "epoch": 0.81, "learning_rate": 4.6972759461008185e-07, "loss": 1.129, "step": 42807 }, { "epoch": 0.81, "learning_rate": 4.6963845882353867e-07, "loss": 0.8344, "step": 42808 }, { "epoch": 0.81, "learning_rate": 4.6954933061830326e-07, "loss": 0.7569, "step": 42809 }, { "epoch": 0.81, "learning_rate": 4.694602099947082e-07, "loss": 0.825, "step": 42810 }, { "epoch": 0.81, "learning_rate": 4.693710969530868e-07, "loss": 0.8956, "step": 42811 }, { "epoch": 0.81, "learning_rate": 4.692819914937713e-07, "loss": 1.0142, "step": 42812 }, { "epoch": 0.81, "learning_rate": 4.6919289361709447e-07, "loss": 0.8909, "step": 42813 }, { "epoch": 0.81, "learning_rate": 4.6910380332338994e-07, "loss": 0.9252, "step": 42814 }, { "epoch": 0.81, "learning_rate": 4.6901472061298833e-07, "loss": 0.9761, "step": 42815 }, { "epoch": 0.81, "learning_rate": 4.68925645486224e-07, "loss": 0.7998, "step": 42816 }, { "epoch": 0.81, "learning_rate": 4.688365779434295e-07, "loss": 0.5831, "step": 42817 }, { "epoch": 0.81, "learning_rate": 4.6874751798493574e-07, "loss": 1.1605, "step": 42818 }, { "epoch": 0.81, "learning_rate": 4.686584656110779e-07, "loss": 0.9474, "step": 42819 }, { "epoch": 0.81, "learning_rate": 4.685694208221864e-07, "loss": 0.858, "step": 42820 }, { "epoch": 0.81, "learning_rate": 4.6848038361859444e-07, "loss": 0.8485, "step": 42821 }, { "epoch": 0.81, "learning_rate": 4.6839135400063434e-07, "loss": 0.6885, "step": 42822 }, { "epoch": 0.81, "learning_rate": 4.683023319686386e-07, "loss": 0.8608, "step": 42823 }, { "epoch": 0.81, "learning_rate": 4.6821331752293977e-07, "loss": 0.993, "step": 42824 }, { "epoch": 0.81, "learning_rate": 4.6812431066386996e-07, "loss": 1.0023, "step": 42825 }, { "epoch": 0.81, "learning_rate": 4.680353113917624e-07, "loss": 1.0084, "step": 42826 }, { "epoch": 0.81, "learning_rate": 4.6794631970694756e-07, "loss": 0.8832, "step": 42827 }, { "epoch": 0.81, "learning_rate": 4.678573356097599e-07, "loss": 0.8007, "step": 42828 }, { "epoch": 0.81, "learning_rate": 4.6776835910053e-07, "loss": 0.8987, "step": 42829 }, { "epoch": 0.81, "learning_rate": 4.676793901795909e-07, "loss": 1.0364, "step": 42830 }, { "epoch": 0.81, "learning_rate": 4.675904288472746e-07, "loss": 1.1642, "step": 42831 }, { "epoch": 0.81, "learning_rate": 4.6750147510391334e-07, "loss": 0.8173, "step": 42832 }, { "epoch": 0.81, "learning_rate": 4.6741252894983907e-07, "loss": 0.8384, "step": 42833 }, { "epoch": 0.81, "learning_rate": 4.673235903853843e-07, "loss": 1.0552, "step": 42834 }, { "epoch": 0.81, "learning_rate": 4.672346594108815e-07, "loss": 0.9221, "step": 42835 }, { "epoch": 0.81, "learning_rate": 4.67145736026661e-07, "loss": 0.7194, "step": 42836 }, { "epoch": 0.81, "learning_rate": 4.6705682023305636e-07, "loss": 1.1282, "step": 42837 }, { "epoch": 0.81, "learning_rate": 4.669679120304002e-07, "loss": 0.8561, "step": 42838 }, { "epoch": 0.81, "learning_rate": 4.6687901141902246e-07, "loss": 1.0485, "step": 42839 }, { "epoch": 0.81, "learning_rate": 4.667901183992565e-07, "loss": 0.943, "step": 42840 }, { "epoch": 0.81, "learning_rate": 4.6670123297143375e-07, "loss": 0.7802, "step": 42841 }, { "epoch": 0.81, "learning_rate": 4.666123551358864e-07, "loss": 0.9681, "step": 42842 }, { "epoch": 0.81, "learning_rate": 4.665234848929459e-07, "loss": 0.9702, "step": 42843 }, { "epoch": 0.81, "learning_rate": 4.6643462224294473e-07, "loss": 0.7848, "step": 42844 }, { "epoch": 0.81, "learning_rate": 4.6634576718621457e-07, "loss": 1.0764, "step": 42845 }, { "epoch": 0.81, "learning_rate": 4.6625691972308597e-07, "loss": 0.9169, "step": 42846 }, { "epoch": 0.81, "learning_rate": 4.661680798538928e-07, "loss": 0.6786, "step": 42847 }, { "epoch": 0.81, "learning_rate": 4.660792475789652e-07, "loss": 0.979, "step": 42848 }, { "epoch": 0.81, "learning_rate": 4.6599042289863504e-07, "loss": 0.8067, "step": 42849 }, { "epoch": 0.81, "learning_rate": 4.659016058132346e-07, "loss": 1.063, "step": 42850 }, { "epoch": 0.81, "learning_rate": 4.658127963230949e-07, "loss": 0.8578, "step": 42851 }, { "epoch": 0.81, "learning_rate": 4.65723994428548e-07, "loss": 0.9429, "step": 42852 }, { "epoch": 0.81, "learning_rate": 4.656352001299255e-07, "loss": 0.8567, "step": 42853 }, { "epoch": 0.81, "learning_rate": 4.655464134275592e-07, "loss": 0.8021, "step": 42854 }, { "epoch": 0.81, "learning_rate": 4.65457634321779e-07, "loss": 1.0466, "step": 42855 }, { "epoch": 0.81, "learning_rate": 4.6536886281291885e-07, "loss": 1.0688, "step": 42856 }, { "epoch": 0.81, "learning_rate": 4.652800989013084e-07, "loss": 0.8954, "step": 42857 }, { "epoch": 0.81, "learning_rate": 4.6519134258727896e-07, "loss": 0.9648, "step": 42858 }, { "epoch": 0.81, "learning_rate": 4.6510259387116395e-07, "loss": 1.1141, "step": 42859 }, { "epoch": 0.81, "learning_rate": 4.65013852753293e-07, "loss": 1.0504, "step": 42860 }, { "epoch": 0.81, "learning_rate": 4.649251192339976e-07, "loss": 0.9977, "step": 42861 }, { "epoch": 0.81, "learning_rate": 4.648363933136096e-07, "loss": 1.0503, "step": 42862 }, { "epoch": 0.81, "learning_rate": 4.6474767499246036e-07, "loss": 0.9194, "step": 42863 }, { "epoch": 0.81, "learning_rate": 4.6465896427088043e-07, "loss": 0.6938, "step": 42864 }, { "epoch": 0.81, "learning_rate": 4.645702611492017e-07, "loss": 1.0534, "step": 42865 }, { "epoch": 0.81, "learning_rate": 4.6448156562775597e-07, "loss": 0.7934, "step": 42866 }, { "epoch": 0.81, "learning_rate": 4.6439287770687234e-07, "loss": 0.7394, "step": 42867 }, { "epoch": 0.81, "learning_rate": 4.643041973868845e-07, "loss": 0.926, "step": 42868 }, { "epoch": 0.81, "learning_rate": 4.6421552466812183e-07, "loss": 1.0268, "step": 42869 }, { "epoch": 0.81, "learning_rate": 4.6412685955091574e-07, "loss": 0.7577, "step": 42870 }, { "epoch": 0.81, "learning_rate": 4.6403820203559794e-07, "loss": 0.7629, "step": 42871 }, { "epoch": 0.81, "learning_rate": 4.6394955212249874e-07, "loss": 0.979, "step": 42872 }, { "epoch": 0.81, "learning_rate": 4.638609098119495e-07, "loss": 0.7592, "step": 42873 }, { "epoch": 0.81, "learning_rate": 4.637722751042814e-07, "loss": 0.9756, "step": 42874 }, { "epoch": 0.81, "learning_rate": 4.636836479998255e-07, "loss": 1.0851, "step": 42875 }, { "epoch": 0.81, "learning_rate": 4.635950284989116e-07, "loss": 1.0322, "step": 42876 }, { "epoch": 0.81, "learning_rate": 4.635064166018724e-07, "loss": 0.9525, "step": 42877 }, { "epoch": 0.81, "learning_rate": 4.6341781230903717e-07, "loss": 0.9793, "step": 42878 }, { "epoch": 0.81, "learning_rate": 4.633292156207367e-07, "loss": 0.9618, "step": 42879 }, { "epoch": 0.81, "learning_rate": 4.6324062653730376e-07, "loss": 0.7528, "step": 42880 }, { "epoch": 0.81, "learning_rate": 4.6315204505906733e-07, "loss": 0.9451, "step": 42881 }, { "epoch": 0.81, "learning_rate": 4.630634711863588e-07, "loss": 0.8822, "step": 42882 }, { "epoch": 0.81, "learning_rate": 4.629749049195087e-07, "loss": 0.8511, "step": 42883 }, { "epoch": 0.81, "learning_rate": 4.628863462588479e-07, "loss": 1.0105, "step": 42884 }, { "epoch": 0.81, "learning_rate": 4.627977952047072e-07, "loss": 0.7354, "step": 42885 }, { "epoch": 0.81, "learning_rate": 4.627092517574167e-07, "loss": 0.9301, "step": 42886 }, { "epoch": 0.81, "learning_rate": 4.6262071591730825e-07, "loss": 1.0728, "step": 42887 }, { "epoch": 0.81, "learning_rate": 4.6253218768471025e-07, "loss": 1.1888, "step": 42888 }, { "epoch": 0.81, "learning_rate": 4.624436670599558e-07, "loss": 0.861, "step": 42889 }, { "epoch": 0.81, "learning_rate": 4.6235515404337377e-07, "loss": 0.8653, "step": 42890 }, { "epoch": 0.81, "learning_rate": 4.62266648635295e-07, "loss": 0.9492, "step": 42891 }, { "epoch": 0.81, "learning_rate": 4.621781508360501e-07, "loss": 1.0121, "step": 42892 }, { "epoch": 0.81, "learning_rate": 4.620896606459693e-07, "loss": 1.0292, "step": 42893 }, { "epoch": 0.81, "learning_rate": 4.6200117806538355e-07, "loss": 0.9112, "step": 42894 }, { "epoch": 0.81, "learning_rate": 4.6191270309462274e-07, "loss": 0.9433, "step": 42895 }, { "epoch": 0.81, "learning_rate": 4.618242357340183e-07, "loss": 0.9063, "step": 42896 }, { "epoch": 0.81, "learning_rate": 4.617357759838981e-07, "loss": 0.873, "step": 42897 }, { "epoch": 0.81, "learning_rate": 4.616473238445954e-07, "loss": 0.7589, "step": 42898 }, { "epoch": 0.81, "learning_rate": 4.615588793164383e-07, "loss": 0.9964, "step": 42899 }, { "epoch": 0.81, "learning_rate": 4.6147044239975734e-07, "loss": 1.1105, "step": 42900 }, { "epoch": 0.81, "learning_rate": 4.6138201309488454e-07, "loss": 0.9819, "step": 42901 }, { "epoch": 0.81, "learning_rate": 4.6129359140214824e-07, "loss": 0.8642, "step": 42902 }, { "epoch": 0.81, "learning_rate": 4.61205177321879e-07, "loss": 0.7018, "step": 42903 }, { "epoch": 0.81, "learning_rate": 4.611167708544073e-07, "loss": 0.6001, "step": 42904 }, { "epoch": 0.81, "learning_rate": 4.6102837200006275e-07, "loss": 0.8432, "step": 42905 }, { "epoch": 0.81, "learning_rate": 4.6093998075917607e-07, "loss": 1.0277, "step": 42906 }, { "epoch": 0.81, "learning_rate": 4.6085159713207676e-07, "loss": 0.9665, "step": 42907 }, { "epoch": 0.81, "learning_rate": 4.60763221119096e-07, "loss": 0.733, "step": 42908 }, { "epoch": 0.81, "learning_rate": 4.606748527205612e-07, "loss": 0.8666, "step": 42909 }, { "epoch": 0.81, "learning_rate": 4.605864919368055e-07, "loss": 0.9758, "step": 42910 }, { "epoch": 0.81, "learning_rate": 4.6049813876815644e-07, "loss": 0.8391, "step": 42911 }, { "epoch": 0.81, "learning_rate": 4.604097932149451e-07, "loss": 0.8514, "step": 42912 }, { "epoch": 0.81, "learning_rate": 4.6032145527750093e-07, "loss": 1.0114, "step": 42913 }, { "epoch": 0.81, "learning_rate": 4.602331249561537e-07, "loss": 0.9059, "step": 42914 }, { "epoch": 0.81, "learning_rate": 4.6014480225123367e-07, "loss": 0.9933, "step": 42915 }, { "epoch": 0.81, "learning_rate": 4.6005648716307027e-07, "loss": 0.8094, "step": 42916 }, { "epoch": 0.81, "learning_rate": 4.599681796919941e-07, "loss": 0.9668, "step": 42917 }, { "epoch": 0.81, "learning_rate": 4.5987987983833307e-07, "loss": 1.2322, "step": 42918 }, { "epoch": 0.81, "learning_rate": 4.597915876024192e-07, "loss": 1.0397, "step": 42919 }, { "epoch": 0.81, "learning_rate": 4.5970330298458044e-07, "loss": 0.8629, "step": 42920 }, { "epoch": 0.81, "learning_rate": 4.5961502598514616e-07, "loss": 1.0004, "step": 42921 }, { "epoch": 0.81, "learning_rate": 4.5952675660444814e-07, "loss": 0.9683, "step": 42922 }, { "epoch": 0.81, "learning_rate": 4.5943849484281407e-07, "loss": 0.8315, "step": 42923 }, { "epoch": 0.81, "learning_rate": 4.59350240700574e-07, "loss": 0.8558, "step": 42924 }, { "epoch": 0.81, "learning_rate": 4.592619941780577e-07, "loss": 0.7997, "step": 42925 }, { "epoch": 0.81, "learning_rate": 4.5917375527559426e-07, "loss": 0.928, "step": 42926 }, { "epoch": 0.81, "learning_rate": 4.590855239935138e-07, "loss": 0.9013, "step": 42927 }, { "epoch": 0.81, "learning_rate": 4.589973003321452e-07, "loss": 0.836, "step": 42928 }, { "epoch": 0.81, "learning_rate": 4.58909084291819e-07, "loss": 0.7768, "step": 42929 }, { "epoch": 0.81, "learning_rate": 4.5882087587286213e-07, "loss": 0.9952, "step": 42930 }, { "epoch": 0.81, "learning_rate": 4.587326750756069e-07, "loss": 1.2073, "step": 42931 }, { "epoch": 0.81, "learning_rate": 4.5864448190038044e-07, "loss": 0.9198, "step": 42932 }, { "epoch": 0.81, "learning_rate": 4.585562963475132e-07, "loss": 0.9668, "step": 42933 }, { "epoch": 0.81, "learning_rate": 4.58468118417334e-07, "loss": 0.9434, "step": 42934 }, { "epoch": 0.81, "learning_rate": 4.583799481101725e-07, "loss": 0.7495, "step": 42935 }, { "epoch": 0.81, "learning_rate": 4.5829178542635745e-07, "loss": 0.8031, "step": 42936 }, { "epoch": 0.81, "learning_rate": 4.5820363036621824e-07, "loss": 0.7193, "step": 42937 }, { "epoch": 0.81, "learning_rate": 4.5811548293008463e-07, "loss": 0.8682, "step": 42938 }, { "epoch": 0.81, "learning_rate": 4.580273431182841e-07, "loss": 1.0092, "step": 42939 }, { "epoch": 0.81, "learning_rate": 4.579392109311481e-07, "loss": 0.8569, "step": 42940 }, { "epoch": 0.81, "learning_rate": 4.578510863690039e-07, "loss": 1.0028, "step": 42941 }, { "epoch": 0.81, "learning_rate": 4.577629694321806e-07, "loss": 0.7375, "step": 42942 }, { "epoch": 0.81, "learning_rate": 4.5767486012100876e-07, "loss": 1.1671, "step": 42943 }, { "epoch": 0.81, "learning_rate": 4.5758675843581566e-07, "loss": 1.1012, "step": 42944 }, { "epoch": 0.81, "learning_rate": 4.5749866437693134e-07, "loss": 0.9309, "step": 42945 }, { "epoch": 0.81, "learning_rate": 4.5741057794468414e-07, "loss": 0.8233, "step": 42946 }, { "epoch": 0.81, "learning_rate": 4.573224991394032e-07, "loss": 0.8762, "step": 42947 }, { "epoch": 0.81, "learning_rate": 4.572344279614177e-07, "loss": 0.7495, "step": 42948 }, { "epoch": 0.81, "learning_rate": 4.57146364411056e-07, "loss": 0.9905, "step": 42949 }, { "epoch": 0.81, "learning_rate": 4.5705830848864764e-07, "loss": 0.8903, "step": 42950 }, { "epoch": 0.81, "learning_rate": 4.569702601945197e-07, "loss": 0.9311, "step": 42951 }, { "epoch": 0.81, "learning_rate": 4.5688221952900373e-07, "loss": 0.8439, "step": 42952 }, { "epoch": 0.81, "learning_rate": 4.567941864924261e-07, "loss": 0.8913, "step": 42953 }, { "epoch": 0.81, "learning_rate": 4.567061610851162e-07, "loss": 0.688, "step": 42954 }, { "epoch": 0.81, "learning_rate": 4.5661814330740293e-07, "loss": 0.881, "step": 42955 }, { "epoch": 0.81, "learning_rate": 4.56530133159615e-07, "loss": 1.0331, "step": 42956 }, { "epoch": 0.81, "learning_rate": 4.5644213064208075e-07, "loss": 0.82, "step": 42957 }, { "epoch": 0.81, "learning_rate": 4.56354135755129e-07, "loss": 0.8803, "step": 42958 }, { "epoch": 0.81, "learning_rate": 4.562661484990888e-07, "loss": 0.7538, "step": 42959 }, { "epoch": 0.81, "learning_rate": 4.5617816887428694e-07, "loss": 0.8692, "step": 42960 }, { "epoch": 0.81, "learning_rate": 4.5609019688105437e-07, "loss": 0.7321, "step": 42961 }, { "epoch": 0.81, "learning_rate": 4.5600223251971777e-07, "loss": 1.0752, "step": 42962 }, { "epoch": 0.81, "learning_rate": 4.559142757906054e-07, "loss": 0.9048, "step": 42963 }, { "epoch": 0.81, "learning_rate": 4.558263266940477e-07, "loss": 0.9875, "step": 42964 }, { "epoch": 0.81, "learning_rate": 4.5573838523037125e-07, "loss": 0.7215, "step": 42965 }, { "epoch": 0.81, "learning_rate": 4.556504513999052e-07, "loss": 0.9413, "step": 42966 }, { "epoch": 0.81, "learning_rate": 4.5556252520297746e-07, "loss": 0.946, "step": 42967 }, { "epoch": 0.81, "learning_rate": 4.554746066399165e-07, "loss": 1.0698, "step": 42968 }, { "epoch": 0.81, "learning_rate": 4.553866957110509e-07, "loss": 0.8861, "step": 42969 }, { "epoch": 0.81, "learning_rate": 4.5529879241670847e-07, "loss": 0.7946, "step": 42970 }, { "epoch": 0.81, "learning_rate": 4.552108967572183e-07, "loss": 0.9242, "step": 42971 }, { "epoch": 0.81, "learning_rate": 4.55123008732907e-07, "loss": 0.7815, "step": 42972 }, { "epoch": 0.81, "learning_rate": 4.550351283441046e-07, "loss": 0.7233, "step": 42973 }, { "epoch": 0.81, "learning_rate": 4.549472555911377e-07, "loss": 0.9459, "step": 42974 }, { "epoch": 0.81, "learning_rate": 4.548593904743354e-07, "loss": 1.0297, "step": 42975 }, { "epoch": 0.81, "learning_rate": 4.5477153299402497e-07, "loss": 0.9669, "step": 42976 }, { "epoch": 0.81, "learning_rate": 4.5468368315053524e-07, "loss": 0.9198, "step": 42977 }, { "epoch": 0.81, "learning_rate": 4.545958409441939e-07, "loss": 1.011, "step": 42978 }, { "epoch": 0.81, "learning_rate": 4.5450800637532875e-07, "loss": 0.8692, "step": 42979 }, { "epoch": 0.81, "learning_rate": 4.54420179444269e-07, "loss": 0.9332, "step": 42980 }, { "epoch": 0.81, "learning_rate": 4.5433236015133996e-07, "loss": 0.8527, "step": 42981 }, { "epoch": 0.81, "learning_rate": 4.542445484968727e-07, "loss": 0.9242, "step": 42982 }, { "epoch": 0.81, "learning_rate": 4.5415674448119283e-07, "loss": 0.784, "step": 42983 }, { "epoch": 0.81, "learning_rate": 4.5406894810462814e-07, "loss": 0.9278, "step": 42984 }, { "epoch": 0.81, "learning_rate": 4.5398115936750866e-07, "loss": 0.7504, "step": 42985 }, { "epoch": 0.81, "learning_rate": 4.538933782701602e-07, "loss": 0.9875, "step": 42986 }, { "epoch": 0.81, "learning_rate": 4.5380560481291107e-07, "loss": 1.1606, "step": 42987 }, { "epoch": 0.81, "learning_rate": 4.5371783899608915e-07, "loss": 0.9062, "step": 42988 }, { "epoch": 0.81, "learning_rate": 4.536300808200222e-07, "loss": 0.845, "step": 42989 }, { "epoch": 0.81, "learning_rate": 4.5354233028503755e-07, "loss": 0.8352, "step": 42990 }, { "epoch": 0.81, "learning_rate": 4.5345458739146336e-07, "loss": 0.7036, "step": 42991 }, { "epoch": 0.81, "learning_rate": 4.533668521396273e-07, "loss": 0.743, "step": 42992 }, { "epoch": 0.81, "learning_rate": 4.532791245298557e-07, "loss": 0.7552, "step": 42993 }, { "epoch": 0.81, "learning_rate": 4.53191404562478e-07, "loss": 0.9775, "step": 42994 }, { "epoch": 0.81, "learning_rate": 4.5310369223782043e-07, "loss": 0.9951, "step": 42995 }, { "epoch": 0.81, "learning_rate": 4.53015987556211e-07, "loss": 0.7197, "step": 42996 }, { "epoch": 0.81, "learning_rate": 4.529282905179772e-07, "loss": 1.0146, "step": 42997 }, { "epoch": 0.81, "learning_rate": 4.52840601123446e-07, "loss": 0.7504, "step": 42998 }, { "epoch": 0.81, "learning_rate": 4.5275291937294546e-07, "loss": 0.6736, "step": 42999 }, { "epoch": 0.81, "learning_rate": 4.526652452668029e-07, "loss": 1.0862, "step": 43000 }, { "epoch": 0.81, "learning_rate": 4.5257757880534574e-07, "loss": 0.8908, "step": 43001 }, { "epoch": 0.81, "learning_rate": 4.524899199889002e-07, "loss": 0.7619, "step": 43002 }, { "epoch": 0.81, "learning_rate": 4.524022688177956e-07, "loss": 0.7749, "step": 43003 }, { "epoch": 0.81, "learning_rate": 4.523146252923577e-07, "loss": 0.7296, "step": 43004 }, { "epoch": 0.81, "learning_rate": 4.522269894129136e-07, "loss": 0.7809, "step": 43005 }, { "epoch": 0.81, "learning_rate": 4.5213936117979225e-07, "loss": 0.8841, "step": 43006 }, { "epoch": 0.81, "learning_rate": 4.520517405933192e-07, "loss": 1.0539, "step": 43007 }, { "epoch": 0.81, "learning_rate": 4.5196412765382195e-07, "loss": 0.9703, "step": 43008 }, { "epoch": 0.81, "learning_rate": 4.518765223616281e-07, "loss": 0.8054, "step": 43009 }, { "epoch": 0.81, "learning_rate": 4.5178892471706454e-07, "loss": 0.7372, "step": 43010 }, { "epoch": 0.81, "learning_rate": 4.5170133472045824e-07, "loss": 0.8391, "step": 43011 }, { "epoch": 0.81, "learning_rate": 4.5161375237213615e-07, "loss": 1.0026, "step": 43012 }, { "epoch": 0.81, "learning_rate": 4.515261776724264e-07, "loss": 1.035, "step": 43013 }, { "epoch": 0.81, "learning_rate": 4.514386106216537e-07, "loss": 0.8588, "step": 43014 }, { "epoch": 0.81, "learning_rate": 4.513510512201477e-07, "loss": 0.8627, "step": 43015 }, { "epoch": 0.81, "learning_rate": 4.5126349946823353e-07, "loss": 0.8768, "step": 43016 }, { "epoch": 0.81, "learning_rate": 4.511759553662387e-07, "loss": 0.7467, "step": 43017 }, { "epoch": 0.81, "learning_rate": 4.5108841891448983e-07, "loss": 1.0188, "step": 43018 }, { "epoch": 0.81, "learning_rate": 4.510008901133142e-07, "loss": 1.0327, "step": 43019 }, { "epoch": 0.81, "learning_rate": 4.5091336896303823e-07, "loss": 0.8382, "step": 43020 }, { "epoch": 0.81, "learning_rate": 4.5082585546398884e-07, "loss": 0.894, "step": 43021 }, { "epoch": 0.81, "learning_rate": 4.5073834961649384e-07, "loss": 0.8953, "step": 43022 }, { "epoch": 0.81, "learning_rate": 4.506508514208774e-07, "loss": 0.8657, "step": 43023 }, { "epoch": 0.81, "learning_rate": 4.5056336087746927e-07, "loss": 0.8989, "step": 43024 }, { "epoch": 0.81, "learning_rate": 4.504758779865942e-07, "loss": 0.9043, "step": 43025 }, { "epoch": 0.81, "learning_rate": 4.503884027485786e-07, "loss": 1.0023, "step": 43026 }, { "epoch": 0.81, "learning_rate": 4.5030093516375106e-07, "loss": 0.917, "step": 43027 }, { "epoch": 0.81, "learning_rate": 4.5021347523243633e-07, "loss": 1.0515, "step": 43028 }, { "epoch": 0.81, "learning_rate": 4.501260229549617e-07, "loss": 0.8179, "step": 43029 }, { "epoch": 0.81, "learning_rate": 4.500385783316538e-07, "loss": 0.9556, "step": 43030 }, { "epoch": 0.81, "learning_rate": 4.499511413628388e-07, "loss": 0.9934, "step": 43031 }, { "epoch": 0.81, "learning_rate": 4.498637120488433e-07, "loss": 0.8406, "step": 43032 }, { "epoch": 0.81, "learning_rate": 4.497762903899941e-07, "loss": 0.7263, "step": 43033 }, { "epoch": 0.81, "learning_rate": 4.496888763866181e-07, "loss": 0.6905, "step": 43034 }, { "epoch": 0.81, "learning_rate": 4.496014700390394e-07, "loss": 0.7843, "step": 43035 }, { "epoch": 0.81, "learning_rate": 4.4951407134758733e-07, "loss": 1.0627, "step": 43036 }, { "epoch": 0.81, "learning_rate": 4.49426680312586e-07, "loss": 1.1245, "step": 43037 }, { "epoch": 0.81, "learning_rate": 4.4933929693436296e-07, "loss": 0.9743, "step": 43038 }, { "epoch": 0.81, "learning_rate": 4.4925192121324373e-07, "loss": 0.9035, "step": 43039 }, { "epoch": 0.81, "learning_rate": 4.491645531495553e-07, "loss": 0.8769, "step": 43040 }, { "epoch": 0.81, "learning_rate": 4.490771927436233e-07, "loss": 0.9715, "step": 43041 }, { "epoch": 0.81, "learning_rate": 4.4898983999577426e-07, "loss": 0.86, "step": 43042 }, { "epoch": 0.81, "learning_rate": 4.4890249490633504e-07, "loss": 1.087, "step": 43043 }, { "epoch": 0.81, "learning_rate": 4.488151574756294e-07, "loss": 0.9951, "step": 43044 }, { "epoch": 0.81, "learning_rate": 4.4872782770398663e-07, "loss": 0.9041, "step": 43045 }, { "epoch": 0.81, "learning_rate": 4.486405055917306e-07, "loss": 0.9316, "step": 43046 }, { "epoch": 0.81, "learning_rate": 4.4855319113918743e-07, "loss": 0.9272, "step": 43047 }, { "epoch": 0.81, "learning_rate": 4.484658843466849e-07, "loss": 0.811, "step": 43048 }, { "epoch": 0.81, "learning_rate": 4.4837858521454725e-07, "loss": 1.0292, "step": 43049 }, { "epoch": 0.81, "learning_rate": 4.482912937431011e-07, "loss": 1.1264, "step": 43050 }, { "epoch": 0.81, "learning_rate": 4.482040099326723e-07, "loss": 0.9641, "step": 43051 }, { "epoch": 0.81, "learning_rate": 4.4811673378358676e-07, "loss": 0.8574, "step": 43052 }, { "epoch": 0.81, "learning_rate": 4.4802946529617056e-07, "loss": 0.828, "step": 43053 }, { "epoch": 0.81, "learning_rate": 4.4794220447074933e-07, "loss": 0.8958, "step": 43054 }, { "epoch": 0.81, "learning_rate": 4.4785495130764966e-07, "loss": 1.0204, "step": 43055 }, { "epoch": 0.81, "learning_rate": 4.4776770580719527e-07, "loss": 1.2919, "step": 43056 }, { "epoch": 0.81, "learning_rate": 4.476804679697147e-07, "loss": 0.8163, "step": 43057 }, { "epoch": 0.81, "learning_rate": 4.4759323779553196e-07, "loss": 0.9379, "step": 43058 }, { "epoch": 0.81, "learning_rate": 4.4750601528497276e-07, "loss": 0.8975, "step": 43059 }, { "epoch": 0.81, "learning_rate": 4.474188004383634e-07, "loss": 0.7429, "step": 43060 }, { "epoch": 0.81, "learning_rate": 4.473315932560293e-07, "loss": 0.8611, "step": 43061 }, { "epoch": 0.81, "learning_rate": 4.4724439373829586e-07, "loss": 1.1026, "step": 43062 }, { "epoch": 0.81, "learning_rate": 4.4715720188548914e-07, "loss": 1.1042, "step": 43063 }, { "epoch": 0.81, "learning_rate": 4.470700176979351e-07, "loss": 0.8517, "step": 43064 }, { "epoch": 0.81, "learning_rate": 4.4698284117595747e-07, "loss": 0.9949, "step": 43065 }, { "epoch": 0.81, "learning_rate": 4.468956723198842e-07, "loss": 0.7621, "step": 43066 }, { "epoch": 0.81, "learning_rate": 4.468085111300388e-07, "loss": 0.7727, "step": 43067 }, { "epoch": 0.81, "learning_rate": 4.46721357606747e-07, "loss": 1.0481, "step": 43068 }, { "epoch": 0.81, "learning_rate": 4.4663421175033556e-07, "loss": 0.9597, "step": 43069 }, { "epoch": 0.81, "learning_rate": 4.465470735611288e-07, "loss": 0.9354, "step": 43070 }, { "epoch": 0.81, "learning_rate": 4.464599430394523e-07, "loss": 0.863, "step": 43071 }, { "epoch": 0.81, "learning_rate": 4.46372820185631e-07, "loss": 0.712, "step": 43072 }, { "epoch": 0.81, "learning_rate": 4.462857049999911e-07, "loss": 0.8136, "step": 43073 }, { "epoch": 0.81, "learning_rate": 4.461985974828578e-07, "loss": 0.7173, "step": 43074 }, { "epoch": 0.81, "learning_rate": 4.4611149763455483e-07, "loss": 1.1265, "step": 43075 }, { "epoch": 0.81, "learning_rate": 4.460244054554097e-07, "loss": 1.1382, "step": 43076 }, { "epoch": 0.81, "learning_rate": 4.459373209457457e-07, "loss": 0.7369, "step": 43077 }, { "epoch": 0.81, "learning_rate": 4.45850244105889e-07, "loss": 0.8997, "step": 43078 }, { "epoch": 0.81, "learning_rate": 4.4576317493616433e-07, "loss": 0.7027, "step": 43079 }, { "epoch": 0.81, "learning_rate": 4.4567611343689725e-07, "loss": 0.9647, "step": 43080 }, { "epoch": 0.81, "learning_rate": 4.4558905960841226e-07, "loss": 0.9174, "step": 43081 }, { "epoch": 0.81, "learning_rate": 4.455020134510349e-07, "loss": 0.9401, "step": 43082 }, { "epoch": 0.81, "learning_rate": 4.454149749650907e-07, "loss": 0.9449, "step": 43083 }, { "epoch": 0.81, "learning_rate": 4.453279441509029e-07, "loss": 0.9351, "step": 43084 }, { "epoch": 0.81, "learning_rate": 4.452409210087985e-07, "loss": 1.0269, "step": 43085 }, { "epoch": 0.81, "learning_rate": 4.45153905539101e-07, "loss": 0.7129, "step": 43086 }, { "epoch": 0.81, "learning_rate": 4.450668977421357e-07, "loss": 0.8868, "step": 43087 }, { "epoch": 0.81, "learning_rate": 4.4497989761822764e-07, "loss": 0.9372, "step": 43088 }, { "epoch": 0.81, "learning_rate": 4.4489290516770174e-07, "loss": 0.8288, "step": 43089 }, { "epoch": 0.81, "learning_rate": 4.448059203908825e-07, "loss": 1.0448, "step": 43090 }, { "epoch": 0.81, "learning_rate": 4.4471894328809523e-07, "loss": 0.9321, "step": 43091 }, { "epoch": 0.81, "learning_rate": 4.4463197385966495e-07, "loss": 0.8857, "step": 43092 }, { "epoch": 0.81, "learning_rate": 4.4454501210591443e-07, "loss": 1.0481, "step": 43093 }, { "epoch": 0.81, "learning_rate": 4.444580580271707e-07, "loss": 0.9962, "step": 43094 }, { "epoch": 0.81, "learning_rate": 4.443711116237578e-07, "loss": 1.2033, "step": 43095 }, { "epoch": 0.81, "learning_rate": 4.442841728959993e-07, "loss": 0.8741, "step": 43096 }, { "epoch": 0.81, "learning_rate": 4.441972418442217e-07, "loss": 0.7555, "step": 43097 }, { "epoch": 0.81, "learning_rate": 4.4411031846874815e-07, "loss": 0.7916, "step": 43098 }, { "epoch": 0.81, "learning_rate": 4.440234027699034e-07, "loss": 0.9437, "step": 43099 }, { "epoch": 0.81, "learning_rate": 4.439364947480124e-07, "loss": 0.9559, "step": 43100 }, { "epoch": 0.81, "learning_rate": 4.4384959440339934e-07, "loss": 0.7983, "step": 43101 }, { "epoch": 0.81, "learning_rate": 4.437627017363888e-07, "loss": 0.8068, "step": 43102 }, { "epoch": 0.81, "learning_rate": 4.4367581674730543e-07, "loss": 0.7451, "step": 43103 }, { "epoch": 0.81, "learning_rate": 4.4358893943647426e-07, "loss": 0.6457, "step": 43104 }, { "epoch": 0.81, "learning_rate": 4.435020698042175e-07, "loss": 0.9762, "step": 43105 }, { "epoch": 0.81, "learning_rate": 4.434152078508622e-07, "loss": 0.9556, "step": 43106 }, { "epoch": 0.81, "learning_rate": 4.4332835357673075e-07, "loss": 0.9964, "step": 43107 }, { "epoch": 0.81, "learning_rate": 4.432415069821483e-07, "loss": 0.9124, "step": 43108 }, { "epoch": 0.81, "learning_rate": 4.4315466806743895e-07, "loss": 0.9054, "step": 43109 }, { "epoch": 0.81, "learning_rate": 4.430678368329272e-07, "loss": 0.7473, "step": 43110 }, { "epoch": 0.81, "learning_rate": 4.4298101327893693e-07, "loss": 0.8109, "step": 43111 }, { "epoch": 0.81, "learning_rate": 4.4289419740579236e-07, "loss": 0.9401, "step": 43112 }, { "epoch": 0.81, "learning_rate": 4.428073892138188e-07, "loss": 1.0369, "step": 43113 }, { "epoch": 0.81, "learning_rate": 4.4272058870333757e-07, "loss": 0.8736, "step": 43114 }, { "epoch": 0.81, "learning_rate": 4.426337958746757e-07, "loss": 0.9336, "step": 43115 }, { "epoch": 0.81, "learning_rate": 4.4254701072815654e-07, "loss": 0.6866, "step": 43116 }, { "epoch": 0.81, "learning_rate": 4.424602332641026e-07, "loss": 0.9249, "step": 43117 }, { "epoch": 0.81, "learning_rate": 4.4237346348284025e-07, "loss": 0.8858, "step": 43118 }, { "epoch": 0.81, "learning_rate": 4.422867013846915e-07, "loss": 1.0804, "step": 43119 }, { "epoch": 0.81, "learning_rate": 4.421999469699814e-07, "loss": 0.933, "step": 43120 }, { "epoch": 0.81, "learning_rate": 4.4211320023903354e-07, "loss": 0.9521, "step": 43121 }, { "epoch": 0.81, "learning_rate": 4.420264611921718e-07, "loss": 0.995, "step": 43122 }, { "epoch": 0.81, "learning_rate": 4.419397298297204e-07, "loss": 0.8765, "step": 43123 }, { "epoch": 0.81, "learning_rate": 4.4185300615200266e-07, "loss": 0.8915, "step": 43124 }, { "epoch": 0.81, "learning_rate": 4.4176629015934337e-07, "loss": 0.995, "step": 43125 }, { "epoch": 0.81, "learning_rate": 4.4167958185206447e-07, "loss": 0.8794, "step": 43126 }, { "epoch": 0.81, "learning_rate": 4.4159288123049206e-07, "loss": 0.9107, "step": 43127 }, { "epoch": 0.81, "learning_rate": 4.415061882949481e-07, "loss": 0.9865, "step": 43128 }, { "epoch": 0.81, "learning_rate": 4.4141950304575713e-07, "loss": 0.9579, "step": 43129 }, { "epoch": 0.81, "learning_rate": 4.413328254832425e-07, "loss": 0.8427, "step": 43130 }, { "epoch": 0.81, "learning_rate": 4.4124615560772797e-07, "loss": 1.1218, "step": 43131 }, { "epoch": 0.81, "learning_rate": 4.411594934195371e-07, "loss": 1.0432, "step": 43132 }, { "epoch": 0.81, "learning_rate": 4.4107283891899363e-07, "loss": 1.0388, "step": 43133 }, { "epoch": 0.81, "learning_rate": 4.409861921064215e-07, "loss": 0.9382, "step": 43134 }, { "epoch": 0.81, "learning_rate": 4.4089955298214275e-07, "loss": 1.0045, "step": 43135 }, { "epoch": 0.81, "learning_rate": 4.408129215464826e-07, "loss": 0.8703, "step": 43136 }, { "epoch": 0.81, "learning_rate": 4.407262977997645e-07, "loss": 0.8353, "step": 43137 }, { "epoch": 0.81, "learning_rate": 4.406396817423098e-07, "loss": 1.1181, "step": 43138 }, { "epoch": 0.81, "learning_rate": 4.405530733744448e-07, "loss": 0.9409, "step": 43139 }, { "epoch": 0.81, "learning_rate": 4.404664726964908e-07, "loss": 0.8667, "step": 43140 }, { "epoch": 0.81, "learning_rate": 4.403798797087719e-07, "loss": 0.6956, "step": 43141 }, { "epoch": 0.81, "learning_rate": 4.402932944116112e-07, "loss": 0.8928, "step": 43142 }, { "epoch": 0.81, "learning_rate": 4.402067168053323e-07, "loss": 1.0889, "step": 43143 }, { "epoch": 0.81, "learning_rate": 4.401201468902586e-07, "loss": 1.0929, "step": 43144 }, { "epoch": 0.81, "learning_rate": 4.400335846667128e-07, "loss": 0.8743, "step": 43145 }, { "epoch": 0.81, "learning_rate": 4.399470301350192e-07, "loss": 0.8375, "step": 43146 }, { "epoch": 0.81, "learning_rate": 4.398604832954989e-07, "loss": 0.99, "step": 43147 }, { "epoch": 0.81, "learning_rate": 4.397739441484777e-07, "loss": 0.7234, "step": 43148 }, { "epoch": 0.81, "learning_rate": 4.396874126942768e-07, "loss": 0.9702, "step": 43149 }, { "epoch": 0.81, "learning_rate": 4.3960088893321986e-07, "loss": 0.8931, "step": 43150 }, { "epoch": 0.81, "learning_rate": 4.395143728656301e-07, "loss": 1.0114, "step": 43151 }, { "epoch": 0.81, "learning_rate": 4.394278644918304e-07, "loss": 0.9186, "step": 43152 }, { "epoch": 0.81, "learning_rate": 4.393413638121438e-07, "loss": 1.1431, "step": 43153 }, { "epoch": 0.81, "learning_rate": 4.3925487082689374e-07, "loss": 0.8344, "step": 43154 }, { "epoch": 0.81, "learning_rate": 4.391683855364032e-07, "loss": 0.8918, "step": 43155 }, { "epoch": 0.81, "learning_rate": 4.3908190794099333e-07, "loss": 0.9683, "step": 43156 }, { "epoch": 0.81, "learning_rate": 4.3899543804098916e-07, "loss": 0.7424, "step": 43157 }, { "epoch": 0.81, "learning_rate": 4.389089758367135e-07, "loss": 0.8162, "step": 43158 }, { "epoch": 0.81, "learning_rate": 4.3882252132848747e-07, "loss": 0.8932, "step": 43159 }, { "epoch": 0.81, "learning_rate": 4.387360745166358e-07, "loss": 0.8797, "step": 43160 }, { "epoch": 0.81, "learning_rate": 4.386496354014802e-07, "loss": 0.8342, "step": 43161 }, { "epoch": 0.81, "learning_rate": 4.385632039833435e-07, "loss": 1.0267, "step": 43162 }, { "epoch": 0.81, "learning_rate": 4.3847678026254836e-07, "loss": 0.982, "step": 43163 }, { "epoch": 0.81, "learning_rate": 4.38390364239418e-07, "loss": 0.9016, "step": 43164 }, { "epoch": 0.81, "learning_rate": 4.383039559142746e-07, "loss": 0.7736, "step": 43165 }, { "epoch": 0.81, "learning_rate": 4.3821755528744125e-07, "loss": 0.8949, "step": 43166 }, { "epoch": 0.81, "learning_rate": 4.3813116235924075e-07, "loss": 0.8696, "step": 43167 }, { "epoch": 0.81, "learning_rate": 4.3804477712999424e-07, "loss": 0.8733, "step": 43168 }, { "epoch": 0.81, "learning_rate": 4.379583996000264e-07, "loss": 0.9589, "step": 43169 }, { "epoch": 0.81, "learning_rate": 4.3787202976965817e-07, "loss": 0.7604, "step": 43170 }, { "epoch": 0.81, "learning_rate": 4.3778566763921226e-07, "loss": 0.7204, "step": 43171 }, { "epoch": 0.81, "learning_rate": 4.3769931320901184e-07, "loss": 0.7537, "step": 43172 }, { "epoch": 0.81, "learning_rate": 4.376129664793788e-07, "loss": 0.7689, "step": 43173 }, { "epoch": 0.81, "learning_rate": 4.375266274506357e-07, "loss": 1.1036, "step": 43174 }, { "epoch": 0.81, "learning_rate": 4.3744029612310474e-07, "loss": 1.0322, "step": 43175 }, { "epoch": 0.81, "learning_rate": 4.3735397249710933e-07, "loss": 0.9402, "step": 43176 }, { "epoch": 0.81, "learning_rate": 4.3726765657296974e-07, "loss": 0.8049, "step": 43177 }, { "epoch": 0.81, "learning_rate": 4.3718134835100984e-07, "loss": 0.6836, "step": 43178 }, { "epoch": 0.81, "learning_rate": 4.370950478315522e-07, "loss": 0.7316, "step": 43179 }, { "epoch": 0.81, "learning_rate": 4.370087550149174e-07, "loss": 1.079, "step": 43180 }, { "epoch": 0.81, "learning_rate": 4.369224699014299e-07, "loss": 1.1977, "step": 43181 }, { "epoch": 0.81, "learning_rate": 4.368361924914097e-07, "loss": 0.8173, "step": 43182 }, { "epoch": 0.81, "learning_rate": 4.3674992278518014e-07, "loss": 1.0312, "step": 43183 }, { "epoch": 0.81, "learning_rate": 4.366636607830632e-07, "loss": 0.751, "step": 43184 }, { "epoch": 0.81, "learning_rate": 4.365774064853806e-07, "loss": 0.9398, "step": 43185 }, { "epoch": 0.81, "learning_rate": 4.364911598924548e-07, "loss": 0.7932, "step": 43186 }, { "epoch": 0.81, "learning_rate": 4.3640492100460783e-07, "loss": 1.1254, "step": 43187 }, { "epoch": 0.81, "learning_rate": 4.363186898221622e-07, "loss": 1.0239, "step": 43188 }, { "epoch": 0.81, "learning_rate": 4.362324663454381e-07, "loss": 1.0103, "step": 43189 }, { "epoch": 0.81, "learning_rate": 4.361462505747599e-07, "loss": 0.8533, "step": 43190 }, { "epoch": 0.81, "learning_rate": 4.360600425104478e-07, "loss": 0.9409, "step": 43191 }, { "epoch": 0.81, "learning_rate": 4.35973842152824e-07, "loss": 0.8304, "step": 43192 }, { "epoch": 0.81, "learning_rate": 4.358876495022107e-07, "loss": 0.9822, "step": 43193 }, { "epoch": 0.81, "learning_rate": 4.358014645589295e-07, "loss": 1.036, "step": 43194 }, { "epoch": 0.81, "learning_rate": 4.357152873233025e-07, "loss": 0.9408, "step": 43195 }, { "epoch": 0.81, "learning_rate": 4.356291177956512e-07, "loss": 0.5389, "step": 43196 }, { "epoch": 0.81, "learning_rate": 4.355429559762983e-07, "loss": 0.7817, "step": 43197 }, { "epoch": 0.82, "learning_rate": 4.3545680186556333e-07, "loss": 0.9731, "step": 43198 }, { "epoch": 0.82, "learning_rate": 4.353706554637702e-07, "loss": 1.1295, "step": 43199 }, { "epoch": 0.82, "learning_rate": 4.3528451677123995e-07, "loss": 1.1105, "step": 43200 }, { "epoch": 0.82, "learning_rate": 4.35198385788293e-07, "loss": 0.8811, "step": 43201 }, { "epoch": 0.82, "learning_rate": 4.351122625152532e-07, "loss": 0.9223, "step": 43202 }, { "epoch": 0.82, "learning_rate": 4.3502614695244026e-07, "loss": 0.9053, "step": 43203 }, { "epoch": 0.82, "learning_rate": 4.349400391001765e-07, "loss": 0.8975, "step": 43204 }, { "epoch": 0.82, "learning_rate": 4.348539389587833e-07, "loss": 0.8625, "step": 43205 }, { "epoch": 0.82, "learning_rate": 4.3476784652858206e-07, "loss": 1.0547, "step": 43206 }, { "epoch": 0.82, "learning_rate": 4.346817618098942e-07, "loss": 0.684, "step": 43207 }, { "epoch": 0.82, "learning_rate": 4.3459568480304166e-07, "loss": 0.7739, "step": 43208 }, { "epoch": 0.82, "learning_rate": 4.3450961550834584e-07, "loss": 1.0031, "step": 43209 }, { "epoch": 0.82, "learning_rate": 4.3442355392612684e-07, "loss": 0.8503, "step": 43210 }, { "epoch": 0.82, "learning_rate": 4.3433750005670795e-07, "loss": 0.8553, "step": 43211 }, { "epoch": 0.82, "learning_rate": 4.342514539004089e-07, "loss": 1.1432, "step": 43212 }, { "epoch": 0.82, "learning_rate": 4.341654154575511e-07, "loss": 1.104, "step": 43213 }, { "epoch": 0.82, "learning_rate": 4.3407938472845746e-07, "loss": 0.8699, "step": 43214 }, { "epoch": 0.82, "learning_rate": 4.3399336171344733e-07, "loss": 0.9014, "step": 43215 }, { "epoch": 0.82, "learning_rate": 4.339073464128429e-07, "loss": 0.8321, "step": 43216 }, { "epoch": 0.82, "learning_rate": 4.338213388269649e-07, "loss": 0.85, "step": 43217 }, { "epoch": 0.82, "learning_rate": 4.337353389561347e-07, "loss": 0.899, "step": 43218 }, { "epoch": 0.82, "learning_rate": 4.3364934680067333e-07, "loss": 0.9189, "step": 43219 }, { "epoch": 0.82, "learning_rate": 4.3356336236090204e-07, "loss": 0.8651, "step": 43220 }, { "epoch": 0.82, "learning_rate": 4.334773856371424e-07, "loss": 0.8598, "step": 43221 }, { "epoch": 0.82, "learning_rate": 4.333914166297137e-07, "loss": 0.8428, "step": 43222 }, { "epoch": 0.82, "learning_rate": 4.3330545533893905e-07, "loss": 0.9479, "step": 43223 }, { "epoch": 0.82, "learning_rate": 4.3321950176513804e-07, "loss": 1.0018, "step": 43224 }, { "epoch": 0.82, "learning_rate": 4.331335559086322e-07, "loss": 0.9063, "step": 43225 }, { "epoch": 0.82, "learning_rate": 4.330476177697421e-07, "loss": 1.0391, "step": 43226 }, { "epoch": 0.82, "learning_rate": 4.329616873487888e-07, "loss": 0.7472, "step": 43227 }, { "epoch": 0.82, "learning_rate": 4.328757646460932e-07, "loss": 0.968, "step": 43228 }, { "epoch": 0.82, "learning_rate": 4.327898496619762e-07, "loss": 0.8214, "step": 43229 }, { "epoch": 0.82, "learning_rate": 4.327039423967588e-07, "loss": 0.8852, "step": 43230 }, { "epoch": 0.82, "learning_rate": 4.3261804285076064e-07, "loss": 1.2183, "step": 43231 }, { "epoch": 0.82, "learning_rate": 4.325321510243044e-07, "loss": 0.9724, "step": 43232 }, { "epoch": 0.82, "learning_rate": 4.324462669177093e-07, "loss": 0.9662, "step": 43233 }, { "epoch": 0.82, "learning_rate": 4.323603905312956e-07, "loss": 1.0317, "step": 43234 }, { "epoch": 0.82, "learning_rate": 4.322745218653862e-07, "loss": 0.9173, "step": 43235 }, { "epoch": 0.82, "learning_rate": 4.3218866092029936e-07, "loss": 1.0217, "step": 43236 }, { "epoch": 0.82, "learning_rate": 4.321028076963571e-07, "loss": 1.0789, "step": 43237 }, { "epoch": 0.82, "learning_rate": 4.320169621938794e-07, "loss": 1.0494, "step": 43238 }, { "epoch": 0.82, "learning_rate": 4.3193112441318683e-07, "loss": 1.1049, "step": 43239 }, { "epoch": 0.82, "learning_rate": 4.318452943546003e-07, "loss": 0.9744, "step": 43240 }, { "epoch": 0.82, "learning_rate": 4.3175947201843984e-07, "loss": 0.8644, "step": 43241 }, { "epoch": 0.82, "learning_rate": 4.316736574050268e-07, "loss": 0.9814, "step": 43242 }, { "epoch": 0.82, "learning_rate": 4.315878505146795e-07, "loss": 1.0674, "step": 43243 }, { "epoch": 0.82, "learning_rate": 4.315020513477211e-07, "loss": 0.983, "step": 43244 }, { "epoch": 0.82, "learning_rate": 4.3141625990446995e-07, "loss": 0.9311, "step": 43245 }, { "epoch": 0.82, "learning_rate": 4.3133047618524713e-07, "loss": 0.8587, "step": 43246 }, { "epoch": 0.82, "learning_rate": 4.3124470019037303e-07, "loss": 0.8611, "step": 43247 }, { "epoch": 0.82, "learning_rate": 4.3115893192016756e-07, "loss": 0.8522, "step": 43248 }, { "epoch": 0.82, "learning_rate": 4.310731713749514e-07, "loss": 0.9161, "step": 43249 }, { "epoch": 0.82, "learning_rate": 4.3098741855504447e-07, "loss": 0.9647, "step": 43250 }, { "epoch": 0.82, "learning_rate": 4.3090167346076767e-07, "loss": 0.7126, "step": 43251 }, { "epoch": 0.82, "learning_rate": 4.308159360924391e-07, "loss": 0.7632, "step": 43252 }, { "epoch": 0.82, "learning_rate": 4.307302064503821e-07, "loss": 0.8037, "step": 43253 }, { "epoch": 0.82, "learning_rate": 4.306444845349142e-07, "loss": 0.6926, "step": 43254 }, { "epoch": 0.82, "learning_rate": 4.305587703463557e-07, "loss": 1.0115, "step": 43255 }, { "epoch": 0.82, "learning_rate": 4.304730638850285e-07, "loss": 0.8214, "step": 43256 }, { "epoch": 0.82, "learning_rate": 4.303873651512511e-07, "loss": 0.886, "step": 43257 }, { "epoch": 0.82, "learning_rate": 4.303016741453436e-07, "loss": 0.758, "step": 43258 }, { "epoch": 0.82, "learning_rate": 4.3021599086762623e-07, "loss": 0.8084, "step": 43259 }, { "epoch": 0.82, "learning_rate": 4.301303153184189e-07, "loss": 0.7581, "step": 43260 }, { "epoch": 0.82, "learning_rate": 4.300446474980413e-07, "loss": 0.9369, "step": 43261 }, { "epoch": 0.82, "learning_rate": 4.2995898740681383e-07, "loss": 0.9083, "step": 43262 }, { "epoch": 0.82, "learning_rate": 4.2987333504505654e-07, "loss": 0.8991, "step": 43263 }, { "epoch": 0.82, "learning_rate": 4.2978769041308735e-07, "loss": 0.7907, "step": 43264 }, { "epoch": 0.82, "learning_rate": 4.2970205351122893e-07, "loss": 0.8158, "step": 43265 }, { "epoch": 0.82, "learning_rate": 4.2961642433979876e-07, "loss": 0.7418, "step": 43266 }, { "epoch": 0.82, "learning_rate": 4.2953080289911743e-07, "loss": 0.9534, "step": 43267 }, { "epoch": 0.82, "learning_rate": 4.294451891895046e-07, "loss": 1.1067, "step": 43268 }, { "epoch": 0.82, "learning_rate": 4.2935958321128014e-07, "loss": 1.0092, "step": 43269 }, { "epoch": 0.82, "learning_rate": 4.292739849647634e-07, "loss": 0.9607, "step": 43270 }, { "epoch": 0.82, "learning_rate": 4.291883944502739e-07, "loss": 1.049, "step": 43271 }, { "epoch": 0.82, "learning_rate": 4.2910281166813226e-07, "loss": 0.8412, "step": 43272 }, { "epoch": 0.82, "learning_rate": 4.2901723661865597e-07, "loss": 0.783, "step": 43273 }, { "epoch": 0.82, "learning_rate": 4.2893166930216723e-07, "loss": 0.8448, "step": 43274 }, { "epoch": 0.82, "learning_rate": 4.288461097189833e-07, "loss": 0.9024, "step": 43275 }, { "epoch": 0.82, "learning_rate": 4.287605578694237e-07, "loss": 1.2035, "step": 43276 }, { "epoch": 0.82, "learning_rate": 4.2867501375381037e-07, "loss": 0.8593, "step": 43277 }, { "epoch": 0.82, "learning_rate": 4.2858947737246e-07, "loss": 0.8302, "step": 43278 }, { "epoch": 0.82, "learning_rate": 4.2850394872569313e-07, "loss": 0.7594, "step": 43279 }, { "epoch": 0.82, "learning_rate": 4.2841842781382923e-07, "loss": 1.2035, "step": 43280 }, { "epoch": 0.82, "learning_rate": 4.28332914637187e-07, "loss": 1.0367, "step": 43281 }, { "epoch": 0.82, "learning_rate": 4.2824740919608644e-07, "loss": 0.8488, "step": 43282 }, { "epoch": 0.82, "learning_rate": 4.281619114908464e-07, "loss": 0.8067, "step": 43283 }, { "epoch": 0.82, "learning_rate": 4.2807642152178695e-07, "loss": 0.7895, "step": 43284 }, { "epoch": 0.82, "learning_rate": 4.2799093928922536e-07, "loss": 0.8378, "step": 43285 }, { "epoch": 0.82, "learning_rate": 4.279054647934833e-07, "loss": 0.7523, "step": 43286 }, { "epoch": 0.82, "learning_rate": 4.2781999803487824e-07, "loss": 0.9904, "step": 43287 }, { "epoch": 0.82, "learning_rate": 4.277345390137297e-07, "loss": 0.9235, "step": 43288 }, { "epoch": 0.82, "learning_rate": 4.2764908773035656e-07, "loss": 0.8617, "step": 43289 }, { "epoch": 0.82, "learning_rate": 4.2756364418507864e-07, "loss": 1.1464, "step": 43290 }, { "epoch": 0.82, "learning_rate": 4.274782083782142e-07, "loss": 0.7504, "step": 43291 }, { "epoch": 0.82, "learning_rate": 4.2739278031008276e-07, "loss": 1.0106, "step": 43292 }, { "epoch": 0.82, "learning_rate": 4.2730735998100347e-07, "loss": 0.9969, "step": 43293 }, { "epoch": 0.82, "learning_rate": 4.272219473912939e-07, "loss": 0.7652, "step": 43294 }, { "epoch": 0.82, "learning_rate": 4.2713654254127544e-07, "loss": 0.8745, "step": 43295 }, { "epoch": 0.82, "learning_rate": 4.270511454312648e-07, "loss": 0.9177, "step": 43296 }, { "epoch": 0.82, "learning_rate": 4.2696575606158086e-07, "loss": 0.9938, "step": 43297 }, { "epoch": 0.82, "learning_rate": 4.268803744325448e-07, "loss": 0.7298, "step": 43298 }, { "epoch": 0.82, "learning_rate": 4.2679500054447294e-07, "loss": 0.9744, "step": 43299 }, { "epoch": 0.82, "learning_rate": 4.267096343976851e-07, "loss": 0.9768, "step": 43300 }, { "epoch": 0.82, "learning_rate": 4.266242759924999e-07, "loss": 0.9015, "step": 43301 }, { "epoch": 0.82, "learning_rate": 4.265389253292362e-07, "loss": 0.8917, "step": 43302 }, { "epoch": 0.82, "learning_rate": 4.264535824082125e-07, "loss": 0.8595, "step": 43303 }, { "epoch": 0.82, "learning_rate": 4.263682472297473e-07, "loss": 0.8053, "step": 43304 }, { "epoch": 0.82, "learning_rate": 4.262829197941604e-07, "loss": 0.8485, "step": 43305 }, { "epoch": 0.82, "learning_rate": 4.261976001017687e-07, "loss": 1.1049, "step": 43306 }, { "epoch": 0.82, "learning_rate": 4.2611228815289176e-07, "loss": 1.021, "step": 43307 }, { "epoch": 0.82, "learning_rate": 4.2602698394784784e-07, "loss": 1.0588, "step": 43308 }, { "epoch": 0.82, "learning_rate": 4.259416874869557e-07, "loss": 0.8667, "step": 43309 }, { "epoch": 0.82, "learning_rate": 4.258563987705336e-07, "loss": 0.9095, "step": 43310 }, { "epoch": 0.82, "learning_rate": 4.257711177989002e-07, "loss": 0.8788, "step": 43311 }, { "epoch": 0.82, "learning_rate": 4.256858445723741e-07, "loss": 0.9898, "step": 43312 }, { "epoch": 0.82, "learning_rate": 4.256005790912726e-07, "loss": 1.1085, "step": 43313 }, { "epoch": 0.82, "learning_rate": 4.25515321355916e-07, "loss": 0.8784, "step": 43314 }, { "epoch": 0.82, "learning_rate": 4.2543007136662123e-07, "loss": 0.9977, "step": 43315 }, { "epoch": 0.82, "learning_rate": 4.253448291237067e-07, "loss": 1.0066, "step": 43316 }, { "epoch": 0.82, "learning_rate": 4.2525959462749095e-07, "loss": 0.8949, "step": 43317 }, { "epoch": 0.82, "learning_rate": 4.2517436787829243e-07, "loss": 0.9411, "step": 43318 }, { "epoch": 0.82, "learning_rate": 4.2508914887642916e-07, "loss": 0.8524, "step": 43319 }, { "epoch": 0.82, "learning_rate": 4.2500393762221923e-07, "loss": 0.8411, "step": 43320 }, { "epoch": 0.82, "learning_rate": 4.249187341159819e-07, "loss": 0.8496, "step": 43321 }, { "epoch": 0.82, "learning_rate": 4.2483353835803293e-07, "loss": 0.9504, "step": 43322 }, { "epoch": 0.82, "learning_rate": 4.2474835034869264e-07, "loss": 0.7276, "step": 43323 }, { "epoch": 0.82, "learning_rate": 4.246631700882789e-07, "loss": 0.8788, "step": 43324 }, { "epoch": 0.82, "learning_rate": 4.2457799757710805e-07, "loss": 0.9768, "step": 43325 }, { "epoch": 0.82, "learning_rate": 4.244928328155004e-07, "loss": 0.7811, "step": 43326 }, { "epoch": 0.82, "learning_rate": 4.244076758037724e-07, "loss": 0.9157, "step": 43327 }, { "epoch": 0.82, "learning_rate": 4.2432252654224263e-07, "loss": 0.7892, "step": 43328 }, { "epoch": 0.82, "learning_rate": 4.242373850312287e-07, "loss": 0.7887, "step": 43329 }, { "epoch": 0.82, "learning_rate": 4.2415225127104886e-07, "loss": 1.1185, "step": 43330 }, { "epoch": 0.82, "learning_rate": 4.2406712526202097e-07, "loss": 1.1002, "step": 43331 }, { "epoch": 0.82, "learning_rate": 4.239820070044626e-07, "loss": 1.0393, "step": 43332 }, { "epoch": 0.82, "learning_rate": 4.238968964986923e-07, "loss": 1.0111, "step": 43333 }, { "epoch": 0.82, "learning_rate": 4.2381179374502617e-07, "loss": 0.687, "step": 43334 }, { "epoch": 0.82, "learning_rate": 4.2372669874378464e-07, "loss": 0.8946, "step": 43335 }, { "epoch": 0.82, "learning_rate": 4.2364161149528295e-07, "loss": 0.8492, "step": 43336 }, { "epoch": 0.82, "learning_rate": 4.2355653199984e-07, "loss": 1.2101, "step": 43337 }, { "epoch": 0.82, "learning_rate": 4.234714602577733e-07, "loss": 0.868, "step": 43338 }, { "epoch": 0.82, "learning_rate": 4.233863962694004e-07, "loss": 0.9363, "step": 43339 }, { "epoch": 0.82, "learning_rate": 4.2330134003503913e-07, "loss": 0.7724, "step": 43340 }, { "epoch": 0.82, "learning_rate": 4.23216291555007e-07, "loss": 0.9729, "step": 43341 }, { "epoch": 0.82, "learning_rate": 4.2313125082962233e-07, "loss": 0.8823, "step": 43342 }, { "epoch": 0.82, "learning_rate": 4.230462178592004e-07, "loss": 1.001, "step": 43343 }, { "epoch": 0.82, "learning_rate": 4.229611926440608e-07, "loss": 1.1077, "step": 43344 }, { "epoch": 0.82, "learning_rate": 4.228761751845212e-07, "loss": 0.7934, "step": 43345 }, { "epoch": 0.82, "learning_rate": 4.2279116548089695e-07, "loss": 0.7866, "step": 43346 }, { "epoch": 0.82, "learning_rate": 4.2270616353350805e-07, "loss": 0.8936, "step": 43347 }, { "epoch": 0.82, "learning_rate": 4.2262116934267016e-07, "loss": 0.7513, "step": 43348 }, { "epoch": 0.82, "learning_rate": 4.22536182908701e-07, "loss": 0.8656, "step": 43349 }, { "epoch": 0.82, "learning_rate": 4.2245120423191815e-07, "loss": 0.9798, "step": 43350 }, { "epoch": 0.82, "learning_rate": 4.223662333126385e-07, "loss": 0.7241, "step": 43351 }, { "epoch": 0.82, "learning_rate": 4.2228127015117997e-07, "loss": 0.8928, "step": 43352 }, { "epoch": 0.82, "learning_rate": 4.2219631474785945e-07, "loss": 0.9438, "step": 43353 }, { "epoch": 0.82, "learning_rate": 4.2211136710299444e-07, "loss": 0.8434, "step": 43354 }, { "epoch": 0.82, "learning_rate": 4.2202642721690114e-07, "loss": 0.9879, "step": 43355 }, { "epoch": 0.82, "learning_rate": 4.219414950898984e-07, "loss": 0.9554, "step": 43356 }, { "epoch": 0.82, "learning_rate": 4.2185657072230183e-07, "loss": 1.0266, "step": 43357 }, { "epoch": 0.82, "learning_rate": 4.21771654114429e-07, "loss": 0.9647, "step": 43358 }, { "epoch": 0.82, "learning_rate": 4.2168674526659707e-07, "loss": 0.9813, "step": 43359 }, { "epoch": 0.82, "learning_rate": 4.2160184417912336e-07, "loss": 0.9016, "step": 43360 }, { "epoch": 0.82, "learning_rate": 4.215169508523245e-07, "loss": 0.8911, "step": 43361 }, { "epoch": 0.82, "learning_rate": 4.214320652865178e-07, "loss": 0.9496, "step": 43362 }, { "epoch": 0.82, "learning_rate": 4.2134718748202047e-07, "loss": 1.0493, "step": 43363 }, { "epoch": 0.82, "learning_rate": 4.212623174391478e-07, "loss": 0.8188, "step": 43364 }, { "epoch": 0.82, "learning_rate": 4.2117745515821845e-07, "loss": 0.9062, "step": 43365 }, { "epoch": 0.82, "learning_rate": 4.210926006395494e-07, "loss": 0.7582, "step": 43366 }, { "epoch": 0.82, "learning_rate": 4.210077538834556e-07, "loss": 0.7366, "step": 43367 }, { "epoch": 0.82, "learning_rate": 4.209229148902563e-07, "loss": 0.8036, "step": 43368 }, { "epoch": 0.82, "learning_rate": 4.2083808366026656e-07, "loss": 0.9702, "step": 43369 }, { "epoch": 0.82, "learning_rate": 4.207532601938036e-07, "loss": 0.8127, "step": 43370 }, { "epoch": 0.82, "learning_rate": 4.2066844449118434e-07, "loss": 0.7507, "step": 43371 }, { "epoch": 0.82, "learning_rate": 4.2058363655272524e-07, "loss": 1.0086, "step": 43372 }, { "epoch": 0.82, "learning_rate": 4.204988363787432e-07, "loss": 0.9892, "step": 43373 }, { "epoch": 0.82, "learning_rate": 4.2041404396955477e-07, "loss": 1.1044, "step": 43374 }, { "epoch": 0.82, "learning_rate": 4.203292593254768e-07, "loss": 0.9859, "step": 43375 }, { "epoch": 0.82, "learning_rate": 4.2024448244682467e-07, "loss": 0.9512, "step": 43376 }, { "epoch": 0.82, "learning_rate": 4.201597133339172e-07, "loss": 0.9741, "step": 43377 }, { "epoch": 0.82, "learning_rate": 4.2007495198706866e-07, "loss": 0.9214, "step": 43378 }, { "epoch": 0.82, "learning_rate": 4.1999019840659685e-07, "loss": 0.8626, "step": 43379 }, { "epoch": 0.82, "learning_rate": 4.199054525928176e-07, "loss": 0.648, "step": 43380 }, { "epoch": 0.82, "learning_rate": 4.1982071454604784e-07, "loss": 0.9656, "step": 43381 }, { "epoch": 0.82, "learning_rate": 4.197359842666035e-07, "loss": 0.9439, "step": 43382 }, { "epoch": 0.82, "learning_rate": 4.196512617548013e-07, "loss": 0.9795, "step": 43383 }, { "epoch": 0.82, "learning_rate": 4.195665470109581e-07, "loss": 0.7456, "step": 43384 }, { "epoch": 0.82, "learning_rate": 4.194818400353884e-07, "loss": 0.8117, "step": 43385 }, { "epoch": 0.82, "learning_rate": 4.193971408284103e-07, "loss": 0.8082, "step": 43386 }, { "epoch": 0.82, "learning_rate": 4.1931244939034026e-07, "loss": 1.2582, "step": 43387 }, { "epoch": 0.82, "learning_rate": 4.192277657214924e-07, "loss": 0.9671, "step": 43388 }, { "epoch": 0.82, "learning_rate": 4.191430898221854e-07, "loss": 0.9299, "step": 43389 }, { "epoch": 0.82, "learning_rate": 4.19058421692734e-07, "loss": 0.8047, "step": 43390 }, { "epoch": 0.82, "learning_rate": 4.1897376133345436e-07, "loss": 0.8951, "step": 43391 }, { "epoch": 0.82, "learning_rate": 4.188891087446631e-07, "loss": 1.1689, "step": 43392 }, { "epoch": 0.82, "learning_rate": 4.1880446392667586e-07, "loss": 1.0758, "step": 43393 }, { "epoch": 0.82, "learning_rate": 4.18719826879809e-07, "loss": 0.9474, "step": 43394 }, { "epoch": 0.82, "learning_rate": 4.186351976043787e-07, "loss": 0.9134, "step": 43395 }, { "epoch": 0.82, "learning_rate": 4.185505761007011e-07, "loss": 0.9904, "step": 43396 }, { "epoch": 0.82, "learning_rate": 4.1846596236909067e-07, "loss": 0.7426, "step": 43397 }, { "epoch": 0.82, "learning_rate": 4.183813564098657e-07, "loss": 0.7575, "step": 43398 }, { "epoch": 0.82, "learning_rate": 4.182967582233405e-07, "loss": 0.8881, "step": 43399 }, { "epoch": 0.82, "learning_rate": 4.182121678098314e-07, "loss": 1.2787, "step": 43400 }, { "epoch": 0.82, "learning_rate": 4.1812758516965395e-07, "loss": 1.0175, "step": 43401 }, { "epoch": 0.82, "learning_rate": 4.1804301030312436e-07, "loss": 0.864, "step": 43402 }, { "epoch": 0.82, "learning_rate": 4.179584432105585e-07, "loss": 0.5046, "step": 43403 }, { "epoch": 0.82, "learning_rate": 4.178738838922719e-07, "loss": 0.8378, "step": 43404 }, { "epoch": 0.82, "learning_rate": 4.17789332348581e-07, "loss": 0.933, "step": 43405 }, { "epoch": 0.82, "learning_rate": 4.1770478857979966e-07, "loss": 1.0729, "step": 43406 }, { "epoch": 0.82, "learning_rate": 4.1762025258624523e-07, "loss": 0.984, "step": 43407 }, { "epoch": 0.82, "learning_rate": 4.175357243682338e-07, "loss": 0.8561, "step": 43408 }, { "epoch": 0.82, "learning_rate": 4.174512039260789e-07, "loss": 0.8782, "step": 43409 }, { "epoch": 0.82, "learning_rate": 4.173666912600985e-07, "loss": 0.7776, "step": 43410 }, { "epoch": 0.82, "learning_rate": 4.1728218637060643e-07, "loss": 0.9238, "step": 43411 }, { "epoch": 0.82, "learning_rate": 4.1719768925791855e-07, "loss": 1.0513, "step": 43412 }, { "epoch": 0.82, "learning_rate": 4.17113199922351e-07, "loss": 1.0074, "step": 43413 }, { "epoch": 0.82, "learning_rate": 4.170287183642188e-07, "loss": 0.7162, "step": 43414 }, { "epoch": 0.82, "learning_rate": 4.1694424458383733e-07, "loss": 0.8736, "step": 43415 }, { "epoch": 0.82, "learning_rate": 4.1685977858152235e-07, "loss": 0.6271, "step": 43416 }, { "epoch": 0.82, "learning_rate": 4.167753203575897e-07, "loss": 0.8428, "step": 43417 }, { "epoch": 0.82, "learning_rate": 4.166908699123529e-07, "loss": 0.9135, "step": 43418 }, { "epoch": 0.82, "learning_rate": 4.1660642724612954e-07, "loss": 1.0417, "step": 43419 }, { "epoch": 0.82, "learning_rate": 4.165219923592334e-07, "loss": 0.8506, "step": 43420 }, { "epoch": 0.82, "learning_rate": 4.1643756525198033e-07, "loss": 0.9148, "step": 43421 }, { "epoch": 0.82, "learning_rate": 4.1635314592468556e-07, "loss": 0.9529, "step": 43422 }, { "epoch": 0.82, "learning_rate": 4.1626873437766417e-07, "loss": 0.925, "step": 43423 }, { "epoch": 0.82, "learning_rate": 4.1618433061123146e-07, "loss": 0.9821, "step": 43424 }, { "epoch": 0.82, "learning_rate": 4.1609993462570276e-07, "loss": 0.9865, "step": 43425 }, { "epoch": 0.82, "learning_rate": 4.160155464213933e-07, "loss": 0.7699, "step": 43426 }, { "epoch": 0.82, "learning_rate": 4.159311659986168e-07, "loss": 0.8671, "step": 43427 }, { "epoch": 0.82, "learning_rate": 4.158467933576901e-07, "loss": 0.7962, "step": 43428 }, { "epoch": 0.82, "learning_rate": 4.157624284989281e-07, "loss": 0.9188, "step": 43429 }, { "epoch": 0.82, "learning_rate": 4.156780714226441e-07, "loss": 0.8794, "step": 43430 }, { "epoch": 0.82, "learning_rate": 4.1559372212915535e-07, "loss": 0.9972, "step": 43431 }, { "epoch": 0.82, "learning_rate": 4.1550938061877543e-07, "loss": 0.9809, "step": 43432 }, { "epoch": 0.82, "learning_rate": 4.1542504689181916e-07, "loss": 0.8331, "step": 43433 }, { "epoch": 0.82, "learning_rate": 4.1534072094860213e-07, "loss": 0.8251, "step": 43434 }, { "epoch": 0.82, "learning_rate": 4.15256402789439e-07, "loss": 0.7979, "step": 43435 }, { "epoch": 0.82, "learning_rate": 4.1517209241464433e-07, "loss": 0.7192, "step": 43436 }, { "epoch": 0.82, "learning_rate": 4.150877898245334e-07, "loss": 1.0522, "step": 43437 }, { "epoch": 0.82, "learning_rate": 4.150034950194212e-07, "loss": 0.9368, "step": 43438 }, { "epoch": 0.82, "learning_rate": 4.149192079996206e-07, "loss": 0.9364, "step": 43439 }, { "epoch": 0.82, "learning_rate": 4.1483492876544933e-07, "loss": 0.8081, "step": 43440 }, { "epoch": 0.82, "learning_rate": 4.147506573172197e-07, "loss": 1.0013, "step": 43441 }, { "epoch": 0.82, "learning_rate": 4.1466639365524726e-07, "loss": 0.7007, "step": 43442 }, { "epoch": 0.82, "learning_rate": 4.1458213777984647e-07, "loss": 1.0298, "step": 43443 }, { "epoch": 0.82, "learning_rate": 4.1449788969133207e-07, "loss": 1.0844, "step": 43444 }, { "epoch": 0.82, "learning_rate": 4.144136493900186e-07, "loss": 0.8588, "step": 43445 }, { "epoch": 0.82, "learning_rate": 4.1432941687622073e-07, "loss": 0.7465, "step": 43446 }, { "epoch": 0.82, "learning_rate": 4.142451921502533e-07, "loss": 0.8135, "step": 43447 }, { "epoch": 0.82, "learning_rate": 4.141609752124293e-07, "loss": 0.8219, "step": 43448 }, { "epoch": 0.82, "learning_rate": 4.1407676606306487e-07, "loss": 1.1342, "step": 43449 }, { "epoch": 0.82, "learning_rate": 4.1399256470247423e-07, "loss": 1.026, "step": 43450 }, { "epoch": 0.82, "learning_rate": 4.139083711309705e-07, "loss": 0.865, "step": 43451 }, { "epoch": 0.82, "learning_rate": 4.1382418534886976e-07, "loss": 0.8976, "step": 43452 }, { "epoch": 0.82, "learning_rate": 4.137400073564854e-07, "loss": 0.956, "step": 43453 }, { "epoch": 0.82, "learning_rate": 4.136558371541316e-07, "loss": 0.749, "step": 43454 }, { "epoch": 0.82, "learning_rate": 4.1357167474212284e-07, "loss": 1.087, "step": 43455 }, { "epoch": 0.82, "learning_rate": 4.1348752012077386e-07, "loss": 0.8801, "step": 43456 }, { "epoch": 0.82, "learning_rate": 4.134033732903983e-07, "loss": 0.9675, "step": 43457 }, { "epoch": 0.82, "learning_rate": 4.1331923425131036e-07, "loss": 0.9772, "step": 43458 }, { "epoch": 0.82, "learning_rate": 4.1323510300382534e-07, "loss": 0.8591, "step": 43459 }, { "epoch": 0.82, "learning_rate": 4.131509795482552e-07, "loss": 0.7816, "step": 43460 }, { "epoch": 0.82, "learning_rate": 4.130668638849164e-07, "loss": 0.8191, "step": 43461 }, { "epoch": 0.82, "learning_rate": 4.129827560141214e-07, "loss": 1.0493, "step": 43462 }, { "epoch": 0.82, "learning_rate": 4.1289865593618474e-07, "loss": 1.0655, "step": 43463 }, { "epoch": 0.82, "learning_rate": 4.128145636514205e-07, "loss": 0.7729, "step": 43464 }, { "epoch": 0.82, "learning_rate": 4.1273047916014276e-07, "loss": 0.8462, "step": 43465 }, { "epoch": 0.82, "learning_rate": 4.126464024626656e-07, "loss": 0.7115, "step": 43466 }, { "epoch": 0.82, "learning_rate": 4.1256233355930266e-07, "loss": 0.9177, "step": 43467 }, { "epoch": 0.82, "learning_rate": 4.124782724503684e-07, "loss": 1.005, "step": 43468 }, { "epoch": 0.82, "learning_rate": 4.1239421913617516e-07, "loss": 1.1592, "step": 43469 }, { "epoch": 0.82, "learning_rate": 4.1231017361703847e-07, "loss": 0.816, "step": 43470 }, { "epoch": 0.82, "learning_rate": 4.122261358932722e-07, "loss": 0.8088, "step": 43471 }, { "epoch": 0.82, "learning_rate": 4.121421059651884e-07, "loss": 0.8875, "step": 43472 }, { "epoch": 0.82, "learning_rate": 4.120580838331029e-07, "loss": 0.7538, "step": 43473 }, { "epoch": 0.82, "learning_rate": 4.1197406949732813e-07, "loss": 0.8714, "step": 43474 }, { "epoch": 0.82, "learning_rate": 4.118900629581782e-07, "loss": 1.0156, "step": 43475 }, { "epoch": 0.82, "learning_rate": 4.118060642159666e-07, "loss": 0.8713, "step": 43476 }, { "epoch": 0.82, "learning_rate": 4.117220732710073e-07, "loss": 0.84, "step": 43477 }, { "epoch": 0.82, "learning_rate": 4.116380901236136e-07, "loss": 0.9868, "step": 43478 }, { "epoch": 0.82, "learning_rate": 4.115541147740992e-07, "loss": 0.6698, "step": 43479 }, { "epoch": 0.82, "learning_rate": 4.1147014722277863e-07, "loss": 0.9544, "step": 43480 }, { "epoch": 0.82, "learning_rate": 4.113861874699629e-07, "loss": 1.0941, "step": 43481 }, { "epoch": 0.82, "learning_rate": 4.1130223551596847e-07, "loss": 0.9713, "step": 43482 }, { "epoch": 0.82, "learning_rate": 4.112182913611068e-07, "loss": 0.9799, "step": 43483 }, { "epoch": 0.82, "learning_rate": 4.1113435500569203e-07, "loss": 0.8204, "step": 43484 }, { "epoch": 0.82, "learning_rate": 4.110504264500376e-07, "loss": 0.7021, "step": 43485 }, { "epoch": 0.82, "learning_rate": 4.1096650569445675e-07, "loss": 0.8775, "step": 43486 }, { "epoch": 0.82, "learning_rate": 4.108825927392629e-07, "loss": 0.9807, "step": 43487 }, { "epoch": 0.82, "learning_rate": 4.107986875847694e-07, "loss": 0.8117, "step": 43488 }, { "epoch": 0.82, "learning_rate": 4.1071479023129025e-07, "loss": 0.9957, "step": 43489 }, { "epoch": 0.82, "learning_rate": 4.106309006791367e-07, "loss": 1.0415, "step": 43490 }, { "epoch": 0.82, "learning_rate": 4.10547018928624e-07, "loss": 0.8818, "step": 43491 }, { "epoch": 0.82, "learning_rate": 4.104631449800653e-07, "loss": 0.9069, "step": 43492 }, { "epoch": 0.82, "learning_rate": 4.1037927883377183e-07, "loss": 1.0364, "step": 43493 }, { "epoch": 0.82, "learning_rate": 4.1029542049005914e-07, "loss": 0.9127, "step": 43494 }, { "epoch": 0.82, "learning_rate": 4.10211569949239e-07, "loss": 0.7718, "step": 43495 }, { "epoch": 0.82, "learning_rate": 4.101277272116247e-07, "loss": 0.5995, "step": 43496 }, { "epoch": 0.82, "learning_rate": 4.1004389227752904e-07, "loss": 0.7947, "step": 43497 }, { "epoch": 0.82, "learning_rate": 4.099600651472657e-07, "loss": 0.9206, "step": 43498 }, { "epoch": 0.82, "learning_rate": 4.098762458211475e-07, "loss": 1.0128, "step": 43499 }, { "epoch": 0.82, "learning_rate": 4.097924342994872e-07, "loss": 1.0197, "step": 43500 }, { "epoch": 0.82, "learning_rate": 4.097086305825984e-07, "loss": 0.8423, "step": 43501 }, { "epoch": 0.82, "learning_rate": 4.0962483467079233e-07, "loss": 0.7885, "step": 43502 }, { "epoch": 0.82, "learning_rate": 4.095410465643843e-07, "loss": 0.7786, "step": 43503 }, { "epoch": 0.82, "learning_rate": 4.094572662636853e-07, "loss": 0.8649, "step": 43504 }, { "epoch": 0.82, "learning_rate": 4.093734937690086e-07, "loss": 1.0074, "step": 43505 }, { "epoch": 0.82, "learning_rate": 4.092897290806672e-07, "loss": 0.9658, "step": 43506 }, { "epoch": 0.82, "learning_rate": 4.092059721989741e-07, "loss": 0.8709, "step": 43507 }, { "epoch": 0.82, "learning_rate": 4.0912222312424143e-07, "loss": 0.8535, "step": 43508 }, { "epoch": 0.82, "learning_rate": 4.0903848185678247e-07, "loss": 0.9601, "step": 43509 }, { "epoch": 0.82, "learning_rate": 4.0895474839691057e-07, "loss": 0.9228, "step": 43510 }, { "epoch": 0.82, "learning_rate": 4.088710227449361e-07, "loss": 0.8277, "step": 43511 }, { "epoch": 0.82, "learning_rate": 4.087873049011734e-07, "loss": 0.9952, "step": 43512 }, { "epoch": 0.82, "learning_rate": 4.087035948659357e-07, "loss": 1.0189, "step": 43513 }, { "epoch": 0.82, "learning_rate": 4.086198926395335e-07, "loss": 1.0647, "step": 43514 }, { "epoch": 0.82, "learning_rate": 4.0853619822228157e-07, "loss": 0.9075, "step": 43515 }, { "epoch": 0.82, "learning_rate": 4.084525116144908e-07, "loss": 0.8134, "step": 43516 }, { "epoch": 0.82, "learning_rate": 4.083688328164742e-07, "loss": 0.813, "step": 43517 }, { "epoch": 0.82, "learning_rate": 4.0828516182854437e-07, "loss": 1.0542, "step": 43518 }, { "epoch": 0.82, "learning_rate": 4.0820149865101353e-07, "loss": 1.0967, "step": 43519 }, { "epoch": 0.82, "learning_rate": 4.0811784328419426e-07, "loss": 1.0922, "step": 43520 }, { "epoch": 0.82, "learning_rate": 4.080341957283987e-07, "loss": 0.6389, "step": 43521 }, { "epoch": 0.82, "learning_rate": 4.0795055598393973e-07, "loss": 0.7103, "step": 43522 }, { "epoch": 0.82, "learning_rate": 4.078669240511282e-07, "loss": 0.8552, "step": 43523 }, { "epoch": 0.82, "learning_rate": 4.077832999302789e-07, "loss": 1.0368, "step": 43524 }, { "epoch": 0.82, "learning_rate": 4.0769968362170174e-07, "loss": 1.2766, "step": 43525 }, { "epoch": 0.82, "learning_rate": 4.076160751257097e-07, "loss": 0.9904, "step": 43526 }, { "epoch": 0.82, "learning_rate": 4.0753247444261513e-07, "loss": 0.8057, "step": 43527 }, { "epoch": 0.82, "learning_rate": 4.0744888157273036e-07, "loss": 1.0071, "step": 43528 }, { "epoch": 0.82, "learning_rate": 4.073652965163671e-07, "loss": 0.9316, "step": 43529 }, { "epoch": 0.82, "learning_rate": 4.0728171927383794e-07, "loss": 0.8207, "step": 43530 }, { "epoch": 0.82, "learning_rate": 4.07198149845455e-07, "loss": 1.0067, "step": 43531 }, { "epoch": 0.82, "learning_rate": 4.071145882315289e-07, "loss": 0.9979, "step": 43532 }, { "epoch": 0.82, "learning_rate": 4.070310344323733e-07, "loss": 0.8566, "step": 43533 }, { "epoch": 0.82, "learning_rate": 4.069474884483002e-07, "loss": 0.8664, "step": 43534 }, { "epoch": 0.82, "learning_rate": 4.0686395027961983e-07, "loss": 0.7944, "step": 43535 }, { "epoch": 0.82, "learning_rate": 4.067804199266467e-07, "loss": 0.7929, "step": 43536 }, { "epoch": 0.82, "learning_rate": 4.0669689738969067e-07, "loss": 0.9187, "step": 43537 }, { "epoch": 0.82, "learning_rate": 4.0661338266906407e-07, "loss": 0.9094, "step": 43538 }, { "epoch": 0.82, "learning_rate": 4.06529875765079e-07, "loss": 0.8892, "step": 43539 }, { "epoch": 0.82, "learning_rate": 4.0644637667804715e-07, "loss": 0.9107, "step": 43540 }, { "epoch": 0.82, "learning_rate": 4.063628854082807e-07, "loss": 0.7524, "step": 43541 }, { "epoch": 0.82, "learning_rate": 4.0627940195609035e-07, "loss": 0.944, "step": 43542 }, { "epoch": 0.82, "learning_rate": 4.061959263217893e-07, "loss": 1.0132, "step": 43543 }, { "epoch": 0.82, "learning_rate": 4.0611245850568804e-07, "loss": 1.023, "step": 43544 }, { "epoch": 0.82, "learning_rate": 4.060289985080987e-07, "loss": 0.8546, "step": 43545 }, { "epoch": 0.82, "learning_rate": 4.059455463293327e-07, "loss": 0.9615, "step": 43546 }, { "epoch": 0.82, "learning_rate": 4.0586210196970207e-07, "loss": 0.9091, "step": 43547 }, { "epoch": 0.82, "learning_rate": 4.0577866542951786e-07, "loss": 0.9714, "step": 43548 }, { "epoch": 0.82, "learning_rate": 4.0569523670909217e-07, "loss": 0.9289, "step": 43549 }, { "epoch": 0.82, "learning_rate": 4.0561181580873685e-07, "loss": 1.1868, "step": 43550 }, { "epoch": 0.82, "learning_rate": 4.055284027287615e-07, "loss": 0.7436, "step": 43551 }, { "epoch": 0.82, "learning_rate": 4.054449974694799e-07, "loss": 0.7428, "step": 43552 }, { "epoch": 0.82, "learning_rate": 4.0536160003120216e-07, "loss": 0.7051, "step": 43553 }, { "epoch": 0.82, "learning_rate": 4.0527821041423914e-07, "loss": 0.857, "step": 43554 }, { "epoch": 0.82, "learning_rate": 4.0519482861890446e-07, "loss": 0.8558, "step": 43555 }, { "epoch": 0.82, "learning_rate": 4.0511145464550733e-07, "loss": 1.0595, "step": 43556 }, { "epoch": 0.82, "learning_rate": 4.050280884943597e-07, "loss": 1.12, "step": 43557 }, { "epoch": 0.82, "learning_rate": 4.0494473016577327e-07, "loss": 0.8315, "step": 43558 }, { "epoch": 0.82, "learning_rate": 4.048613796600587e-07, "loss": 0.8744, "step": 43559 }, { "epoch": 0.82, "learning_rate": 4.0477803697752756e-07, "loss": 0.862, "step": 43560 }, { "epoch": 0.82, "learning_rate": 4.0469470211849103e-07, "loss": 0.7922, "step": 43561 }, { "epoch": 0.82, "learning_rate": 4.046113750832609e-07, "loss": 1.0759, "step": 43562 }, { "epoch": 0.82, "learning_rate": 4.045280558721465e-07, "loss": 0.8862, "step": 43563 }, { "epoch": 0.82, "learning_rate": 4.04444744485461e-07, "loss": 0.9664, "step": 43564 }, { "epoch": 0.82, "learning_rate": 4.0436144092351413e-07, "loss": 0.9547, "step": 43565 }, { "epoch": 0.82, "learning_rate": 4.042781451866176e-07, "loss": 0.8719, "step": 43566 }, { "epoch": 0.82, "learning_rate": 4.04194857275082e-07, "loss": 0.7633, "step": 43567 }, { "epoch": 0.82, "learning_rate": 4.0411157718921847e-07, "loss": 1.1641, "step": 43568 }, { "epoch": 0.82, "learning_rate": 4.0402830492933807e-07, "loss": 0.8288, "step": 43569 }, { "epoch": 0.82, "learning_rate": 4.0394504049575205e-07, "loss": 0.9188, "step": 43570 }, { "epoch": 0.82, "learning_rate": 4.038617838887712e-07, "loss": 0.8001, "step": 43571 }, { "epoch": 0.82, "learning_rate": 4.037785351087051e-07, "loss": 1.0138, "step": 43572 }, { "epoch": 0.82, "learning_rate": 4.0369529415586695e-07, "loss": 0.7522, "step": 43573 }, { "epoch": 0.82, "learning_rate": 4.036120610305655e-07, "loss": 0.8552, "step": 43574 }, { "epoch": 0.82, "learning_rate": 4.0352883573311186e-07, "loss": 1.0529, "step": 43575 }, { "epoch": 0.82, "learning_rate": 4.0344561826381854e-07, "loss": 0.9553, "step": 43576 }, { "epoch": 0.82, "learning_rate": 4.0336240862299425e-07, "loss": 0.8623, "step": 43577 }, { "epoch": 0.82, "learning_rate": 4.0327920681095064e-07, "loss": 0.6263, "step": 43578 }, { "epoch": 0.82, "learning_rate": 4.03196012827998e-07, "loss": 0.8576, "step": 43579 }, { "epoch": 0.82, "learning_rate": 4.0311282667444744e-07, "loss": 1.1115, "step": 43580 }, { "epoch": 0.82, "learning_rate": 4.030296483506091e-07, "loss": 0.9983, "step": 43581 }, { "epoch": 0.82, "learning_rate": 4.0294647785679375e-07, "loss": 0.845, "step": 43582 }, { "epoch": 0.82, "learning_rate": 4.0286331519331256e-07, "loss": 0.9139, "step": 43583 }, { "epoch": 0.82, "learning_rate": 4.027801603604742e-07, "loss": 0.9022, "step": 43584 }, { "epoch": 0.82, "learning_rate": 4.026970133585917e-07, "loss": 0.7805, "step": 43585 }, { "epoch": 0.82, "learning_rate": 4.0261387418797345e-07, "loss": 0.8068, "step": 43586 }, { "epoch": 0.82, "learning_rate": 4.0253074284893087e-07, "loss": 1.0499, "step": 43587 }, { "epoch": 0.82, "learning_rate": 4.0244761934177425e-07, "loss": 0.955, "step": 43588 }, { "epoch": 0.82, "learning_rate": 4.023645036668136e-07, "loss": 0.8211, "step": 43589 }, { "epoch": 0.82, "learning_rate": 4.022813958243599e-07, "loss": 0.7111, "step": 43590 }, { "epoch": 0.82, "learning_rate": 4.0219829581472303e-07, "loss": 0.8831, "step": 43591 }, { "epoch": 0.82, "learning_rate": 4.021152036382142e-07, "loss": 0.7856, "step": 43592 }, { "epoch": 0.82, "learning_rate": 4.020321192951415e-07, "loss": 0.8818, "step": 43593 }, { "epoch": 0.82, "learning_rate": 4.0194904278581776e-07, "loss": 1.1512, "step": 43594 }, { "epoch": 0.82, "learning_rate": 4.018659741105513e-07, "loss": 0.8856, "step": 43595 }, { "epoch": 0.82, "learning_rate": 4.0178291326965243e-07, "loss": 0.7966, "step": 43596 }, { "epoch": 0.82, "learning_rate": 4.0169986026343283e-07, "loss": 0.7887, "step": 43597 }, { "epoch": 0.82, "learning_rate": 4.016168150922012e-07, "loss": 0.8646, "step": 43598 }, { "epoch": 0.82, "learning_rate": 4.015337777562681e-07, "loss": 0.8268, "step": 43599 }, { "epoch": 0.82, "learning_rate": 4.014507482559435e-07, "loss": 1.1981, "step": 43600 }, { "epoch": 0.82, "learning_rate": 4.013677265915375e-07, "loss": 0.8416, "step": 43601 }, { "epoch": 0.82, "learning_rate": 4.0128471276335985e-07, "loss": 0.8034, "step": 43602 }, { "epoch": 0.82, "learning_rate": 4.012017067717208e-07, "loss": 0.7977, "step": 43603 }, { "epoch": 0.82, "learning_rate": 4.0111870861693105e-07, "loss": 1.1902, "step": 43604 }, { "epoch": 0.82, "learning_rate": 4.0103571829929827e-07, "loss": 1.0519, "step": 43605 }, { "epoch": 0.82, "learning_rate": 4.009527358191351e-07, "loss": 1.0217, "step": 43606 }, { "epoch": 0.82, "learning_rate": 4.008697611767495e-07, "loss": 0.9178, "step": 43607 }, { "epoch": 0.82, "learning_rate": 4.0078679437245166e-07, "loss": 0.8506, "step": 43608 }, { "epoch": 0.82, "learning_rate": 4.007038354065518e-07, "loss": 0.835, "step": 43609 }, { "epoch": 0.82, "learning_rate": 4.0062088427935906e-07, "loss": 0.7992, "step": 43610 }, { "epoch": 0.82, "learning_rate": 4.005379409911839e-07, "loss": 0.8947, "step": 43611 }, { "epoch": 0.82, "learning_rate": 4.004550055423356e-07, "loss": 1.1263, "step": 43612 }, { "epoch": 0.82, "learning_rate": 4.003720779331247e-07, "loss": 1.0284, "step": 43613 }, { "epoch": 0.82, "learning_rate": 4.0028915816385874e-07, "loss": 0.9256, "step": 43614 }, { "epoch": 0.82, "learning_rate": 4.002062462348497e-07, "loss": 0.9051, "step": 43615 }, { "epoch": 0.82, "learning_rate": 4.001233421464057e-07, "loss": 0.9236, "step": 43616 }, { "epoch": 0.82, "learning_rate": 4.000404458988363e-07, "loss": 1.13, "step": 43617 }, { "epoch": 0.82, "learning_rate": 3.999575574924525e-07, "loss": 0.7492, "step": 43618 }, { "epoch": 0.82, "learning_rate": 3.9987467692756245e-07, "loss": 0.9892, "step": 43619 }, { "epoch": 0.82, "learning_rate": 3.997918042044757e-07, "loss": 0.8476, "step": 43620 }, { "epoch": 0.82, "learning_rate": 3.997089393235021e-07, "loss": 1.028, "step": 43621 }, { "epoch": 0.82, "learning_rate": 3.996260822849507e-07, "loss": 0.7057, "step": 43622 }, { "epoch": 0.82, "learning_rate": 3.9954323308913134e-07, "loss": 0.6235, "step": 43623 }, { "epoch": 0.82, "learning_rate": 3.994603917363532e-07, "loss": 1.0063, "step": 43624 }, { "epoch": 0.82, "learning_rate": 3.9937755822692606e-07, "loss": 1.0836, "step": 43625 }, { "epoch": 0.82, "learning_rate": 3.9929473256115735e-07, "loss": 0.7882, "step": 43626 }, { "epoch": 0.82, "learning_rate": 3.9921191473935917e-07, "loss": 0.9303, "step": 43627 }, { "epoch": 0.82, "learning_rate": 3.991291047618384e-07, "loss": 0.9432, "step": 43628 }, { "epoch": 0.82, "learning_rate": 3.9904630262890544e-07, "loss": 0.7942, "step": 43629 }, { "epoch": 0.82, "learning_rate": 3.9896350834086913e-07, "loss": 0.9199, "step": 43630 }, { "epoch": 0.82, "learning_rate": 3.988807218980384e-07, "loss": 1.0541, "step": 43631 }, { "epoch": 0.82, "learning_rate": 3.9879794330072274e-07, "loss": 1.0376, "step": 43632 }, { "epoch": 0.82, "learning_rate": 3.987151725492314e-07, "loss": 0.9942, "step": 43633 }, { "epoch": 0.82, "learning_rate": 3.9863240964387344e-07, "loss": 0.7606, "step": 43634 }, { "epoch": 0.82, "learning_rate": 3.9854965458495655e-07, "loss": 1.0969, "step": 43635 }, { "epoch": 0.82, "learning_rate": 3.98466907372792e-07, "loss": 0.8553, "step": 43636 }, { "epoch": 0.82, "learning_rate": 3.983841680076872e-07, "loss": 0.9659, "step": 43637 }, { "epoch": 0.82, "learning_rate": 3.983014364899507e-07, "loss": 0.9769, "step": 43638 }, { "epoch": 0.82, "learning_rate": 3.9821871281989334e-07, "loss": 0.9581, "step": 43639 }, { "epoch": 0.82, "learning_rate": 3.9813599699782215e-07, "loss": 0.9227, "step": 43640 }, { "epoch": 0.82, "learning_rate": 3.9805328902404686e-07, "loss": 0.884, "step": 43641 }, { "epoch": 0.82, "learning_rate": 3.9797058889887636e-07, "loss": 0.884, "step": 43642 }, { "epoch": 0.82, "learning_rate": 3.978878966226188e-07, "loss": 1.0141, "step": 43643 }, { "epoch": 0.82, "learning_rate": 3.978052121955836e-07, "loss": 0.9141, "step": 43644 }, { "epoch": 0.82, "learning_rate": 3.9772253561807944e-07, "loss": 0.9567, "step": 43645 }, { "epoch": 0.82, "learning_rate": 3.976398668904152e-07, "loss": 0.9399, "step": 43646 }, { "epoch": 0.82, "learning_rate": 3.975572060128982e-07, "loss": 0.8291, "step": 43647 }, { "epoch": 0.82, "learning_rate": 3.974745529858393e-07, "loss": 0.7321, "step": 43648 }, { "epoch": 0.82, "learning_rate": 3.9739190780954536e-07, "loss": 1.0704, "step": 43649 }, { "epoch": 0.82, "learning_rate": 3.973092704843254e-07, "loss": 0.8809, "step": 43650 }, { "epoch": 0.82, "learning_rate": 3.972266410104883e-07, "loss": 0.8999, "step": 43651 }, { "epoch": 0.82, "learning_rate": 3.9714401938834247e-07, "loss": 0.9479, "step": 43652 }, { "epoch": 0.82, "learning_rate": 3.970614056181965e-07, "loss": 0.6691, "step": 43653 }, { "epoch": 0.82, "learning_rate": 3.9697879970035853e-07, "loss": 0.847, "step": 43654 }, { "epoch": 0.82, "learning_rate": 3.9689620163513796e-07, "loss": 1.0117, "step": 43655 }, { "epoch": 0.82, "learning_rate": 3.968136114228413e-07, "loss": 0.8875, "step": 43656 }, { "epoch": 0.82, "learning_rate": 3.9673102906377936e-07, "loss": 0.8411, "step": 43657 }, { "epoch": 0.82, "learning_rate": 3.9664845455825856e-07, "loss": 0.7731, "step": 43658 }, { "epoch": 0.82, "learning_rate": 3.965658879065876e-07, "loss": 0.8623, "step": 43659 }, { "epoch": 0.82, "learning_rate": 3.964833291090761e-07, "loss": 0.7521, "step": 43660 }, { "epoch": 0.82, "learning_rate": 3.964007781660306e-07, "loss": 0.9065, "step": 43661 }, { "epoch": 0.82, "learning_rate": 3.963182350777603e-07, "loss": 0.9557, "step": 43662 }, { "epoch": 0.82, "learning_rate": 3.9623569984457324e-07, "loss": 1.0704, "step": 43663 }, { "epoch": 0.82, "learning_rate": 3.961531724667775e-07, "loss": 0.9393, "step": 43664 }, { "epoch": 0.82, "learning_rate": 3.9607065294468145e-07, "loss": 0.8363, "step": 43665 }, { "epoch": 0.82, "learning_rate": 3.959881412785929e-07, "loss": 0.9368, "step": 43666 }, { "epoch": 0.82, "learning_rate": 3.9590563746882083e-07, "loss": 0.817, "step": 43667 }, { "epoch": 0.82, "learning_rate": 3.958231415156713e-07, "loss": 0.9443, "step": 43668 }, { "epoch": 0.82, "learning_rate": 3.9574065341945496e-07, "loss": 0.8412, "step": 43669 }, { "epoch": 0.82, "learning_rate": 3.956581731804776e-07, "loss": 0.8189, "step": 43670 }, { "epoch": 0.82, "learning_rate": 3.955757007990485e-07, "loss": 0.9301, "step": 43671 }, { "epoch": 0.82, "learning_rate": 3.9549323627547517e-07, "loss": 0.9944, "step": 43672 }, { "epoch": 0.82, "learning_rate": 3.9541077961006535e-07, "loss": 0.8013, "step": 43673 }, { "epoch": 0.82, "learning_rate": 3.953283308031272e-07, "loss": 0.795, "step": 43674 }, { "epoch": 0.82, "learning_rate": 3.9524588985496855e-07, "loss": 1.0912, "step": 43675 }, { "epoch": 0.82, "learning_rate": 3.95163456765898e-07, "loss": 1.0264, "step": 43676 }, { "epoch": 0.82, "learning_rate": 3.950810315362211e-07, "loss": 0.9424, "step": 43677 }, { "epoch": 0.82, "learning_rate": 3.9499861416624846e-07, "loss": 0.7461, "step": 43678 }, { "epoch": 0.82, "learning_rate": 3.949162046562857e-07, "loss": 0.7786, "step": 43679 }, { "epoch": 0.82, "learning_rate": 3.9483380300664066e-07, "loss": 0.791, "step": 43680 }, { "epoch": 0.82, "learning_rate": 3.9475140921762303e-07, "loss": 0.9901, "step": 43681 }, { "epoch": 0.82, "learning_rate": 3.946690232895384e-07, "loss": 1.1125, "step": 43682 }, { "epoch": 0.82, "learning_rate": 3.945866452226951e-07, "loss": 0.7041, "step": 43683 }, { "epoch": 0.82, "learning_rate": 3.945042750174008e-07, "loss": 0.851, "step": 43684 }, { "epoch": 0.82, "learning_rate": 3.944219126739629e-07, "loss": 0.7619, "step": 43685 }, { "epoch": 0.82, "learning_rate": 3.94339558192689e-07, "loss": 1.0198, "step": 43686 }, { "epoch": 0.82, "learning_rate": 3.9425721157388656e-07, "loss": 1.0646, "step": 43687 }, { "epoch": 0.82, "learning_rate": 3.94174872817864e-07, "loss": 0.9512, "step": 43688 }, { "epoch": 0.82, "learning_rate": 3.940925419249264e-07, "loss": 0.7623, "step": 43689 }, { "epoch": 0.82, "learning_rate": 3.94010218895384e-07, "loss": 1.0538, "step": 43690 }, { "epoch": 0.82, "learning_rate": 3.939279037295424e-07, "loss": 0.8229, "step": 43691 }, { "epoch": 0.82, "learning_rate": 3.9384559642770935e-07, "loss": 1.0724, "step": 43692 }, { "epoch": 0.82, "learning_rate": 3.937632969901922e-07, "loss": 1.2108, "step": 43693 }, { "epoch": 0.82, "learning_rate": 3.936810054172982e-07, "loss": 1.1802, "step": 43694 }, { "epoch": 0.82, "learning_rate": 3.935987217093351e-07, "loss": 0.765, "step": 43695 }, { "epoch": 0.82, "learning_rate": 3.935164458666094e-07, "loss": 1.0218, "step": 43696 }, { "epoch": 0.82, "learning_rate": 3.934341778894296e-07, "loss": 0.903, "step": 43697 }, { "epoch": 0.82, "learning_rate": 3.933519177781006e-07, "loss": 0.7013, "step": 43698 }, { "epoch": 0.82, "learning_rate": 3.932696655329324e-07, "loss": 1.0078, "step": 43699 }, { "epoch": 0.82, "learning_rate": 3.931874211542297e-07, "loss": 1.0752, "step": 43700 }, { "epoch": 0.82, "learning_rate": 3.931051846423004e-07, "loss": 0.9201, "step": 43701 }, { "epoch": 0.82, "learning_rate": 3.9302295599745243e-07, "loss": 1.0398, "step": 43702 }, { "epoch": 0.82, "learning_rate": 3.929407352199921e-07, "loss": 0.9844, "step": 43703 }, { "epoch": 0.82, "learning_rate": 3.9285852231022605e-07, "loss": 0.7148, "step": 43704 }, { "epoch": 0.82, "learning_rate": 3.927763172684618e-07, "loss": 0.7692, "step": 43705 }, { "epoch": 0.82, "learning_rate": 3.926941200950063e-07, "loss": 1.1833, "step": 43706 }, { "epoch": 0.82, "learning_rate": 3.92611930790166e-07, "loss": 0.6709, "step": 43707 }, { "epoch": 0.82, "learning_rate": 3.9252974935424847e-07, "loss": 0.8442, "step": 43708 }, { "epoch": 0.82, "learning_rate": 3.9244757578756063e-07, "loss": 0.895, "step": 43709 }, { "epoch": 0.82, "learning_rate": 3.9236541009040783e-07, "loss": 0.9154, "step": 43710 }, { "epoch": 0.82, "learning_rate": 3.922832522630993e-07, "loss": 0.9498, "step": 43711 }, { "epoch": 0.82, "learning_rate": 3.922011023059397e-07, "loss": 1.2471, "step": 43712 }, { "epoch": 0.82, "learning_rate": 3.9211896021923656e-07, "loss": 0.8441, "step": 43713 }, { "epoch": 0.82, "learning_rate": 3.920368260032967e-07, "loss": 0.9741, "step": 43714 }, { "epoch": 0.82, "learning_rate": 3.9195469965842667e-07, "loss": 1.0441, "step": 43715 }, { "epoch": 0.82, "learning_rate": 3.9187258118493304e-07, "loss": 0.6648, "step": 43716 }, { "epoch": 0.82, "learning_rate": 3.917904705831227e-07, "loss": 0.8067, "step": 43717 }, { "epoch": 0.82, "learning_rate": 3.9170836785330264e-07, "loss": 0.8593, "step": 43718 }, { "epoch": 0.82, "learning_rate": 3.916262729957776e-07, "loss": 1.0399, "step": 43719 }, { "epoch": 0.82, "learning_rate": 3.915441860108568e-07, "loss": 0.7928, "step": 43720 }, { "epoch": 0.82, "learning_rate": 3.9146210689884474e-07, "loss": 0.9995, "step": 43721 }, { "epoch": 0.82, "learning_rate": 3.913800356600478e-07, "loss": 0.9674, "step": 43722 }, { "epoch": 0.82, "learning_rate": 3.9129797229477437e-07, "loss": 0.6804, "step": 43723 }, { "epoch": 0.82, "learning_rate": 3.9121591680332916e-07, "loss": 0.9874, "step": 43724 }, { "epoch": 0.82, "learning_rate": 3.911338691860189e-07, "loss": 1.05, "step": 43725 }, { "epoch": 0.82, "learning_rate": 3.9105182944315034e-07, "loss": 1.0085, "step": 43726 }, { "epoch": 0.82, "learning_rate": 3.909697975750293e-07, "loss": 0.8206, "step": 43727 }, { "epoch": 0.83, "learning_rate": 3.908877735819627e-07, "loss": 0.8741, "step": 43728 }, { "epoch": 0.83, "learning_rate": 3.908057574642563e-07, "loss": 0.6848, "step": 43729 }, { "epoch": 0.83, "learning_rate": 3.907237492222171e-07, "loss": 0.9543, "step": 43730 }, { "epoch": 0.83, "learning_rate": 3.906417488561495e-07, "loss": 0.9465, "step": 43731 }, { "epoch": 0.83, "learning_rate": 3.905597563663624e-07, "loss": 0.8483, "step": 43732 }, { "epoch": 0.83, "learning_rate": 3.904777717531597e-07, "loss": 0.756, "step": 43733 }, { "epoch": 0.83, "learning_rate": 3.903957950168483e-07, "loss": 1.0067, "step": 43734 }, { "epoch": 0.83, "learning_rate": 3.903138261577344e-07, "loss": 0.9348, "step": 43735 }, { "epoch": 0.83, "learning_rate": 3.902318651761239e-07, "loss": 1.2042, "step": 43736 }, { "epoch": 0.83, "learning_rate": 3.901499120723229e-07, "loss": 0.9986, "step": 43737 }, { "epoch": 0.83, "learning_rate": 3.9006796684663757e-07, "loss": 0.7577, "step": 43738 }, { "epoch": 0.83, "learning_rate": 3.899860294993743e-07, "loss": 1.0251, "step": 43739 }, { "epoch": 0.83, "learning_rate": 3.8990410003083736e-07, "loss": 0.8734, "step": 43740 }, { "epoch": 0.83, "learning_rate": 3.89822178441335e-07, "loss": 0.7194, "step": 43741 }, { "epoch": 0.83, "learning_rate": 3.897402647311713e-07, "loss": 0.7283, "step": 43742 }, { "epoch": 0.83, "learning_rate": 3.8965835890065197e-07, "loss": 1.0309, "step": 43743 }, { "epoch": 0.83, "learning_rate": 3.8957646095008514e-07, "loss": 1.0378, "step": 43744 }, { "epoch": 0.83, "learning_rate": 3.8949457087977425e-07, "loss": 0.7992, "step": 43745 }, { "epoch": 0.83, "learning_rate": 3.8941268869002597e-07, "loss": 0.9233, "step": 43746 }, { "epoch": 0.83, "learning_rate": 3.8933081438114613e-07, "loss": 0.8949, "step": 43747 }, { "epoch": 0.83, "learning_rate": 3.892489479534403e-07, "loss": 0.88, "step": 43748 }, { "epoch": 0.83, "learning_rate": 3.8916708940721417e-07, "loss": 1.038, "step": 43749 }, { "epoch": 0.83, "learning_rate": 3.8908523874277323e-07, "loss": 1.098, "step": 43750 }, { "epoch": 0.83, "learning_rate": 3.8900339596042417e-07, "loss": 1.0176, "step": 43751 }, { "epoch": 0.83, "learning_rate": 3.889215610604702e-07, "loss": 1.048, "step": 43752 }, { "epoch": 0.83, "learning_rate": 3.888397340432198e-07, "loss": 0.9008, "step": 43753 }, { "epoch": 0.83, "learning_rate": 3.887579149089765e-07, "loss": 0.8083, "step": 43754 }, { "epoch": 0.83, "learning_rate": 3.8867610365804635e-07, "loss": 0.9348, "step": 43755 }, { "epoch": 0.83, "learning_rate": 3.8859430029073495e-07, "loss": 0.9451, "step": 43756 }, { "epoch": 0.83, "learning_rate": 3.8851250480734766e-07, "loss": 0.753, "step": 43757 }, { "epoch": 0.83, "learning_rate": 3.884307172081897e-07, "loss": 0.879, "step": 43758 }, { "epoch": 0.83, "learning_rate": 3.88348937493567e-07, "loss": 0.8679, "step": 43759 }, { "epoch": 0.83, "learning_rate": 3.8826716566378516e-07, "loss": 0.9623, "step": 43760 }, { "epoch": 0.83, "learning_rate": 3.881854017191478e-07, "loss": 0.9374, "step": 43761 }, { "epoch": 0.83, "learning_rate": 3.881036456599627e-07, "loss": 0.9999, "step": 43762 }, { "epoch": 0.83, "learning_rate": 3.88021897486533e-07, "loss": 1.194, "step": 43763 }, { "epoch": 0.83, "learning_rate": 3.8794015719916424e-07, "loss": 0.9681, "step": 43764 }, { "epoch": 0.83, "learning_rate": 3.878584247981634e-07, "loss": 0.8167, "step": 43765 }, { "epoch": 0.83, "learning_rate": 3.8777670028383395e-07, "loss": 0.7621, "step": 43766 }, { "epoch": 0.83, "learning_rate": 3.8769498365648137e-07, "loss": 1.0377, "step": 43767 }, { "epoch": 0.83, "learning_rate": 3.8761327491641107e-07, "loss": 1.0743, "step": 43768 }, { "epoch": 0.83, "learning_rate": 3.8753157406392793e-07, "loss": 0.8682, "step": 43769 }, { "epoch": 0.83, "learning_rate": 3.874498810993374e-07, "loss": 0.8555, "step": 43770 }, { "epoch": 0.83, "learning_rate": 3.873681960229439e-07, "loss": 0.7942, "step": 43771 }, { "epoch": 0.83, "learning_rate": 3.8728651883505356e-07, "loss": 0.8219, "step": 43772 }, { "epoch": 0.83, "learning_rate": 3.872048495359698e-07, "loss": 0.9356, "step": 43773 }, { "epoch": 0.83, "learning_rate": 3.871231881259985e-07, "loss": 0.9903, "step": 43774 }, { "epoch": 0.83, "learning_rate": 3.870415346054446e-07, "loss": 1.0474, "step": 43775 }, { "epoch": 0.83, "learning_rate": 3.869598889746126e-07, "loss": 1.0024, "step": 43776 }, { "epoch": 0.83, "learning_rate": 3.868782512338076e-07, "loss": 0.843, "step": 43777 }, { "epoch": 0.83, "learning_rate": 3.8679662138333436e-07, "loss": 0.9846, "step": 43778 }, { "epoch": 0.83, "learning_rate": 3.8671499942349866e-07, "loss": 0.9248, "step": 43779 }, { "epoch": 0.83, "learning_rate": 3.8663338535460284e-07, "loss": 0.8957, "step": 43780 }, { "epoch": 0.83, "learning_rate": 3.8655177917695437e-07, "loss": 1.0486, "step": 43781 }, { "epoch": 0.83, "learning_rate": 3.864701808908564e-07, "loss": 1.1221, "step": 43782 }, { "epoch": 0.83, "learning_rate": 3.863885904966136e-07, "loss": 0.8417, "step": 43783 }, { "epoch": 0.83, "learning_rate": 3.8630700799453137e-07, "loss": 0.7188, "step": 43784 }, { "epoch": 0.83, "learning_rate": 3.8622543338491384e-07, "loss": 0.7859, "step": 43785 }, { "epoch": 0.83, "learning_rate": 3.8614386666806556e-07, "loss": 1.0822, "step": 43786 }, { "epoch": 0.83, "learning_rate": 3.8606230784429153e-07, "loss": 1.0847, "step": 43787 }, { "epoch": 0.83, "learning_rate": 3.859807569138965e-07, "loss": 0.8499, "step": 43788 }, { "epoch": 0.83, "learning_rate": 3.8589921387718333e-07, "loss": 0.9546, "step": 43789 }, { "epoch": 0.83, "learning_rate": 3.8581767873445834e-07, "loss": 0.8396, "step": 43790 }, { "epoch": 0.83, "learning_rate": 3.8573615148602584e-07, "loss": 0.7874, "step": 43791 }, { "epoch": 0.83, "learning_rate": 3.8565463213218826e-07, "loss": 0.729, "step": 43792 }, { "epoch": 0.83, "learning_rate": 3.85573120673253e-07, "loss": 0.9348, "step": 43793 }, { "epoch": 0.83, "learning_rate": 3.8549161710952214e-07, "loss": 0.9988, "step": 43794 }, { "epoch": 0.83, "learning_rate": 3.8541012144130085e-07, "loss": 0.7332, "step": 43795 }, { "epoch": 0.83, "learning_rate": 3.853286336688933e-07, "loss": 0.6964, "step": 43796 }, { "epoch": 0.83, "learning_rate": 3.852471537926039e-07, "loss": 1.1655, "step": 43797 }, { "epoch": 0.83, "learning_rate": 3.851656818127367e-07, "loss": 0.8525, "step": 43798 }, { "epoch": 0.83, "learning_rate": 3.8508421772959575e-07, "loss": 0.8266, "step": 43799 }, { "epoch": 0.83, "learning_rate": 3.850027615434865e-07, "loss": 0.9835, "step": 43800 }, { "epoch": 0.83, "learning_rate": 3.8492131325471057e-07, "loss": 1.0212, "step": 43801 }, { "epoch": 0.83, "learning_rate": 3.8483987286357493e-07, "loss": 0.938, "step": 43802 }, { "epoch": 0.83, "learning_rate": 3.847584403703819e-07, "loss": 0.7245, "step": 43803 }, { "epoch": 0.83, "learning_rate": 3.8467701577543595e-07, "loss": 0.7409, "step": 43804 }, { "epoch": 0.83, "learning_rate": 3.8459559907904095e-07, "loss": 0.8351, "step": 43805 }, { "epoch": 0.83, "learning_rate": 3.8451419028150113e-07, "loss": 1.084, "step": 43806 }, { "epoch": 0.83, "learning_rate": 3.844327893831207e-07, "loss": 0.9362, "step": 43807 }, { "epoch": 0.83, "learning_rate": 3.8435139638420324e-07, "loss": 0.9614, "step": 43808 }, { "epoch": 0.83, "learning_rate": 3.8427001128505335e-07, "loss": 1.0328, "step": 43809 }, { "epoch": 0.83, "learning_rate": 3.8418863408597323e-07, "loss": 0.5106, "step": 43810 }, { "epoch": 0.83, "learning_rate": 3.8410726478726846e-07, "loss": 0.8241, "step": 43811 }, { "epoch": 0.83, "learning_rate": 3.8402590338924297e-07, "loss": 1.0516, "step": 43812 }, { "epoch": 0.83, "learning_rate": 3.839445498921987e-07, "loss": 1.0563, "step": 43813 }, { "epoch": 0.83, "learning_rate": 3.838632042964416e-07, "loss": 0.9351, "step": 43814 }, { "epoch": 0.83, "learning_rate": 3.8378186660227384e-07, "loss": 0.8523, "step": 43815 }, { "epoch": 0.83, "learning_rate": 3.8370053681e-07, "loss": 0.8161, "step": 43816 }, { "epoch": 0.83, "learning_rate": 3.8361921491992304e-07, "loss": 0.6779, "step": 43817 }, { "epoch": 0.83, "learning_rate": 3.835379009323473e-07, "loss": 0.9664, "step": 43818 }, { "epoch": 0.83, "learning_rate": 3.834565948475763e-07, "loss": 1.1488, "step": 43819 }, { "epoch": 0.83, "learning_rate": 3.8337529666591323e-07, "loss": 0.8388, "step": 43820 }, { "epoch": 0.83, "learning_rate": 3.8329400638766253e-07, "loss": 0.7989, "step": 43821 }, { "epoch": 0.83, "learning_rate": 3.8321272401312587e-07, "loss": 0.9594, "step": 43822 }, { "epoch": 0.83, "learning_rate": 3.8313144954260944e-07, "loss": 0.8379, "step": 43823 }, { "epoch": 0.83, "learning_rate": 3.830501829764144e-07, "loss": 0.882, "step": 43824 }, { "epoch": 0.83, "learning_rate": 3.829689243148446e-07, "loss": 0.9557, "step": 43825 }, { "epoch": 0.83, "learning_rate": 3.828876735582052e-07, "loss": 0.7839, "step": 43826 }, { "epoch": 0.83, "learning_rate": 3.828064307067975e-07, "loss": 0.8029, "step": 43827 }, { "epoch": 0.83, "learning_rate": 3.827251957609257e-07, "loss": 1.001, "step": 43828 }, { "epoch": 0.83, "learning_rate": 3.8264396872089326e-07, "loss": 0.7632, "step": 43829 }, { "epoch": 0.83, "learning_rate": 3.8256274958700323e-07, "loss": 0.9931, "step": 43830 }, { "epoch": 0.83, "learning_rate": 3.8248153835955896e-07, "loss": 1.2114, "step": 43831 }, { "epoch": 0.83, "learning_rate": 3.8240033503886386e-07, "loss": 0.8254, "step": 43832 }, { "epoch": 0.83, "learning_rate": 3.823191396252213e-07, "loss": 0.821, "step": 43833 }, { "epoch": 0.83, "learning_rate": 3.8223795211893316e-07, "loss": 0.6705, "step": 43834 }, { "epoch": 0.83, "learning_rate": 3.8215677252030456e-07, "loss": 0.8381, "step": 43835 }, { "epoch": 0.83, "learning_rate": 3.8207560082963724e-07, "loss": 0.7109, "step": 43836 }, { "epoch": 0.83, "learning_rate": 3.819944370472348e-07, "loss": 0.8966, "step": 43837 }, { "epoch": 0.83, "learning_rate": 3.819132811734e-07, "loss": 1.0501, "step": 43838 }, { "epoch": 0.83, "learning_rate": 3.81832133208436e-07, "loss": 0.9744, "step": 43839 }, { "epoch": 0.83, "learning_rate": 3.817509931526461e-07, "loss": 0.7049, "step": 43840 }, { "epoch": 0.83, "learning_rate": 3.81669861006333e-07, "loss": 0.9092, "step": 43841 }, { "epoch": 0.83, "learning_rate": 3.8158873676980015e-07, "loss": 0.9293, "step": 43842 }, { "epoch": 0.83, "learning_rate": 3.8150762044334877e-07, "loss": 0.8779, "step": 43843 }, { "epoch": 0.83, "learning_rate": 3.814265120272842e-07, "loss": 1.0485, "step": 43844 }, { "epoch": 0.83, "learning_rate": 3.813454115219076e-07, "loss": 0.8969, "step": 43845 }, { "epoch": 0.83, "learning_rate": 3.812643189275217e-07, "loss": 0.8049, "step": 43846 }, { "epoch": 0.83, "learning_rate": 3.8118323424443106e-07, "loss": 0.7548, "step": 43847 }, { "epoch": 0.83, "learning_rate": 3.811021574729365e-07, "loss": 0.728, "step": 43848 }, { "epoch": 0.83, "learning_rate": 3.810210886133417e-07, "loss": 0.9598, "step": 43849 }, { "epoch": 0.83, "learning_rate": 3.809400276659489e-07, "loss": 1.0262, "step": 43850 }, { "epoch": 0.83, "learning_rate": 3.808589746310612e-07, "loss": 0.9649, "step": 43851 }, { "epoch": 0.83, "learning_rate": 3.807779295089814e-07, "loss": 0.796, "step": 43852 }, { "epoch": 0.83, "learning_rate": 3.806968923000115e-07, "loss": 1.0281, "step": 43853 }, { "epoch": 0.83, "learning_rate": 3.8061586300445513e-07, "loss": 0.7129, "step": 43854 }, { "epoch": 0.83, "learning_rate": 3.805348416226129e-07, "loss": 0.739, "step": 43855 }, { "epoch": 0.83, "learning_rate": 3.8045382815478983e-07, "loss": 1.1715, "step": 43856 }, { "epoch": 0.83, "learning_rate": 3.803728226012865e-07, "loss": 1.0534, "step": 43857 }, { "epoch": 0.83, "learning_rate": 3.8029182496240627e-07, "loss": 0.8793, "step": 43858 }, { "epoch": 0.83, "learning_rate": 3.802108352384512e-07, "loss": 0.793, "step": 43859 }, { "epoch": 0.83, "learning_rate": 3.80129853429724e-07, "loss": 0.7694, "step": 43860 }, { "epoch": 0.83, "learning_rate": 3.8004887953652674e-07, "loss": 0.9823, "step": 43861 }, { "epoch": 0.83, "learning_rate": 3.7996791355916216e-07, "loss": 1.0699, "step": 43862 }, { "epoch": 0.83, "learning_rate": 3.798869554979329e-07, "loss": 1.0723, "step": 43863 }, { "epoch": 0.83, "learning_rate": 3.7980600535313965e-07, "loss": 0.7714, "step": 43864 }, { "epoch": 0.83, "learning_rate": 3.7972506312508677e-07, "loss": 0.8103, "step": 43865 }, { "epoch": 0.83, "learning_rate": 3.796441288140751e-07, "loss": 0.7023, "step": 43866 }, { "epoch": 0.83, "learning_rate": 3.7956320242040655e-07, "loss": 0.9373, "step": 43867 }, { "epoch": 0.83, "learning_rate": 3.794822839443851e-07, "loss": 0.9988, "step": 43868 }, { "epoch": 0.83, "learning_rate": 3.7940137338631137e-07, "loss": 1.1198, "step": 43869 }, { "epoch": 0.83, "learning_rate": 3.793204707464876e-07, "loss": 0.9383, "step": 43870 }, { "epoch": 0.83, "learning_rate": 3.7923957602521654e-07, "loss": 1.0021, "step": 43871 }, { "epoch": 0.83, "learning_rate": 3.791586892227997e-07, "loss": 0.7639, "step": 43872 }, { "epoch": 0.83, "learning_rate": 3.7907781033953927e-07, "loss": 0.7162, "step": 43873 }, { "epoch": 0.83, "learning_rate": 3.7899693937573726e-07, "loss": 1.051, "step": 43874 }, { "epoch": 0.83, "learning_rate": 3.7891607633169626e-07, "loss": 1.1591, "step": 43875 }, { "epoch": 0.83, "learning_rate": 3.788352212077165e-07, "loss": 1.0296, "step": 43876 }, { "epoch": 0.83, "learning_rate": 3.7875437400410193e-07, "loss": 1.0035, "step": 43877 }, { "epoch": 0.83, "learning_rate": 3.7867353472115315e-07, "loss": 0.7628, "step": 43878 }, { "epoch": 0.83, "learning_rate": 3.7859270335917216e-07, "loss": 0.9665, "step": 43879 }, { "epoch": 0.83, "learning_rate": 3.785118799184612e-07, "loss": 0.9842, "step": 43880 }, { "epoch": 0.83, "learning_rate": 3.7843106439932164e-07, "loss": 1.0684, "step": 43881 }, { "epoch": 0.83, "learning_rate": 3.783502568020556e-07, "loss": 0.9443, "step": 43882 }, { "epoch": 0.83, "learning_rate": 3.782694571269643e-07, "loss": 0.9275, "step": 43883 }, { "epoch": 0.83, "learning_rate": 3.7818866537435077e-07, "loss": 0.664, "step": 43884 }, { "epoch": 0.83, "learning_rate": 3.7810788154451437e-07, "loss": 0.7543, "step": 43885 }, { "epoch": 0.83, "learning_rate": 3.7802710563775936e-07, "loss": 0.8051, "step": 43886 }, { "epoch": 0.83, "learning_rate": 3.7794633765438517e-07, "loss": 1.0891, "step": 43887 }, { "epoch": 0.83, "learning_rate": 3.778655775946941e-07, "loss": 0.9389, "step": 43888 }, { "epoch": 0.83, "learning_rate": 3.7778482545898886e-07, "loss": 0.777, "step": 43889 }, { "epoch": 0.83, "learning_rate": 3.7770408124756934e-07, "loss": 0.8188, "step": 43890 }, { "epoch": 0.83, "learning_rate": 3.7762334496073804e-07, "loss": 1.0156, "step": 43891 }, { "epoch": 0.83, "learning_rate": 3.775426165987958e-07, "loss": 0.7773, "step": 43892 }, { "epoch": 0.83, "learning_rate": 3.774618961620444e-07, "loss": 1.1695, "step": 43893 }, { "epoch": 0.83, "learning_rate": 3.7738118365078543e-07, "loss": 1.11, "step": 43894 }, { "epoch": 0.83, "learning_rate": 3.773004790653198e-07, "loss": 0.9164, "step": 43895 }, { "epoch": 0.83, "learning_rate": 3.772197824059498e-07, "loss": 0.7686, "step": 43896 }, { "epoch": 0.83, "learning_rate": 3.771390936729749e-07, "loss": 0.9034, "step": 43897 }, { "epoch": 0.83, "learning_rate": 3.770584128666985e-07, "loss": 0.7213, "step": 43898 }, { "epoch": 0.83, "learning_rate": 3.7697773998742054e-07, "loss": 1.3542, "step": 43899 }, { "epoch": 0.83, "learning_rate": 3.7689707503544253e-07, "loss": 0.9755, "step": 43900 }, { "epoch": 0.83, "learning_rate": 3.768164180110656e-07, "loss": 0.8546, "step": 43901 }, { "epoch": 0.83, "learning_rate": 3.767357689145912e-07, "loss": 0.973, "step": 43902 }, { "epoch": 0.83, "learning_rate": 3.766551277463204e-07, "loss": 1.0044, "step": 43903 }, { "epoch": 0.83, "learning_rate": 3.7657449450655417e-07, "loss": 0.8983, "step": 43904 }, { "epoch": 0.83, "learning_rate": 3.764938691955941e-07, "loss": 0.8934, "step": 43905 }, { "epoch": 0.83, "learning_rate": 3.7641325181374006e-07, "loss": 1.0709, "step": 43906 }, { "epoch": 0.83, "learning_rate": 3.7633264236129453e-07, "loss": 1.0134, "step": 43907 }, { "epoch": 0.83, "learning_rate": 3.762520408385575e-07, "loss": 1.0529, "step": 43908 }, { "epoch": 0.83, "learning_rate": 3.7617144724582973e-07, "loss": 0.9277, "step": 43909 }, { "epoch": 0.83, "learning_rate": 3.7609086158341356e-07, "loss": 0.7327, "step": 43910 }, { "epoch": 0.83, "learning_rate": 3.760102838516086e-07, "loss": 1.0624, "step": 43911 }, { "epoch": 0.83, "learning_rate": 3.759297140507159e-07, "loss": 1.051, "step": 43912 }, { "epoch": 0.83, "learning_rate": 3.7584915218103674e-07, "loss": 0.8354, "step": 43913 }, { "epoch": 0.83, "learning_rate": 3.757685982428716e-07, "loss": 0.9326, "step": 43914 }, { "epoch": 0.83, "learning_rate": 3.756880522365214e-07, "loss": 0.7541, "step": 43915 }, { "epoch": 0.83, "learning_rate": 3.7560751416228695e-07, "loss": 0.9268, "step": 43916 }, { "epoch": 0.83, "learning_rate": 3.755269840204695e-07, "loss": 0.8115, "step": 43917 }, { "epoch": 0.83, "learning_rate": 3.754464618113679e-07, "loss": 0.8716, "step": 43918 }, { "epoch": 0.83, "learning_rate": 3.7536594753528524e-07, "loss": 0.9942, "step": 43919 }, { "epoch": 0.83, "learning_rate": 3.7528544119252053e-07, "loss": 0.9066, "step": 43920 }, { "epoch": 0.83, "learning_rate": 3.752049427833748e-07, "loss": 0.842, "step": 43921 }, { "epoch": 0.83, "learning_rate": 3.7512445230814846e-07, "loss": 0.915, "step": 43922 }, { "epoch": 0.83, "learning_rate": 3.7504396976714265e-07, "loss": 0.7958, "step": 43923 }, { "epoch": 0.83, "learning_rate": 3.7496349516065705e-07, "loss": 0.8228, "step": 43924 }, { "epoch": 0.83, "learning_rate": 3.7488302848899287e-07, "loss": 1.2028, "step": 43925 }, { "epoch": 0.83, "learning_rate": 3.74802569752451e-07, "loss": 0.8157, "step": 43926 }, { "epoch": 0.83, "learning_rate": 3.7472211895132977e-07, "loss": 0.8, "step": 43927 }, { "epoch": 0.83, "learning_rate": 3.7464167608593225e-07, "loss": 0.9509, "step": 43928 }, { "epoch": 0.83, "learning_rate": 3.745612411565569e-07, "loss": 0.7643, "step": 43929 }, { "epoch": 0.83, "learning_rate": 3.7448081416350424e-07, "loss": 1.0284, "step": 43930 }, { "epoch": 0.83, "learning_rate": 3.74400395107076e-07, "loss": 0.9663, "step": 43931 }, { "epoch": 0.83, "learning_rate": 3.743199839875711e-07, "loss": 1.0593, "step": 43932 }, { "epoch": 0.83, "learning_rate": 3.742395808052904e-07, "loss": 0.7243, "step": 43933 }, { "epoch": 0.83, "learning_rate": 3.7415918556053365e-07, "loss": 0.8424, "step": 43934 }, { "epoch": 0.83, "learning_rate": 3.740787982536012e-07, "loss": 0.8707, "step": 43935 }, { "epoch": 0.83, "learning_rate": 3.7399841888479364e-07, "loss": 0.8886, "step": 43936 }, { "epoch": 0.83, "learning_rate": 3.7391804745441074e-07, "loss": 0.9481, "step": 43937 }, { "epoch": 0.83, "learning_rate": 3.7383768396275303e-07, "loss": 0.9284, "step": 43938 }, { "epoch": 0.83, "learning_rate": 3.7375732841011925e-07, "loss": 1.0316, "step": 43939 }, { "epoch": 0.83, "learning_rate": 3.7367698079681157e-07, "loss": 0.8098, "step": 43940 }, { "epoch": 0.83, "learning_rate": 3.7359664112312815e-07, "loss": 0.9277, "step": 43941 }, { "epoch": 0.83, "learning_rate": 3.7351630938936985e-07, "loss": 0.8726, "step": 43942 }, { "epoch": 0.83, "learning_rate": 3.7343598559583636e-07, "loss": 1.0582, "step": 43943 }, { "epoch": 0.83, "learning_rate": 3.7335566974282785e-07, "loss": 1.0435, "step": 43944 }, { "epoch": 0.83, "learning_rate": 3.732753618306437e-07, "loss": 1.0005, "step": 43945 }, { "epoch": 0.83, "learning_rate": 3.731950618595845e-07, "loss": 0.7903, "step": 43946 }, { "epoch": 0.83, "learning_rate": 3.7311476982995006e-07, "loss": 0.8651, "step": 43947 }, { "epoch": 0.83, "learning_rate": 3.7303448574203873e-07, "loss": 0.9263, "step": 43948 }, { "epoch": 0.83, "learning_rate": 3.7295420959615273e-07, "loss": 1.0794, "step": 43949 }, { "epoch": 0.83, "learning_rate": 3.7287394139258996e-07, "loss": 1.1073, "step": 43950 }, { "epoch": 0.83, "learning_rate": 3.727936811316499e-07, "loss": 0.8985, "step": 43951 }, { "epoch": 0.83, "learning_rate": 3.727134288136342e-07, "loss": 0.9615, "step": 43952 }, { "epoch": 0.83, "learning_rate": 3.7263318443884087e-07, "loss": 0.8114, "step": 43953 }, { "epoch": 0.83, "learning_rate": 3.7255294800756986e-07, "loss": 0.853, "step": 43954 }, { "epoch": 0.83, "learning_rate": 3.724727195201211e-07, "loss": 1.192, "step": 43955 }, { "epoch": 0.83, "learning_rate": 3.723924989767938e-07, "loss": 1.182, "step": 43956 }, { "epoch": 0.83, "learning_rate": 3.723122863778877e-07, "loss": 0.8462, "step": 43957 }, { "epoch": 0.83, "learning_rate": 3.722320817237024e-07, "loss": 1.0187, "step": 43958 }, { "epoch": 0.83, "learning_rate": 3.7215188501453754e-07, "loss": 0.8856, "step": 43959 }, { "epoch": 0.83, "learning_rate": 3.720716962506915e-07, "loss": 0.7675, "step": 43960 }, { "epoch": 0.83, "learning_rate": 3.7199151543246546e-07, "loss": 0.8273, "step": 43961 }, { "epoch": 0.83, "learning_rate": 3.719113425601573e-07, "loss": 0.9998, "step": 43962 }, { "epoch": 0.83, "learning_rate": 3.7183117763406716e-07, "loss": 0.9836, "step": 43963 }, { "epoch": 0.83, "learning_rate": 3.7175102065449386e-07, "loss": 0.8088, "step": 43964 }, { "epoch": 0.83, "learning_rate": 3.716708716217371e-07, "loss": 0.8768, "step": 43965 }, { "epoch": 0.83, "learning_rate": 3.7159073053609605e-07, "loss": 0.7121, "step": 43966 }, { "epoch": 0.83, "learning_rate": 3.7151059739787e-07, "loss": 1.0204, "step": 43967 }, { "epoch": 0.83, "learning_rate": 3.714304722073586e-07, "loss": 0.9844, "step": 43968 }, { "epoch": 0.83, "learning_rate": 3.713503549648595e-07, "loss": 0.9691, "step": 43969 }, { "epoch": 0.83, "learning_rate": 3.71270245670674e-07, "loss": 0.9536, "step": 43970 }, { "epoch": 0.83, "learning_rate": 3.7119014432509953e-07, "loss": 0.9767, "step": 43971 }, { "epoch": 0.83, "learning_rate": 3.7111005092843516e-07, "loss": 0.7721, "step": 43972 }, { "epoch": 0.83, "learning_rate": 3.710299654809821e-07, "loss": 0.7421, "step": 43973 }, { "epoch": 0.83, "learning_rate": 3.70949887983037e-07, "loss": 1.0068, "step": 43974 }, { "epoch": 0.83, "learning_rate": 3.7086981843489966e-07, "loss": 0.8929, "step": 43975 }, { "epoch": 0.83, "learning_rate": 3.707897568368693e-07, "loss": 0.8634, "step": 43976 }, { "epoch": 0.83, "learning_rate": 3.707097031892445e-07, "loss": 0.9804, "step": 43977 }, { "epoch": 0.83, "learning_rate": 3.706296574923246e-07, "loss": 0.9373, "step": 43978 }, { "epoch": 0.83, "learning_rate": 3.705496197464084e-07, "loss": 0.771, "step": 43979 }, { "epoch": 0.83, "learning_rate": 3.704695899517949e-07, "loss": 0.7181, "step": 43980 }, { "epoch": 0.83, "learning_rate": 3.703895681087816e-07, "loss": 1.1216, "step": 43981 }, { "epoch": 0.83, "learning_rate": 3.7030955421766964e-07, "loss": 0.7576, "step": 43982 }, { "epoch": 0.83, "learning_rate": 3.7022954827875574e-07, "loss": 1.0283, "step": 43983 }, { "epoch": 0.83, "learning_rate": 3.701495502923394e-07, "loss": 0.9127, "step": 43984 }, { "epoch": 0.83, "learning_rate": 3.7006956025871957e-07, "loss": 0.7657, "step": 43985 }, { "epoch": 0.83, "learning_rate": 3.6998957817819455e-07, "loss": 0.8976, "step": 43986 }, { "epoch": 0.83, "learning_rate": 3.69909604051063e-07, "loss": 1.1925, "step": 43987 }, { "epoch": 0.83, "learning_rate": 3.6982963787762394e-07, "loss": 0.996, "step": 43988 }, { "epoch": 0.83, "learning_rate": 3.697496796581762e-07, "loss": 0.8941, "step": 43989 }, { "epoch": 0.83, "learning_rate": 3.6966972939301653e-07, "loss": 0.7534, "step": 43990 }, { "epoch": 0.83, "learning_rate": 3.695897870824461e-07, "loss": 0.8234, "step": 43991 }, { "epoch": 0.83, "learning_rate": 3.6950985272676155e-07, "loss": 0.9146, "step": 43992 }, { "epoch": 0.83, "learning_rate": 3.69429926326261e-07, "loss": 1.1488, "step": 43993 }, { "epoch": 0.83, "learning_rate": 3.6935000788124507e-07, "loss": 0.9092, "step": 43994 }, { "epoch": 0.83, "learning_rate": 3.6927009739201045e-07, "loss": 0.7646, "step": 43995 }, { "epoch": 0.83, "learning_rate": 3.691901948588561e-07, "loss": 0.8091, "step": 43996 }, { "epoch": 0.83, "learning_rate": 3.691103002820798e-07, "loss": 0.8221, "step": 43997 }, { "epoch": 0.83, "learning_rate": 3.6903041366198074e-07, "loss": 0.8688, "step": 43998 }, { "epoch": 0.83, "learning_rate": 3.6895053499885647e-07, "loss": 0.8586, "step": 43999 }, { "epoch": 0.83, "learning_rate": 3.6887066429300566e-07, "loss": 1.1246, "step": 44000 }, { "epoch": 0.83, "learning_rate": 3.6879080154472694e-07, "loss": 1.037, "step": 44001 }, { "epoch": 0.83, "learning_rate": 3.6871094675431705e-07, "loss": 0.6849, "step": 44002 }, { "epoch": 0.83, "learning_rate": 3.6863109992207605e-07, "loss": 0.7681, "step": 44003 }, { "epoch": 0.83, "learning_rate": 3.685512610483008e-07, "loss": 0.8133, "step": 44004 }, { "epoch": 0.83, "learning_rate": 3.684714301332898e-07, "loss": 1.1569, "step": 44005 }, { "epoch": 0.83, "learning_rate": 3.6839160717734105e-07, "loss": 0.9733, "step": 44006 }, { "epoch": 0.83, "learning_rate": 3.6831179218075247e-07, "loss": 1.1859, "step": 44007 }, { "epoch": 0.83, "learning_rate": 3.682319851438232e-07, "loss": 0.879, "step": 44008 }, { "epoch": 0.83, "learning_rate": 3.681521860668491e-07, "loss": 0.9286, "step": 44009 }, { "epoch": 0.83, "learning_rate": 3.680723949501305e-07, "loss": 0.8837, "step": 44010 }, { "epoch": 0.83, "learning_rate": 3.6799261179396363e-07, "loss": 0.7855, "step": 44011 }, { "epoch": 0.83, "learning_rate": 3.6791283659864703e-07, "loss": 0.8718, "step": 44012 }, { "epoch": 0.83, "learning_rate": 3.6783306936447854e-07, "loss": 0.8093, "step": 44013 }, { "epoch": 0.83, "learning_rate": 3.6775331009175573e-07, "loss": 0.803, "step": 44014 }, { "epoch": 0.83, "learning_rate": 3.6767355878077697e-07, "loss": 0.856, "step": 44015 }, { "epoch": 0.83, "learning_rate": 3.675938154318398e-07, "loss": 0.7828, "step": 44016 }, { "epoch": 0.83, "learning_rate": 3.675140800452423e-07, "loss": 0.873, "step": 44017 }, { "epoch": 0.83, "learning_rate": 3.6743435262128063e-07, "loss": 1.1481, "step": 44018 }, { "epoch": 0.83, "learning_rate": 3.6735463316025455e-07, "loss": 1.0649, "step": 44019 }, { "epoch": 0.83, "learning_rate": 3.6727492166246133e-07, "loss": 0.9128, "step": 44020 }, { "epoch": 0.83, "learning_rate": 3.671952181281971e-07, "loss": 0.8023, "step": 44021 }, { "epoch": 0.83, "learning_rate": 3.671155225577616e-07, "loss": 0.7642, "step": 44022 }, { "epoch": 0.83, "learning_rate": 3.670358349514508e-07, "loss": 0.8492, "step": 44023 }, { "epoch": 0.83, "learning_rate": 3.6695615530956267e-07, "loss": 0.9147, "step": 44024 }, { "epoch": 0.83, "learning_rate": 3.6687648363239487e-07, "loss": 1.0099, "step": 44025 }, { "epoch": 0.83, "learning_rate": 3.667968199202451e-07, "loss": 1.0831, "step": 44026 }, { "epoch": 0.83, "learning_rate": 3.667171641734105e-07, "loss": 0.8249, "step": 44027 }, { "epoch": 0.83, "learning_rate": 3.666375163921884e-07, "loss": 0.7659, "step": 44028 }, { "epoch": 0.83, "learning_rate": 3.6655787657687734e-07, "loss": 0.8371, "step": 44029 }, { "epoch": 0.83, "learning_rate": 3.664782447277723e-07, "loss": 0.8509, "step": 44030 }, { "epoch": 0.83, "learning_rate": 3.6639862084517336e-07, "loss": 0.9966, "step": 44031 }, { "epoch": 0.83, "learning_rate": 3.6631900492937604e-07, "loss": 1.0897, "step": 44032 }, { "epoch": 0.83, "learning_rate": 3.6623939698067797e-07, "loss": 0.6676, "step": 44033 }, { "epoch": 0.83, "learning_rate": 3.661597969993766e-07, "loss": 1.1137, "step": 44034 }, { "epoch": 0.83, "learning_rate": 3.660802049857692e-07, "loss": 0.767, "step": 44035 }, { "epoch": 0.83, "learning_rate": 3.660006209401529e-07, "loss": 0.8295, "step": 44036 }, { "epoch": 0.83, "learning_rate": 3.659210448628248e-07, "loss": 1.0684, "step": 44037 }, { "epoch": 0.83, "learning_rate": 3.6584147675408273e-07, "loss": 0.8149, "step": 44038 }, { "epoch": 0.83, "learning_rate": 3.657619166142218e-07, "loss": 0.7576, "step": 44039 }, { "epoch": 0.83, "learning_rate": 3.6568236444354116e-07, "loss": 0.8264, "step": 44040 }, { "epoch": 0.83, "learning_rate": 3.656028202423378e-07, "loss": 0.7949, "step": 44041 }, { "epoch": 0.83, "learning_rate": 3.655232840109069e-07, "loss": 0.8175, "step": 44042 }, { "epoch": 0.83, "learning_rate": 3.6544375574954743e-07, "loss": 1.0599, "step": 44043 }, { "epoch": 0.83, "learning_rate": 3.653642354585554e-07, "loss": 0.671, "step": 44044 }, { "epoch": 0.83, "learning_rate": 3.6528472313822755e-07, "loss": 0.7416, "step": 44045 }, { "epoch": 0.83, "learning_rate": 3.6520521878886136e-07, "loss": 0.9825, "step": 44046 }, { "epoch": 0.83, "learning_rate": 3.651257224107532e-07, "loss": 0.9293, "step": 44047 }, { "epoch": 0.83, "learning_rate": 3.6504623400420017e-07, "loss": 0.8455, "step": 44048 }, { "epoch": 0.83, "learning_rate": 3.6496675356949894e-07, "loss": 1.0446, "step": 44049 }, { "epoch": 0.83, "learning_rate": 3.648872811069473e-07, "loss": 1.0178, "step": 44050 }, { "epoch": 0.83, "learning_rate": 3.648078166168398e-07, "loss": 0.7231, "step": 44051 }, { "epoch": 0.83, "learning_rate": 3.6472836009947554e-07, "loss": 0.7796, "step": 44052 }, { "epoch": 0.83, "learning_rate": 3.6464891155514936e-07, "loss": 0.8355, "step": 44053 }, { "epoch": 0.83, "learning_rate": 3.645694709841591e-07, "loss": 0.7651, "step": 44054 }, { "epoch": 0.83, "learning_rate": 3.6449003838680054e-07, "loss": 1.0271, "step": 44055 }, { "epoch": 0.83, "learning_rate": 3.64410613763371e-07, "loss": 1.2712, "step": 44056 }, { "epoch": 0.83, "learning_rate": 3.6433119711416663e-07, "loss": 0.9127, "step": 44057 }, { "epoch": 0.83, "learning_rate": 3.642517884394839e-07, "loss": 0.9389, "step": 44058 }, { "epoch": 0.83, "learning_rate": 3.6417238773962026e-07, "loss": 0.9632, "step": 44059 }, { "epoch": 0.83, "learning_rate": 3.6409299501487055e-07, "loss": 0.7844, "step": 44060 }, { "epoch": 0.83, "learning_rate": 3.640136102655323e-07, "loss": 0.7926, "step": 44061 }, { "epoch": 0.83, "learning_rate": 3.639342334919024e-07, "loss": 0.7073, "step": 44062 }, { "epoch": 0.83, "learning_rate": 3.638548646942755e-07, "loss": 1.0922, "step": 44063 }, { "epoch": 0.83, "learning_rate": 3.6377550387295013e-07, "loss": 0.9668, "step": 44064 }, { "epoch": 0.83, "learning_rate": 3.636961510282211e-07, "loss": 0.9229, "step": 44065 }, { "epoch": 0.83, "learning_rate": 3.636168061603851e-07, "loss": 0.6783, "step": 44066 }, { "epoch": 0.83, "learning_rate": 3.6353746926973824e-07, "loss": 0.8284, "step": 44067 }, { "epoch": 0.83, "learning_rate": 3.634581403565771e-07, "loss": 1.2341, "step": 44068 }, { "epoch": 0.83, "learning_rate": 3.633788194211979e-07, "loss": 0.9371, "step": 44069 }, { "epoch": 0.83, "learning_rate": 3.6329950646389637e-07, "loss": 0.862, "step": 44070 }, { "epoch": 0.83, "learning_rate": 3.632202014849698e-07, "loss": 0.8564, "step": 44071 }, { "epoch": 0.83, "learning_rate": 3.631409044847123e-07, "loss": 0.7696, "step": 44072 }, { "epoch": 0.83, "learning_rate": 3.6306161546342227e-07, "loss": 0.8299, "step": 44073 }, { "epoch": 0.83, "learning_rate": 3.6298233442139395e-07, "loss": 0.9343, "step": 44074 }, { "epoch": 0.83, "learning_rate": 3.6290306135892406e-07, "loss": 1.1288, "step": 44075 }, { "epoch": 0.83, "learning_rate": 3.628237962763087e-07, "loss": 0.9306, "step": 44076 }, { "epoch": 0.83, "learning_rate": 3.627445391738438e-07, "loss": 0.8054, "step": 44077 }, { "epoch": 0.83, "learning_rate": 3.626652900518254e-07, "loss": 0.843, "step": 44078 }, { "epoch": 0.83, "learning_rate": 3.62586048910549e-07, "loss": 0.7663, "step": 44079 }, { "epoch": 0.83, "learning_rate": 3.6250681575031144e-07, "loss": 0.7612, "step": 44080 }, { "epoch": 0.83, "learning_rate": 3.624275905714067e-07, "loss": 0.9507, "step": 44081 }, { "epoch": 0.83, "learning_rate": 3.623483733741326e-07, "loss": 0.8347, "step": 44082 }, { "epoch": 0.83, "learning_rate": 3.6226916415878444e-07, "loss": 0.806, "step": 44083 }, { "epoch": 0.83, "learning_rate": 3.621899629256567e-07, "loss": 0.8712, "step": 44084 }, { "epoch": 0.83, "learning_rate": 3.6211076967504697e-07, "loss": 0.7389, "step": 44085 }, { "epoch": 0.83, "learning_rate": 3.6203158440724973e-07, "loss": 0.8917, "step": 44086 }, { "epoch": 0.83, "learning_rate": 3.619524071225611e-07, "loss": 1.2275, "step": 44087 }, { "epoch": 0.83, "learning_rate": 3.6187323782127636e-07, "loss": 1.1498, "step": 44088 }, { "epoch": 0.83, "learning_rate": 3.6179407650369145e-07, "loss": 1.0754, "step": 44089 }, { "epoch": 0.83, "learning_rate": 3.61714923170102e-07, "loss": 0.9195, "step": 44090 }, { "epoch": 0.83, "learning_rate": 3.616357778208035e-07, "loss": 1.09, "step": 44091 }, { "epoch": 0.83, "learning_rate": 3.615566404560919e-07, "loss": 0.7508, "step": 44092 }, { "epoch": 0.83, "learning_rate": 3.6147751107626113e-07, "loss": 1.0555, "step": 44093 }, { "epoch": 0.83, "learning_rate": 3.61398389681609e-07, "loss": 0.9644, "step": 44094 }, { "epoch": 0.83, "learning_rate": 3.6131927627242907e-07, "loss": 0.7713, "step": 44095 }, { "epoch": 0.83, "learning_rate": 3.6124017084901734e-07, "loss": 0.8319, "step": 44096 }, { "epoch": 0.83, "learning_rate": 3.611610734116694e-07, "loss": 0.8159, "step": 44097 }, { "epoch": 0.83, "learning_rate": 3.6108198396068025e-07, "loss": 0.9355, "step": 44098 }, { "epoch": 0.83, "learning_rate": 3.6100290249634543e-07, "loss": 0.803, "step": 44099 }, { "epoch": 0.83, "learning_rate": 3.609238290189601e-07, "loss": 1.0539, "step": 44100 }, { "epoch": 0.83, "learning_rate": 3.6084476352882036e-07, "loss": 0.9997, "step": 44101 }, { "epoch": 0.83, "learning_rate": 3.607657060262196e-07, "loss": 0.9371, "step": 44102 }, { "epoch": 0.83, "learning_rate": 3.6068665651145446e-07, "loss": 1.1172, "step": 44103 }, { "epoch": 0.83, "learning_rate": 3.6060761498482035e-07, "loss": 0.9193, "step": 44104 }, { "epoch": 0.83, "learning_rate": 3.6052858144661083e-07, "loss": 1.0226, "step": 44105 }, { "epoch": 0.83, "learning_rate": 3.60449555897123e-07, "loss": 1.1809, "step": 44106 }, { "epoch": 0.83, "learning_rate": 3.603705383366504e-07, "loss": 1.005, "step": 44107 }, { "epoch": 0.83, "learning_rate": 3.602915287654887e-07, "loss": 0.9255, "step": 44108 }, { "epoch": 0.83, "learning_rate": 3.602125271839327e-07, "loss": 0.8727, "step": 44109 }, { "epoch": 0.83, "learning_rate": 3.601335335922776e-07, "loss": 0.7757, "step": 44110 }, { "epoch": 0.83, "learning_rate": 3.60054547990818e-07, "loss": 1.055, "step": 44111 }, { "epoch": 0.83, "learning_rate": 3.599755703798494e-07, "loss": 0.8975, "step": 44112 }, { "epoch": 0.83, "learning_rate": 3.598966007596669e-07, "loss": 0.8285, "step": 44113 }, { "epoch": 0.83, "learning_rate": 3.5981763913056384e-07, "loss": 0.8171, "step": 44114 }, { "epoch": 0.83, "learning_rate": 3.5973868549283697e-07, "loss": 0.9742, "step": 44115 }, { "epoch": 0.83, "learning_rate": 3.5965973984677993e-07, "loss": 0.9773, "step": 44116 }, { "epoch": 0.83, "learning_rate": 3.5958080219268776e-07, "loss": 0.7142, "step": 44117 }, { "epoch": 0.83, "learning_rate": 3.5950187253085495e-07, "loss": 1.067, "step": 44118 }, { "epoch": 0.83, "learning_rate": 3.594229508615768e-07, "loss": 0.9474, "step": 44119 }, { "epoch": 0.83, "learning_rate": 3.593440371851478e-07, "loss": 0.8864, "step": 44120 }, { "epoch": 0.83, "learning_rate": 3.592651315018622e-07, "loss": 0.8755, "step": 44121 }, { "epoch": 0.83, "learning_rate": 3.5918623381201583e-07, "loss": 0.9719, "step": 44122 }, { "epoch": 0.83, "learning_rate": 3.5910734411590126e-07, "loss": 0.7549, "step": 44123 }, { "epoch": 0.83, "learning_rate": 3.590284624138146e-07, "loss": 0.9331, "step": 44124 }, { "epoch": 0.83, "learning_rate": 3.589495887060507e-07, "loss": 1.0042, "step": 44125 }, { "epoch": 0.83, "learning_rate": 3.5887072299290225e-07, "loss": 0.8069, "step": 44126 }, { "epoch": 0.83, "learning_rate": 3.587918652746661e-07, "loss": 0.9504, "step": 44127 }, { "epoch": 0.83, "learning_rate": 3.587130155516347e-07, "loss": 0.9901, "step": 44128 }, { "epoch": 0.83, "learning_rate": 3.5863417382410337e-07, "loss": 0.5419, "step": 44129 }, { "epoch": 0.83, "learning_rate": 3.585553400923664e-07, "loss": 1.1147, "step": 44130 }, { "epoch": 0.83, "learning_rate": 3.5847651435671816e-07, "loss": 1.2322, "step": 44131 }, { "epoch": 0.83, "learning_rate": 3.5839769661745297e-07, "loss": 0.9219, "step": 44132 }, { "epoch": 0.83, "learning_rate": 3.5831888687486495e-07, "loss": 1.1361, "step": 44133 }, { "epoch": 0.83, "learning_rate": 3.582400851292492e-07, "loss": 0.9044, "step": 44134 }, { "epoch": 0.83, "learning_rate": 3.581612913808982e-07, "loss": 0.8365, "step": 44135 }, { "epoch": 0.83, "learning_rate": 3.580825056301082e-07, "loss": 0.7036, "step": 44136 }, { "epoch": 0.83, "learning_rate": 3.5800372787717226e-07, "loss": 0.9822, "step": 44137 }, { "epoch": 0.83, "learning_rate": 3.579249581223845e-07, "loss": 0.7845, "step": 44138 }, { "epoch": 0.83, "learning_rate": 3.5784619636603926e-07, "loss": 0.885, "step": 44139 }, { "epoch": 0.83, "learning_rate": 3.577674426084307e-07, "loss": 0.9145, "step": 44140 }, { "epoch": 0.83, "learning_rate": 3.576886968498527e-07, "loss": 0.8542, "step": 44141 }, { "epoch": 0.83, "learning_rate": 3.576099590905996e-07, "loss": 0.615, "step": 44142 }, { "epoch": 0.83, "learning_rate": 3.5753122933096575e-07, "loss": 0.9391, "step": 44143 }, { "epoch": 0.83, "learning_rate": 3.5745250757124347e-07, "loss": 0.9248, "step": 44144 }, { "epoch": 0.83, "learning_rate": 3.573737938117283e-07, "loss": 0.8861, "step": 44145 }, { "epoch": 0.83, "learning_rate": 3.572950880527143e-07, "loss": 0.9082, "step": 44146 }, { "epoch": 0.83, "learning_rate": 3.572163902944936e-07, "loss": 1.038, "step": 44147 }, { "epoch": 0.83, "learning_rate": 3.5713770053736247e-07, "loss": 0.9326, "step": 44148 }, { "epoch": 0.83, "learning_rate": 3.570590187816128e-07, "loss": 1.1027, "step": 44149 }, { "epoch": 0.83, "learning_rate": 3.569803450275389e-07, "loss": 1.0534, "step": 44150 }, { "epoch": 0.83, "learning_rate": 3.5690167927543487e-07, "loss": 0.9323, "step": 44151 }, { "epoch": 0.83, "learning_rate": 3.568230215255944e-07, "loss": 0.7909, "step": 44152 }, { "epoch": 0.83, "learning_rate": 3.567443717783109e-07, "loss": 0.882, "step": 44153 }, { "epoch": 0.83, "learning_rate": 3.56665730033878e-07, "loss": 0.7712, "step": 44154 }, { "epoch": 0.83, "learning_rate": 3.565870962925905e-07, "loss": 0.9417, "step": 44155 }, { "epoch": 0.83, "learning_rate": 3.5650847055473947e-07, "loss": 0.9331, "step": 44156 }, { "epoch": 0.83, "learning_rate": 3.564298528206217e-07, "loss": 0.9316, "step": 44157 }, { "epoch": 0.83, "learning_rate": 3.5635124309052833e-07, "loss": 0.9248, "step": 44158 }, { "epoch": 0.83, "learning_rate": 3.5627264136475356e-07, "loss": 0.9553, "step": 44159 }, { "epoch": 0.83, "learning_rate": 3.561940476435913e-07, "loss": 0.8633, "step": 44160 }, { "epoch": 0.83, "learning_rate": 3.561154619273346e-07, "loss": 0.8403, "step": 44161 }, { "epoch": 0.83, "learning_rate": 3.5603688421627703e-07, "loss": 1.0568, "step": 44162 }, { "epoch": 0.83, "learning_rate": 3.5595831451071205e-07, "loss": 0.9662, "step": 44163 }, { "epoch": 0.83, "learning_rate": 3.558797528109334e-07, "loss": 0.9751, "step": 44164 }, { "epoch": 0.83, "learning_rate": 3.55801199117233e-07, "loss": 0.9057, "step": 44165 }, { "epoch": 0.83, "learning_rate": 3.5572265342990575e-07, "loss": 1.0392, "step": 44166 }, { "epoch": 0.83, "learning_rate": 3.556441157492449e-07, "loss": 0.9094, "step": 44167 }, { "epoch": 0.83, "learning_rate": 3.555655860755419e-07, "loss": 1.0842, "step": 44168 }, { "epoch": 0.83, "learning_rate": 3.5548706440909267e-07, "loss": 0.8823, "step": 44169 }, { "epoch": 0.83, "learning_rate": 3.554085507501884e-07, "loss": 1.005, "step": 44170 }, { "epoch": 0.83, "learning_rate": 3.553300450991226e-07, "loss": 0.8443, "step": 44171 }, { "epoch": 0.83, "learning_rate": 3.5525154745618877e-07, "loss": 0.7907, "step": 44172 }, { "epoch": 0.83, "learning_rate": 3.5517305782168e-07, "loss": 0.9552, "step": 44173 }, { "epoch": 0.83, "learning_rate": 3.5509457619588935e-07, "loss": 0.9388, "step": 44174 }, { "epoch": 0.83, "learning_rate": 3.550161025791096e-07, "loss": 1.0733, "step": 44175 }, { "epoch": 0.83, "learning_rate": 3.5493763697163454e-07, "loss": 0.7144, "step": 44176 }, { "epoch": 0.83, "learning_rate": 3.548591793737555e-07, "loss": 0.9234, "step": 44177 }, { "epoch": 0.83, "learning_rate": 3.547807297857675e-07, "loss": 0.9883, "step": 44178 }, { "epoch": 0.83, "learning_rate": 3.5470228820796205e-07, "loss": 0.8704, "step": 44179 }, { "epoch": 0.83, "learning_rate": 3.546238546406325e-07, "loss": 0.8985, "step": 44180 }, { "epoch": 0.83, "learning_rate": 3.545454290840716e-07, "loss": 1.0788, "step": 44181 }, { "epoch": 0.83, "learning_rate": 3.5446701153857233e-07, "loss": 0.9568, "step": 44182 }, { "epoch": 0.83, "learning_rate": 3.543886020044274e-07, "loss": 0.8521, "step": 44183 }, { "epoch": 0.83, "learning_rate": 3.5431020048192986e-07, "loss": 0.8848, "step": 44184 }, { "epoch": 0.83, "learning_rate": 3.542318069713727e-07, "loss": 0.8948, "step": 44185 }, { "epoch": 0.83, "learning_rate": 3.541534214730469e-07, "loss": 0.8177, "step": 44186 }, { "epoch": 0.83, "learning_rate": 3.54075043987247e-07, "loss": 1.1301, "step": 44187 }, { "epoch": 0.83, "learning_rate": 3.539966745142659e-07, "loss": 0.8921, "step": 44188 }, { "epoch": 0.83, "learning_rate": 3.5391831305439413e-07, "loss": 0.7463, "step": 44189 }, { "epoch": 0.83, "learning_rate": 3.538399596079267e-07, "loss": 0.7168, "step": 44190 }, { "epoch": 0.83, "learning_rate": 3.537616141751546e-07, "loss": 0.7753, "step": 44191 }, { "epoch": 0.83, "learning_rate": 3.5368327675637056e-07, "loss": 0.7482, "step": 44192 }, { "epoch": 0.83, "learning_rate": 3.536049473518677e-07, "loss": 0.765, "step": 44193 }, { "epoch": 0.83, "learning_rate": 3.53526625961938e-07, "loss": 1.1296, "step": 44194 }, { "epoch": 0.83, "learning_rate": 3.5344831258687403e-07, "loss": 0.7517, "step": 44195 }, { "epoch": 0.83, "learning_rate": 3.5337000722696827e-07, "loss": 0.8828, "step": 44196 }, { "epoch": 0.83, "learning_rate": 3.5329170988251364e-07, "loss": 0.893, "step": 44197 }, { "epoch": 0.83, "learning_rate": 3.53213420553801e-07, "loss": 0.6691, "step": 44198 }, { "epoch": 0.83, "learning_rate": 3.531351392411245e-07, "loss": 1.0402, "step": 44199 }, { "epoch": 0.83, "learning_rate": 3.53056865944775e-07, "loss": 1.095, "step": 44200 }, { "epoch": 0.83, "learning_rate": 3.529786006650454e-07, "loss": 0.9496, "step": 44201 }, { "epoch": 0.83, "learning_rate": 3.5290034340222796e-07, "loss": 0.8857, "step": 44202 }, { "epoch": 0.83, "learning_rate": 3.528220941566149e-07, "loss": 0.8156, "step": 44203 }, { "epoch": 0.83, "learning_rate": 3.527438529284982e-07, "loss": 0.8117, "step": 44204 }, { "epoch": 0.83, "learning_rate": 3.5266561971816994e-07, "loss": 0.9516, "step": 44205 }, { "epoch": 0.83, "learning_rate": 3.525873945259231e-07, "loss": 1.0419, "step": 44206 }, { "epoch": 0.83, "learning_rate": 3.5250917735204807e-07, "loss": 1.1605, "step": 44207 }, { "epoch": 0.83, "learning_rate": 3.5243096819683823e-07, "loss": 0.5634, "step": 44208 }, { "epoch": 0.83, "learning_rate": 3.5235276706058613e-07, "loss": 0.7046, "step": 44209 }, { "epoch": 0.83, "learning_rate": 3.5227457394358177e-07, "loss": 0.6887, "step": 44210 }, { "epoch": 0.83, "learning_rate": 3.521963888461194e-07, "loss": 0.7742, "step": 44211 }, { "epoch": 0.83, "learning_rate": 3.521182117684893e-07, "loss": 0.9995, "step": 44212 }, { "epoch": 0.83, "learning_rate": 3.5204004271098407e-07, "loss": 0.874, "step": 44213 }, { "epoch": 0.83, "learning_rate": 3.519618816738951e-07, "loss": 0.8307, "step": 44214 }, { "epoch": 0.83, "learning_rate": 3.5188372865751496e-07, "loss": 0.6899, "step": 44215 }, { "epoch": 0.83, "learning_rate": 3.5180558366213507e-07, "loss": 0.947, "step": 44216 }, { "epoch": 0.83, "learning_rate": 3.517274466880471e-07, "loss": 0.8221, "step": 44217 }, { "epoch": 0.83, "learning_rate": 3.5164931773554373e-07, "loss": 1.1847, "step": 44218 }, { "epoch": 0.83, "learning_rate": 3.5157119680491457e-07, "loss": 1.2008, "step": 44219 }, { "epoch": 0.83, "learning_rate": 3.514930838964539e-07, "loss": 0.8862, "step": 44220 }, { "epoch": 0.83, "learning_rate": 3.514149790104518e-07, "loss": 0.8826, "step": 44221 }, { "epoch": 0.83, "learning_rate": 3.513368821472002e-07, "loss": 0.9603, "step": 44222 }, { "epoch": 0.83, "learning_rate": 3.512587933069905e-07, "loss": 0.6786, "step": 44223 }, { "epoch": 0.83, "learning_rate": 3.511807124901151e-07, "loss": 1.0225, "step": 44224 }, { "epoch": 0.83, "learning_rate": 3.5110263969686476e-07, "loss": 1.063, "step": 44225 }, { "epoch": 0.83, "learning_rate": 3.5102457492753125e-07, "loss": 0.9976, "step": 44226 }, { "epoch": 0.83, "learning_rate": 3.5094651818240677e-07, "loss": 1.0078, "step": 44227 }, { "epoch": 0.83, "learning_rate": 3.508684694617809e-07, "loss": 1.0283, "step": 44228 }, { "epoch": 0.83, "learning_rate": 3.5079042876594664e-07, "loss": 0.9796, "step": 44229 }, { "epoch": 0.83, "learning_rate": 3.507123960951958e-07, "loss": 1.0563, "step": 44230 }, { "epoch": 0.83, "learning_rate": 3.5063437144981784e-07, "loss": 1.1003, "step": 44231 }, { "epoch": 0.83, "learning_rate": 3.5055635483010636e-07, "loss": 0.8494, "step": 44232 }, { "epoch": 0.83, "learning_rate": 3.504783462363509e-07, "loss": 0.8198, "step": 44233 }, { "epoch": 0.83, "learning_rate": 3.5040034566884347e-07, "loss": 1.0268, "step": 44234 }, { "epoch": 0.83, "learning_rate": 3.5032235312787544e-07, "loss": 0.9208, "step": 44235 }, { "epoch": 0.83, "learning_rate": 3.502443686137375e-07, "loss": 1.0219, "step": 44236 }, { "epoch": 0.83, "learning_rate": 3.501663921267212e-07, "loss": 1.0786, "step": 44237 }, { "epoch": 0.83, "learning_rate": 3.500884236671179e-07, "loss": 0.9114, "step": 44238 }, { "epoch": 0.83, "learning_rate": 3.5001046323521886e-07, "loss": 0.9109, "step": 44239 }, { "epoch": 0.83, "learning_rate": 3.499325108313145e-07, "loss": 0.9163, "step": 44240 }, { "epoch": 0.83, "learning_rate": 3.4985456645569596e-07, "loss": 0.8134, "step": 44241 }, { "epoch": 0.83, "learning_rate": 3.497766301086547e-07, "loss": 0.7936, "step": 44242 }, { "epoch": 0.83, "learning_rate": 3.4969870179048155e-07, "loss": 0.981, "step": 44243 }, { "epoch": 0.83, "learning_rate": 3.4962078150146765e-07, "loss": 0.9739, "step": 44244 }, { "epoch": 0.83, "learning_rate": 3.495428692419037e-07, "loss": 1.0175, "step": 44245 }, { "epoch": 0.83, "learning_rate": 3.4946496501208125e-07, "loss": 0.9294, "step": 44246 }, { "epoch": 0.83, "learning_rate": 3.493870688122894e-07, "loss": 0.7807, "step": 44247 }, { "epoch": 0.83, "learning_rate": 3.493091806428217e-07, "loss": 0.8654, "step": 44248 }, { "epoch": 0.83, "learning_rate": 3.492313005039669e-07, "loss": 1.0404, "step": 44249 }, { "epoch": 0.83, "learning_rate": 3.4915342839601603e-07, "loss": 0.9262, "step": 44250 }, { "epoch": 0.83, "learning_rate": 3.4907556431926144e-07, "loss": 0.7116, "step": 44251 }, { "epoch": 0.83, "learning_rate": 3.4899770827399204e-07, "loss": 0.9135, "step": 44252 }, { "epoch": 0.83, "learning_rate": 3.4891986026049926e-07, "loss": 0.9459, "step": 44253 }, { "epoch": 0.83, "learning_rate": 3.4884202027907376e-07, "loss": 0.9327, "step": 44254 }, { "epoch": 0.83, "learning_rate": 3.4876418833000637e-07, "loss": 1.0294, "step": 44255 }, { "epoch": 0.83, "learning_rate": 3.4868636441358737e-07, "loss": 1.0859, "step": 44256 }, { "epoch": 0.83, "learning_rate": 3.4860854853010744e-07, "loss": 0.912, "step": 44257 }, { "epoch": 0.84, "learning_rate": 3.4853074067985797e-07, "loss": 0.9318, "step": 44258 }, { "epoch": 0.84, "learning_rate": 3.4845294086312763e-07, "loss": 0.8138, "step": 44259 }, { "epoch": 0.84, "learning_rate": 3.4837514908020897e-07, "loss": 0.6208, "step": 44260 }, { "epoch": 0.84, "learning_rate": 3.482973653313912e-07, "loss": 0.8741, "step": 44261 }, { "epoch": 0.84, "learning_rate": 3.4821958961696516e-07, "loss": 1.2198, "step": 44262 }, { "epoch": 0.84, "learning_rate": 3.4814182193722097e-07, "loss": 0.981, "step": 44263 }, { "epoch": 0.84, "learning_rate": 3.4806406229244916e-07, "loss": 1.009, "step": 44264 }, { "epoch": 0.84, "learning_rate": 3.4798631068294037e-07, "loss": 0.791, "step": 44265 }, { "epoch": 0.84, "learning_rate": 3.4790856710898465e-07, "loss": 0.7683, "step": 44266 }, { "epoch": 0.84, "learning_rate": 3.478308315708731e-07, "loss": 0.7179, "step": 44267 }, { "epoch": 0.84, "learning_rate": 3.477531040688939e-07, "loss": 0.9476, "step": 44268 }, { "epoch": 0.84, "learning_rate": 3.476753846033398e-07, "loss": 0.9149, "step": 44269 }, { "epoch": 0.84, "learning_rate": 3.4759767317449926e-07, "loss": 0.8579, "step": 44270 }, { "epoch": 0.84, "learning_rate": 3.475199697826623e-07, "loss": 0.8928, "step": 44271 }, { "epoch": 0.84, "learning_rate": 3.4744227442812114e-07, "loss": 0.8676, "step": 44272 }, { "epoch": 0.84, "learning_rate": 3.473645871111639e-07, "loss": 0.8409, "step": 44273 }, { "epoch": 0.84, "learning_rate": 3.472869078320812e-07, "loss": 1.0892, "step": 44274 }, { "epoch": 0.84, "learning_rate": 3.4720923659116333e-07, "loss": 1.0433, "step": 44275 }, { "epoch": 0.84, "learning_rate": 3.4713157338869987e-07, "loss": 0.9439, "step": 44276 }, { "epoch": 0.84, "learning_rate": 3.470539182249813e-07, "loss": 0.777, "step": 44277 }, { "epoch": 0.84, "learning_rate": 3.4697627110029746e-07, "loss": 1.1088, "step": 44278 }, { "epoch": 0.84, "learning_rate": 3.4689863201493867e-07, "loss": 0.976, "step": 44279 }, { "epoch": 0.84, "learning_rate": 3.468210009691933e-07, "loss": 1.0797, "step": 44280 }, { "epoch": 0.84, "learning_rate": 3.467433779633536e-07, "loss": 1.05, "step": 44281 }, { "epoch": 0.84, "learning_rate": 3.4666576299770714e-07, "loss": 0.8666, "step": 44282 }, { "epoch": 0.84, "learning_rate": 3.465881560725451e-07, "loss": 0.7009, "step": 44283 }, { "epoch": 0.84, "learning_rate": 3.465105571881566e-07, "loss": 0.8913, "step": 44284 }, { "epoch": 0.84, "learning_rate": 3.464329663448318e-07, "loss": 0.6535, "step": 44285 }, { "epoch": 0.84, "learning_rate": 3.4635538354286015e-07, "loss": 0.9075, "step": 44286 }, { "epoch": 0.84, "learning_rate": 3.462778087825314e-07, "loss": 1.0112, "step": 44287 }, { "epoch": 0.84, "learning_rate": 3.462002420641361e-07, "loss": 1.0344, "step": 44288 }, { "epoch": 0.84, "learning_rate": 3.461226833879616e-07, "loss": 0.9034, "step": 44289 }, { "epoch": 0.84, "learning_rate": 3.4604513275430044e-07, "loss": 0.7798, "step": 44290 }, { "epoch": 0.84, "learning_rate": 3.459675901634399e-07, "loss": 0.8562, "step": 44291 }, { "epoch": 0.84, "learning_rate": 3.4589005561566994e-07, "loss": 0.9333, "step": 44292 }, { "epoch": 0.84, "learning_rate": 3.4581252911128156e-07, "loss": 1.0528, "step": 44293 }, { "epoch": 0.84, "learning_rate": 3.4573501065056247e-07, "loss": 0.9582, "step": 44294 }, { "epoch": 0.84, "learning_rate": 3.4565750023380277e-07, "loss": 0.7181, "step": 44295 }, { "epoch": 0.84, "learning_rate": 3.45579997861292e-07, "loss": 0.8411, "step": 44296 }, { "epoch": 0.84, "learning_rate": 3.4550250353331957e-07, "loss": 0.9709, "step": 44297 }, { "epoch": 0.84, "learning_rate": 3.454250172501747e-07, "loss": 0.7927, "step": 44298 }, { "epoch": 0.84, "learning_rate": 3.4534753901214664e-07, "loss": 1.0701, "step": 44299 }, { "epoch": 0.84, "learning_rate": 3.452700688195254e-07, "loss": 1.0829, "step": 44300 }, { "epoch": 0.84, "learning_rate": 3.451926066725986e-07, "loss": 0.9609, "step": 44301 }, { "epoch": 0.84, "learning_rate": 3.4511515257165756e-07, "loss": 0.923, "step": 44302 }, { "epoch": 0.84, "learning_rate": 3.450377065169899e-07, "loss": 0.9847, "step": 44303 }, { "epoch": 0.84, "learning_rate": 3.4496026850888544e-07, "loss": 0.8942, "step": 44304 }, { "epoch": 0.84, "learning_rate": 3.4488283854763324e-07, "loss": 0.967, "step": 44305 }, { "epoch": 0.84, "learning_rate": 3.448054166335224e-07, "loss": 1.0523, "step": 44306 }, { "epoch": 0.84, "learning_rate": 3.4472800276684206e-07, "loss": 0.9635, "step": 44307 }, { "epoch": 0.84, "learning_rate": 3.446505969478814e-07, "loss": 0.8741, "step": 44308 }, { "epoch": 0.84, "learning_rate": 3.445731991769299e-07, "loss": 0.6712, "step": 44309 }, { "epoch": 0.84, "learning_rate": 3.444958094542747e-07, "loss": 0.6765, "step": 44310 }, { "epoch": 0.84, "learning_rate": 3.4441842778020736e-07, "loss": 0.7758, "step": 44311 }, { "epoch": 0.84, "learning_rate": 3.4434105415501464e-07, "loss": 1.1219, "step": 44312 }, { "epoch": 0.84, "learning_rate": 3.44263688578986e-07, "loss": 1.0163, "step": 44313 }, { "epoch": 0.84, "learning_rate": 3.4418633105241185e-07, "loss": 0.8159, "step": 44314 }, { "epoch": 0.84, "learning_rate": 3.441089815755791e-07, "loss": 0.9857, "step": 44315 }, { "epoch": 0.84, "learning_rate": 3.4403164014877754e-07, "loss": 0.6538, "step": 44316 }, { "epoch": 0.84, "learning_rate": 3.439543067722956e-07, "loss": 0.8193, "step": 44317 }, { "epoch": 0.84, "learning_rate": 3.4387698144642214e-07, "loss": 1.0024, "step": 44318 }, { "epoch": 0.84, "learning_rate": 3.437996641714458e-07, "loss": 1.2111, "step": 44319 }, { "epoch": 0.84, "learning_rate": 3.4372235494765567e-07, "loss": 0.9869, "step": 44320 }, { "epoch": 0.84, "learning_rate": 3.4364505377534054e-07, "loss": 0.9271, "step": 44321 }, { "epoch": 0.84, "learning_rate": 3.435677606547877e-07, "loss": 0.8915, "step": 44322 }, { "epoch": 0.84, "learning_rate": 3.4349047558628777e-07, "loss": 0.9601, "step": 44323 }, { "epoch": 0.84, "learning_rate": 3.434131985701275e-07, "loss": 1.0131, "step": 44324 }, { "epoch": 0.84, "learning_rate": 3.433359296065966e-07, "loss": 0.8307, "step": 44325 }, { "epoch": 0.84, "learning_rate": 3.4325866869598294e-07, "loss": 0.851, "step": 44326 }, { "epoch": 0.84, "learning_rate": 3.4318141583857546e-07, "loss": 0.8873, "step": 44327 }, { "epoch": 0.84, "learning_rate": 3.431041710346622e-07, "loss": 0.9271, "step": 44328 }, { "epoch": 0.84, "learning_rate": 3.4302693428453215e-07, "loss": 0.7699, "step": 44329 }, { "epoch": 0.84, "learning_rate": 3.429497055884737e-07, "loss": 0.9189, "step": 44330 }, { "epoch": 0.84, "learning_rate": 3.428724849467738e-07, "loss": 1.2332, "step": 44331 }, { "epoch": 0.84, "learning_rate": 3.427952723597233e-07, "loss": 0.928, "step": 44332 }, { "epoch": 0.84, "learning_rate": 3.4271806782760817e-07, "loss": 0.7403, "step": 44333 }, { "epoch": 0.84, "learning_rate": 3.426408713507173e-07, "loss": 0.8478, "step": 44334 }, { "epoch": 0.84, "learning_rate": 3.425636829293405e-07, "loss": 0.8126, "step": 44335 }, { "epoch": 0.84, "learning_rate": 3.4248650256376386e-07, "loss": 0.9809, "step": 44336 }, { "epoch": 0.84, "learning_rate": 3.4240933025427666e-07, "loss": 0.97, "step": 44337 }, { "epoch": 0.84, "learning_rate": 3.4233216600116694e-07, "loss": 1.0201, "step": 44338 }, { "epoch": 0.84, "learning_rate": 3.422550098047228e-07, "loss": 0.9866, "step": 44339 }, { "epoch": 0.84, "learning_rate": 3.4217786166523213e-07, "loss": 0.8869, "step": 44340 }, { "epoch": 0.84, "learning_rate": 3.421007215829833e-07, "loss": 0.7006, "step": 44341 }, { "epoch": 0.84, "learning_rate": 3.4202358955826463e-07, "loss": 0.957, "step": 44342 }, { "epoch": 0.84, "learning_rate": 3.419464655913626e-07, "loss": 0.9737, "step": 44343 }, { "epoch": 0.84, "learning_rate": 3.418693496825676e-07, "loss": 1.1246, "step": 44344 }, { "epoch": 0.84, "learning_rate": 3.4179224183216537e-07, "loss": 0.9841, "step": 44345 }, { "epoch": 0.84, "learning_rate": 3.417151420404452e-07, "loss": 0.9395, "step": 44346 }, { "epoch": 0.84, "learning_rate": 3.416380503076941e-07, "loss": 0.9044, "step": 44347 }, { "epoch": 0.84, "learning_rate": 3.415609666342007e-07, "loss": 0.5584, "step": 44348 }, { "epoch": 0.84, "learning_rate": 3.4148389102025223e-07, "loss": 0.9603, "step": 44349 }, { "epoch": 0.84, "learning_rate": 3.4140682346613663e-07, "loss": 1.0452, "step": 44350 }, { "epoch": 0.84, "learning_rate": 3.4132976397214245e-07, "loss": 1.0577, "step": 44351 }, { "epoch": 0.84, "learning_rate": 3.412527125385556e-07, "loss": 0.8323, "step": 44352 }, { "epoch": 0.84, "learning_rate": 3.411756691656662e-07, "loss": 0.8414, "step": 44353 }, { "epoch": 0.84, "learning_rate": 3.4109863385376e-07, "loss": 0.9099, "step": 44354 }, { "epoch": 0.84, "learning_rate": 3.4102160660312496e-07, "loss": 0.862, "step": 44355 }, { "epoch": 0.84, "learning_rate": 3.409445874140499e-07, "loss": 0.7597, "step": 44356 }, { "epoch": 0.84, "learning_rate": 3.4086757628682103e-07, "loss": 0.7547, "step": 44357 }, { "epoch": 0.84, "learning_rate": 3.407905732217265e-07, "loss": 0.9229, "step": 44358 }, { "epoch": 0.84, "learning_rate": 3.407135782190538e-07, "loss": 0.9831, "step": 44359 }, { "epoch": 0.84, "learning_rate": 3.4063659127909014e-07, "loss": 0.9353, "step": 44360 }, { "epoch": 0.84, "learning_rate": 3.405596124021235e-07, "loss": 1.1054, "step": 44361 }, { "epoch": 0.84, "learning_rate": 3.4048264158844103e-07, "loss": 0.9445, "step": 44362 }, { "epoch": 0.84, "learning_rate": 3.404056788383306e-07, "loss": 0.9793, "step": 44363 }, { "epoch": 0.84, "learning_rate": 3.4032872415207805e-07, "loss": 1.0069, "step": 44364 }, { "epoch": 0.84, "learning_rate": 3.40251777529973e-07, "loss": 0.8673, "step": 44365 }, { "epoch": 0.84, "learning_rate": 3.4017483897230116e-07, "loss": 0.8379, "step": 44366 }, { "epoch": 0.84, "learning_rate": 3.4009790847935015e-07, "loss": 0.8382, "step": 44367 }, { "epoch": 0.84, "learning_rate": 3.4002098605140725e-07, "loss": 1.0377, "step": 44368 }, { "epoch": 0.84, "learning_rate": 3.3994407168875977e-07, "loss": 1.1302, "step": 44369 }, { "epoch": 0.84, "learning_rate": 3.398671653916949e-07, "loss": 0.9233, "step": 44370 }, { "epoch": 0.84, "learning_rate": 3.3979026716049995e-07, "loss": 0.9401, "step": 44371 }, { "epoch": 0.84, "learning_rate": 3.397133769954622e-07, "loss": 0.9191, "step": 44372 }, { "epoch": 0.84, "learning_rate": 3.396364948968675e-07, "loss": 0.8115, "step": 44373 }, { "epoch": 0.84, "learning_rate": 3.395596208650051e-07, "loss": 0.7324, "step": 44374 }, { "epoch": 0.84, "learning_rate": 3.3948275490016e-07, "loss": 0.8896, "step": 44375 }, { "epoch": 0.84, "learning_rate": 3.3940589700261986e-07, "loss": 0.8481, "step": 44376 }, { "epoch": 0.84, "learning_rate": 3.3932904717267264e-07, "loss": 0.9399, "step": 44377 }, { "epoch": 0.84, "learning_rate": 3.392522054106043e-07, "loss": 1.0803, "step": 44378 }, { "epoch": 0.84, "learning_rate": 3.391753717167018e-07, "loss": 0.907, "step": 44379 }, { "epoch": 0.84, "learning_rate": 3.3909854609125216e-07, "loss": 0.9531, "step": 44380 }, { "epoch": 0.84, "learning_rate": 3.3902172853454237e-07, "loss": 1.1619, "step": 44381 }, { "epoch": 0.84, "learning_rate": 3.389449190468591e-07, "loss": 0.913, "step": 44382 }, { "epoch": 0.84, "learning_rate": 3.3886811762848914e-07, "loss": 0.7324, "step": 44383 }, { "epoch": 0.84, "learning_rate": 3.3879132427972e-07, "loss": 0.9661, "step": 44384 }, { "epoch": 0.84, "learning_rate": 3.38714539000837e-07, "loss": 0.7994, "step": 44385 }, { "epoch": 0.84, "learning_rate": 3.3863776179212827e-07, "loss": 0.9636, "step": 44386 }, { "epoch": 0.84, "learning_rate": 3.3856099265387966e-07, "loss": 1.0345, "step": 44387 }, { "epoch": 0.84, "learning_rate": 3.384842315863779e-07, "loss": 1.0986, "step": 44388 }, { "epoch": 0.84, "learning_rate": 3.3840747858990967e-07, "loss": 0.9096, "step": 44389 }, { "epoch": 0.84, "learning_rate": 3.383307336647618e-07, "loss": 0.8391, "step": 44390 }, { "epoch": 0.84, "learning_rate": 3.3825399681122054e-07, "loss": 0.8068, "step": 44391 }, { "epoch": 0.84, "learning_rate": 3.381772680295728e-07, "loss": 0.8396, "step": 44392 }, { "epoch": 0.84, "learning_rate": 3.3810054732010515e-07, "loss": 0.8666, "step": 44393 }, { "epoch": 0.84, "learning_rate": 3.38023834683103e-07, "loss": 0.9921, "step": 44394 }, { "epoch": 0.84, "learning_rate": 3.3794713011885444e-07, "loss": 0.9253, "step": 44395 }, { "epoch": 0.84, "learning_rate": 3.378704336276445e-07, "loss": 0.9821, "step": 44396 }, { "epoch": 0.84, "learning_rate": 3.3779374520975933e-07, "loss": 0.9756, "step": 44397 }, { "epoch": 0.84, "learning_rate": 3.3771706486548733e-07, "loss": 0.9961, "step": 44398 }, { "epoch": 0.84, "learning_rate": 3.37640392595113e-07, "loss": 0.9379, "step": 44399 }, { "epoch": 0.84, "learning_rate": 3.37563728398923e-07, "loss": 0.77, "step": 44400 }, { "epoch": 0.84, "learning_rate": 3.374870722772036e-07, "loss": 0.869, "step": 44401 }, { "epoch": 0.84, "learning_rate": 3.3741042423024145e-07, "loss": 0.8455, "step": 44402 }, { "epoch": 0.84, "learning_rate": 3.373337842583224e-07, "loss": 0.8363, "step": 44403 }, { "epoch": 0.84, "learning_rate": 3.3725715236173266e-07, "loss": 0.7927, "step": 44404 }, { "epoch": 0.84, "learning_rate": 3.371805285407589e-07, "loss": 1.0779, "step": 44405 }, { "epoch": 0.84, "learning_rate": 3.3710391279568573e-07, "loss": 0.8645, "step": 44406 }, { "epoch": 0.84, "learning_rate": 3.370273051268014e-07, "loss": 0.9237, "step": 44407 }, { "epoch": 0.84, "learning_rate": 3.3695070553439015e-07, "loss": 0.8357, "step": 44408 }, { "epoch": 0.84, "learning_rate": 3.368741140187387e-07, "loss": 0.7279, "step": 44409 }, { "epoch": 0.84, "learning_rate": 3.3679753058013296e-07, "loss": 0.6643, "step": 44410 }, { "epoch": 0.84, "learning_rate": 3.3672095521885884e-07, "loss": 1.0748, "step": 44411 }, { "epoch": 0.84, "learning_rate": 3.366443879352024e-07, "loss": 1.1356, "step": 44412 }, { "epoch": 0.84, "learning_rate": 3.365678287294494e-07, "loss": 0.9814, "step": 44413 }, { "epoch": 0.84, "learning_rate": 3.3649127760188636e-07, "loss": 0.9837, "step": 44414 }, { "epoch": 0.84, "learning_rate": 3.364147345527977e-07, "loss": 1.012, "step": 44415 }, { "epoch": 0.84, "learning_rate": 3.3633819958247077e-07, "loss": 0.8893, "step": 44416 }, { "epoch": 0.84, "learning_rate": 3.362616726911905e-07, "loss": 0.7079, "step": 44417 }, { "epoch": 0.84, "learning_rate": 3.361851538792421e-07, "loss": 1.0827, "step": 44418 }, { "epoch": 0.84, "learning_rate": 3.3610864314691295e-07, "loss": 0.9083, "step": 44419 }, { "epoch": 0.84, "learning_rate": 3.3603214049448746e-07, "loss": 0.8617, "step": 44420 }, { "epoch": 0.84, "learning_rate": 3.3595564592225157e-07, "loss": 0.6809, "step": 44421 }, { "epoch": 0.84, "learning_rate": 3.358791594304908e-07, "loss": 0.9146, "step": 44422 }, { "epoch": 0.84, "learning_rate": 3.358026810194909e-07, "loss": 0.8397, "step": 44423 }, { "epoch": 0.84, "learning_rate": 3.3572621068953757e-07, "loss": 0.8226, "step": 44424 }, { "epoch": 0.84, "learning_rate": 3.356497484409163e-07, "loss": 1.0773, "step": 44425 }, { "epoch": 0.84, "learning_rate": 3.355732942739129e-07, "loss": 0.8333, "step": 44426 }, { "epoch": 0.84, "learning_rate": 3.354968481888113e-07, "loss": 0.9015, "step": 44427 }, { "epoch": 0.84, "learning_rate": 3.354204101858993e-07, "loss": 0.756, "step": 44428 }, { "epoch": 0.84, "learning_rate": 3.353439802654604e-07, "loss": 0.7049, "step": 44429 }, { "epoch": 0.84, "learning_rate": 3.352675584277809e-07, "loss": 0.9866, "step": 44430 }, { "epoch": 0.84, "learning_rate": 3.3519114467314597e-07, "loss": 1.1692, "step": 44431 }, { "epoch": 0.84, "learning_rate": 3.3511473900184084e-07, "loss": 0.8856, "step": 44432 }, { "epoch": 0.84, "learning_rate": 3.3503834141415086e-07, "loss": 0.8325, "step": 44433 }, { "epoch": 0.84, "learning_rate": 3.349619519103617e-07, "loss": 0.8318, "step": 44434 }, { "epoch": 0.84, "learning_rate": 3.348855704907583e-07, "loss": 0.8495, "step": 44435 }, { "epoch": 0.84, "learning_rate": 3.34809197155625e-07, "loss": 1.0628, "step": 44436 }, { "epoch": 0.84, "learning_rate": 3.347328319052481e-07, "loss": 1.107, "step": 44437 }, { "epoch": 0.84, "learning_rate": 3.3465647473991306e-07, "loss": 1.0187, "step": 44438 }, { "epoch": 0.84, "learning_rate": 3.345801256599032e-07, "loss": 0.8764, "step": 44439 }, { "epoch": 0.84, "learning_rate": 3.345037846655061e-07, "loss": 0.8913, "step": 44440 }, { "epoch": 0.84, "learning_rate": 3.344274517570048e-07, "loss": 1.0788, "step": 44441 }, { "epoch": 0.84, "learning_rate": 3.3435112693468496e-07, "loss": 0.8874, "step": 44442 }, { "epoch": 0.84, "learning_rate": 3.3427481019883163e-07, "loss": 1.118, "step": 44443 }, { "epoch": 0.84, "learning_rate": 3.3419850154972955e-07, "loss": 1.0021, "step": 44444 }, { "epoch": 0.84, "learning_rate": 3.3412220098766404e-07, "loss": 0.8281, "step": 44445 }, { "epoch": 0.84, "learning_rate": 3.3404590851291994e-07, "loss": 0.8881, "step": 44446 }, { "epoch": 0.84, "learning_rate": 3.3396962412578225e-07, "loss": 0.6074, "step": 44447 }, { "epoch": 0.84, "learning_rate": 3.3389334782653464e-07, "loss": 0.8481, "step": 44448 }, { "epoch": 0.84, "learning_rate": 3.338170796154641e-07, "loss": 0.994, "step": 44449 }, { "epoch": 0.84, "learning_rate": 3.3374081949285345e-07, "loss": 0.7421, "step": 44450 }, { "epoch": 0.84, "learning_rate": 3.3366456745898834e-07, "loss": 1.0767, "step": 44451 }, { "epoch": 0.84, "learning_rate": 3.335883235141532e-07, "loss": 0.8397, "step": 44452 }, { "epoch": 0.84, "learning_rate": 3.3351208765863284e-07, "loss": 0.7801, "step": 44453 }, { "epoch": 0.84, "learning_rate": 3.3343585989271175e-07, "loss": 0.7634, "step": 44454 }, { "epoch": 0.84, "learning_rate": 3.33359640216675e-07, "loss": 0.7234, "step": 44455 }, { "epoch": 0.84, "learning_rate": 3.332834286308073e-07, "loss": 1.1444, "step": 44456 }, { "epoch": 0.84, "learning_rate": 3.332072251353918e-07, "loss": 0.9833, "step": 44457 }, { "epoch": 0.84, "learning_rate": 3.331310297307147e-07, "loss": 0.8782, "step": 44458 }, { "epoch": 0.84, "learning_rate": 3.3305484241706015e-07, "loss": 0.6765, "step": 44459 }, { "epoch": 0.84, "learning_rate": 3.3297866319471157e-07, "loss": 0.9025, "step": 44460 }, { "epoch": 0.84, "learning_rate": 3.3290249206395534e-07, "loss": 0.8511, "step": 44461 }, { "epoch": 0.84, "learning_rate": 3.328263290250741e-07, "loss": 0.9413, "step": 44462 }, { "epoch": 0.84, "learning_rate": 3.327501740783529e-07, "loss": 1.014, "step": 44463 }, { "epoch": 0.84, "learning_rate": 3.326740272240761e-07, "loss": 1.0457, "step": 44464 }, { "epoch": 0.84, "learning_rate": 3.325978884625281e-07, "loss": 0.8676, "step": 44465 }, { "epoch": 0.84, "learning_rate": 3.325217577939932e-07, "loss": 0.8999, "step": 44466 }, { "epoch": 0.84, "learning_rate": 3.3244563521875524e-07, "loss": 0.9219, "step": 44467 }, { "epoch": 0.84, "learning_rate": 3.3236952073709973e-07, "loss": 0.995, "step": 44468 }, { "epoch": 0.84, "learning_rate": 3.322934143493087e-07, "loss": 1.004, "step": 44469 }, { "epoch": 0.84, "learning_rate": 3.322173160556688e-07, "loss": 0.6808, "step": 44470 }, { "epoch": 0.84, "learning_rate": 3.321412258564624e-07, "loss": 0.8755, "step": 44471 }, { "epoch": 0.84, "learning_rate": 3.3206514375197424e-07, "loss": 0.8543, "step": 44472 }, { "epoch": 0.84, "learning_rate": 3.3198906974248823e-07, "loss": 0.7971, "step": 44473 }, { "epoch": 0.84, "learning_rate": 3.3191300382828864e-07, "loss": 0.9772, "step": 44474 }, { "epoch": 0.84, "learning_rate": 3.3183694600965985e-07, "loss": 0.9662, "step": 44475 }, { "epoch": 0.84, "learning_rate": 3.317608962868846e-07, "loss": 0.9602, "step": 44476 }, { "epoch": 0.84, "learning_rate": 3.3168485466024857e-07, "loss": 0.8903, "step": 44477 }, { "epoch": 0.84, "learning_rate": 3.3160882113003417e-07, "loss": 0.9826, "step": 44478 }, { "epoch": 0.84, "learning_rate": 3.315327956965256e-07, "loss": 0.803, "step": 44479 }, { "epoch": 0.84, "learning_rate": 3.314567783600081e-07, "loss": 0.8785, "step": 44480 }, { "epoch": 0.84, "learning_rate": 3.3138076912076406e-07, "loss": 1.0452, "step": 44481 }, { "epoch": 0.84, "learning_rate": 3.3130476797907764e-07, "loss": 0.7789, "step": 44482 }, { "epoch": 0.84, "learning_rate": 3.312287749352328e-07, "loss": 0.7059, "step": 44483 }, { "epoch": 0.84, "learning_rate": 3.311527899895131e-07, "loss": 0.7697, "step": 44484 }, { "epoch": 0.84, "learning_rate": 3.310768131422024e-07, "loss": 0.7903, "step": 44485 }, { "epoch": 0.84, "learning_rate": 3.310008443935844e-07, "loss": 1.0102, "step": 44486 }, { "epoch": 0.84, "learning_rate": 3.3092488374394325e-07, "loss": 1.0247, "step": 44487 }, { "epoch": 0.84, "learning_rate": 3.308489311935612e-07, "loss": 0.9437, "step": 44488 }, { "epoch": 0.84, "learning_rate": 3.307729867427234e-07, "loss": 0.7938, "step": 44489 }, { "epoch": 0.84, "learning_rate": 3.3069705039171257e-07, "loss": 0.9728, "step": 44490 }, { "epoch": 0.84, "learning_rate": 3.306211221408123e-07, "loss": 0.7007, "step": 44491 }, { "epoch": 0.84, "learning_rate": 3.305452019903063e-07, "loss": 1.0304, "step": 44492 }, { "epoch": 0.84, "learning_rate": 3.304692899404779e-07, "loss": 0.9866, "step": 44493 }, { "epoch": 0.84, "learning_rate": 3.3039338599161086e-07, "loss": 0.89, "step": 44494 }, { "epoch": 0.84, "learning_rate": 3.3031749014398846e-07, "loss": 0.936, "step": 44495 }, { "epoch": 0.84, "learning_rate": 3.302416023978944e-07, "loss": 0.919, "step": 44496 }, { "epoch": 0.84, "learning_rate": 3.3016572275361034e-07, "loss": 0.8916, "step": 44497 }, { "epoch": 0.84, "learning_rate": 3.300898512114223e-07, "loss": 0.694, "step": 44498 }, { "epoch": 0.84, "learning_rate": 3.300139877716116e-07, "loss": 1.0519, "step": 44499 }, { "epoch": 0.84, "learning_rate": 3.299381324344617e-07, "loss": 0.944, "step": 44500 }, { "epoch": 0.84, "learning_rate": 3.2986228520025727e-07, "loss": 0.9996, "step": 44501 }, { "epoch": 0.84, "learning_rate": 3.297864460692801e-07, "loss": 0.8109, "step": 44502 }, { "epoch": 0.84, "learning_rate": 3.2971061504181364e-07, "loss": 0.712, "step": 44503 }, { "epoch": 0.84, "learning_rate": 3.2963479211814144e-07, "loss": 0.8258, "step": 44504 }, { "epoch": 0.84, "learning_rate": 3.2955897729854607e-07, "loss": 0.7209, "step": 44505 }, { "epoch": 0.84, "learning_rate": 3.2948317058331095e-07, "loss": 1.0871, "step": 44506 }, { "epoch": 0.84, "learning_rate": 3.294073719727195e-07, "loss": 0.8745, "step": 44507 }, { "epoch": 0.84, "learning_rate": 3.2933158146705446e-07, "loss": 0.8775, "step": 44508 }, { "epoch": 0.84, "learning_rate": 3.292557990665979e-07, "loss": 0.8649, "step": 44509 }, { "epoch": 0.84, "learning_rate": 3.291800247716348e-07, "loss": 0.7136, "step": 44510 }, { "epoch": 0.84, "learning_rate": 3.291042585824461e-07, "loss": 0.9427, "step": 44511 }, { "epoch": 0.84, "learning_rate": 3.2902850049931575e-07, "loss": 1.0204, "step": 44512 }, { "epoch": 0.84, "learning_rate": 3.289527505225265e-07, "loss": 0.9677, "step": 44513 }, { "epoch": 0.84, "learning_rate": 3.2887700865236097e-07, "loss": 0.9677, "step": 44514 }, { "epoch": 0.84, "learning_rate": 3.28801274889102e-07, "loss": 0.8541, "step": 44515 }, { "epoch": 0.84, "learning_rate": 3.287255492330327e-07, "loss": 0.8134, "step": 44516 }, { "epoch": 0.84, "learning_rate": 3.2864983168443607e-07, "loss": 0.8732, "step": 44517 }, { "epoch": 0.84, "learning_rate": 3.285741222435934e-07, "loss": 1.1385, "step": 44518 }, { "epoch": 0.84, "learning_rate": 3.2849842091078943e-07, "loss": 1.1439, "step": 44519 }, { "epoch": 0.84, "learning_rate": 3.28422727686305e-07, "loss": 1.0647, "step": 44520 }, { "epoch": 0.84, "learning_rate": 3.283470425704233e-07, "loss": 0.6411, "step": 44521 }, { "epoch": 0.84, "learning_rate": 3.2827136556342815e-07, "loss": 0.927, "step": 44522 }, { "epoch": 0.84, "learning_rate": 3.2819569666560055e-07, "loss": 0.6526, "step": 44523 }, { "epoch": 0.84, "learning_rate": 3.281200358772238e-07, "loss": 0.8947, "step": 44524 }, { "epoch": 0.84, "learning_rate": 3.2804438319858e-07, "loss": 1.0148, "step": 44525 }, { "epoch": 0.84, "learning_rate": 3.279687386299518e-07, "loss": 1.1489, "step": 44526 }, { "epoch": 0.84, "learning_rate": 3.2789310217162193e-07, "loss": 0.7299, "step": 44527 }, { "epoch": 0.84, "learning_rate": 3.2781747382387266e-07, "loss": 0.8979, "step": 44528 }, { "epoch": 0.84, "learning_rate": 3.2774185358698694e-07, "loss": 0.9691, "step": 44529 }, { "epoch": 0.84, "learning_rate": 3.2766624146124527e-07, "loss": 1.0089, "step": 44530 }, { "epoch": 0.84, "learning_rate": 3.275906374469323e-07, "loss": 0.9837, "step": 44531 }, { "epoch": 0.84, "learning_rate": 3.27515041544329e-07, "loss": 0.9167, "step": 44532 }, { "epoch": 0.84, "learning_rate": 3.274394537537176e-07, "loss": 0.8957, "step": 44533 }, { "epoch": 0.84, "learning_rate": 3.2736387407538097e-07, "loss": 0.8592, "step": 44534 }, { "epoch": 0.84, "learning_rate": 3.2728830250960075e-07, "loss": 0.8388, "step": 44535 }, { "epoch": 0.84, "learning_rate": 3.272127390566596e-07, "loss": 0.9887, "step": 44536 }, { "epoch": 0.84, "learning_rate": 3.271371837168394e-07, "loss": 1.0757, "step": 44537 }, { "epoch": 0.84, "learning_rate": 3.270616364904228e-07, "loss": 0.7503, "step": 44538 }, { "epoch": 0.84, "learning_rate": 3.269860973776906e-07, "loss": 1.0137, "step": 44539 }, { "epoch": 0.84, "learning_rate": 3.2691056637892654e-07, "loss": 0.8631, "step": 44540 }, { "epoch": 0.84, "learning_rate": 3.2683504349441117e-07, "loss": 0.8629, "step": 44541 }, { "epoch": 0.84, "learning_rate": 3.2675952872442686e-07, "loss": 0.6023, "step": 44542 }, { "epoch": 0.84, "learning_rate": 3.266840220692566e-07, "loss": 1.0818, "step": 44543 }, { "epoch": 0.84, "learning_rate": 3.266085235291813e-07, "loss": 1.153, "step": 44544 }, { "epoch": 0.84, "learning_rate": 3.2653303310448304e-07, "loss": 0.7821, "step": 44545 }, { "epoch": 0.84, "learning_rate": 3.264575507954437e-07, "loss": 0.8764, "step": 44546 }, { "epoch": 0.84, "learning_rate": 3.263820766023451e-07, "loss": 0.834, "step": 44547 }, { "epoch": 0.84, "learning_rate": 3.263066105254695e-07, "loss": 0.6901, "step": 44548 }, { "epoch": 0.84, "learning_rate": 3.262311525650982e-07, "loss": 0.7155, "step": 44549 }, { "epoch": 0.84, "learning_rate": 3.261557027215137e-07, "loss": 1.095, "step": 44550 }, { "epoch": 0.84, "learning_rate": 3.2608026099499617e-07, "loss": 0.7484, "step": 44551 }, { "epoch": 0.84, "learning_rate": 3.2600482738582935e-07, "loss": 0.7219, "step": 44552 }, { "epoch": 0.84, "learning_rate": 3.259294018942932e-07, "loss": 0.8896, "step": 44553 }, { "epoch": 0.84, "learning_rate": 3.258539845206701e-07, "loss": 0.9764, "step": 44554 }, { "epoch": 0.84, "learning_rate": 3.257785752652415e-07, "loss": 0.685, "step": 44555 }, { "epoch": 0.84, "learning_rate": 3.25703174128289e-07, "loss": 0.8855, "step": 44556 }, { "epoch": 0.84, "learning_rate": 3.2562778111009415e-07, "loss": 0.959, "step": 44557 }, { "epoch": 0.84, "learning_rate": 3.255523962109386e-07, "loss": 0.7927, "step": 44558 }, { "epoch": 0.84, "learning_rate": 3.2547701943110437e-07, "loss": 0.8748, "step": 44559 }, { "epoch": 0.84, "learning_rate": 3.2540165077087097e-07, "loss": 0.7088, "step": 44560 }, { "epoch": 0.84, "learning_rate": 3.2532629023052235e-07, "loss": 0.7389, "step": 44561 }, { "epoch": 0.84, "learning_rate": 3.25250937810338e-07, "loss": 1.162, "step": 44562 }, { "epoch": 0.84, "learning_rate": 3.251755935105996e-07, "loss": 0.9321, "step": 44563 }, { "epoch": 0.84, "learning_rate": 3.251002573315898e-07, "loss": 0.8481, "step": 44564 }, { "epoch": 0.84, "learning_rate": 3.2502492927358854e-07, "loss": 0.9841, "step": 44565 }, { "epoch": 0.84, "learning_rate": 3.2494960933687757e-07, "loss": 0.8631, "step": 44566 }, { "epoch": 0.84, "learning_rate": 3.248742975217378e-07, "loss": 0.8998, "step": 44567 }, { "epoch": 0.84, "learning_rate": 3.24798993828451e-07, "loss": 1.1497, "step": 44568 }, { "epoch": 0.84, "learning_rate": 3.2472369825729794e-07, "loss": 0.84, "step": 44569 }, { "epoch": 0.84, "learning_rate": 3.2464841080855985e-07, "loss": 0.9109, "step": 44570 }, { "epoch": 0.84, "learning_rate": 3.2457313148251844e-07, "loss": 0.9591, "step": 44571 }, { "epoch": 0.84, "learning_rate": 3.2449786027945326e-07, "loss": 0.7932, "step": 44572 }, { "epoch": 0.84, "learning_rate": 3.244225971996473e-07, "loss": 0.7861, "step": 44573 }, { "epoch": 0.84, "learning_rate": 3.243473422433804e-07, "loss": 1.0379, "step": 44574 }, { "epoch": 0.84, "learning_rate": 3.2427209541093354e-07, "loss": 1.1476, "step": 44575 }, { "epoch": 0.84, "learning_rate": 3.24196856702588e-07, "loss": 0.8699, "step": 44576 }, { "epoch": 0.84, "learning_rate": 3.2412162611862473e-07, "loss": 0.9586, "step": 44577 }, { "epoch": 0.84, "learning_rate": 3.2404640365932464e-07, "loss": 0.9632, "step": 44578 }, { "epoch": 0.84, "learning_rate": 3.239711893249686e-07, "loss": 0.8832, "step": 44579 }, { "epoch": 0.84, "learning_rate": 3.238959831158378e-07, "loss": 0.9605, "step": 44580 }, { "epoch": 0.84, "learning_rate": 3.238207850322117e-07, "loss": 0.9955, "step": 44581 }, { "epoch": 0.84, "learning_rate": 3.237455950743731e-07, "loss": 0.9408, "step": 44582 }, { "epoch": 0.84, "learning_rate": 3.2367041324260136e-07, "loss": 0.8115, "step": 44583 }, { "epoch": 0.84, "learning_rate": 3.235952395371769e-07, "loss": 0.8157, "step": 44584 }, { "epoch": 0.84, "learning_rate": 3.235200739583821e-07, "loss": 0.9091, "step": 44585 }, { "epoch": 0.84, "learning_rate": 3.2344491650649625e-07, "loss": 0.9223, "step": 44586 }, { "epoch": 0.84, "learning_rate": 3.233697671818001e-07, "loss": 1.16, "step": 44587 }, { "epoch": 0.84, "learning_rate": 3.2329462598457455e-07, "loss": 1.0142, "step": 44588 }, { "epoch": 0.84, "learning_rate": 3.232194929151003e-07, "loss": 0.986, "step": 44589 }, { "epoch": 0.84, "learning_rate": 3.2314436797365763e-07, "loss": 0.8855, "step": 44590 }, { "epoch": 0.84, "learning_rate": 3.230692511605271e-07, "loss": 0.7233, "step": 44591 }, { "epoch": 0.84, "learning_rate": 3.2299414247599e-07, "loss": 0.9884, "step": 44592 }, { "epoch": 0.84, "learning_rate": 3.229190419203246e-07, "loss": 0.9933, "step": 44593 }, { "epoch": 0.84, "learning_rate": 3.2284394949381404e-07, "loss": 0.9722, "step": 44594 }, { "epoch": 0.84, "learning_rate": 3.227688651967367e-07, "loss": 0.7909, "step": 44595 }, { "epoch": 0.84, "learning_rate": 3.226937890293738e-07, "loss": 0.7274, "step": 44596 }, { "epoch": 0.84, "learning_rate": 3.2261872099200563e-07, "loss": 0.9394, "step": 44597 }, { "epoch": 0.84, "learning_rate": 3.2254366108491227e-07, "loss": 0.8223, "step": 44598 }, { "epoch": 0.84, "learning_rate": 3.2246860930837424e-07, "loss": 1.0143, "step": 44599 }, { "epoch": 0.84, "learning_rate": 3.2239356566267144e-07, "loss": 1.4523, "step": 44600 }, { "epoch": 0.84, "learning_rate": 3.22318530148085e-07, "loss": 0.8539, "step": 44601 }, { "epoch": 0.84, "learning_rate": 3.222435027648932e-07, "loss": 0.7431, "step": 44602 }, { "epoch": 0.84, "learning_rate": 3.221684835133787e-07, "loss": 0.8611, "step": 44603 }, { "epoch": 0.84, "learning_rate": 3.220934723938196e-07, "loss": 0.9101, "step": 44604 }, { "epoch": 0.84, "learning_rate": 3.220184694064962e-07, "loss": 0.8823, "step": 44605 }, { "epoch": 0.84, "learning_rate": 3.2194347455169e-07, "loss": 0.941, "step": 44606 }, { "epoch": 0.84, "learning_rate": 3.218684878296796e-07, "loss": 0.9145, "step": 44607 }, { "epoch": 0.84, "learning_rate": 3.2179350924074566e-07, "loss": 0.7137, "step": 44608 }, { "epoch": 0.84, "learning_rate": 3.217185387851679e-07, "loss": 0.8596, "step": 44609 }, { "epoch": 0.84, "learning_rate": 3.2164357646322613e-07, "loss": 0.6426, "step": 44610 }, { "epoch": 0.84, "learning_rate": 3.215686222752007e-07, "loss": 0.8589, "step": 44611 }, { "epoch": 0.84, "learning_rate": 3.2149367622137105e-07, "loss": 1.1022, "step": 44612 }, { "epoch": 0.84, "learning_rate": 3.2141873830201786e-07, "loss": 0.7851, "step": 44613 }, { "epoch": 0.84, "learning_rate": 3.213438085174192e-07, "loss": 0.9974, "step": 44614 }, { "epoch": 0.84, "learning_rate": 3.2126888686785704e-07, "loss": 0.9364, "step": 44615 }, { "epoch": 0.84, "learning_rate": 3.2119397335360957e-07, "loss": 0.7777, "step": 44616 }, { "epoch": 0.84, "learning_rate": 3.2111906797495706e-07, "loss": 0.9891, "step": 44617 }, { "epoch": 0.84, "learning_rate": 3.2104417073217905e-07, "loss": 0.9901, "step": 44618 }, { "epoch": 0.84, "learning_rate": 3.2096928162555525e-07, "loss": 1.0533, "step": 44619 }, { "epoch": 0.84, "learning_rate": 3.2089440065536547e-07, "loss": 0.8387, "step": 44620 }, { "epoch": 0.84, "learning_rate": 3.2081952782188895e-07, "loss": 0.6642, "step": 44621 }, { "epoch": 0.84, "learning_rate": 3.207446631254063e-07, "loss": 0.9826, "step": 44622 }, { "epoch": 0.84, "learning_rate": 3.2066980656619505e-07, "loss": 0.8462, "step": 44623 }, { "epoch": 0.84, "learning_rate": 3.2059495814453693e-07, "loss": 1.0626, "step": 44624 }, { "epoch": 0.84, "learning_rate": 3.2052011786071006e-07, "loss": 1.0908, "step": 44625 }, { "epoch": 0.84, "learning_rate": 3.204452857149937e-07, "loss": 0.9684, "step": 44626 }, { "epoch": 0.84, "learning_rate": 3.203704617076686e-07, "loss": 0.7959, "step": 44627 }, { "epoch": 0.84, "learning_rate": 3.202956458390133e-07, "loss": 0.8224, "step": 44628 }, { "epoch": 0.84, "learning_rate": 3.202208381093069e-07, "loss": 0.858, "step": 44629 }, { "epoch": 0.84, "learning_rate": 3.20146038518829e-07, "loss": 0.9579, "step": 44630 }, { "epoch": 0.84, "learning_rate": 3.200712470678591e-07, "loss": 1.1198, "step": 44631 }, { "epoch": 0.84, "learning_rate": 3.1999646375667633e-07, "loss": 1.0487, "step": 44632 }, { "epoch": 0.84, "learning_rate": 3.199216885855599e-07, "loss": 0.7074, "step": 44633 }, { "epoch": 0.84, "learning_rate": 3.198469215547895e-07, "loss": 0.7645, "step": 44634 }, { "epoch": 0.84, "learning_rate": 3.19772162664643e-07, "loss": 0.7474, "step": 44635 }, { "epoch": 0.84, "learning_rate": 3.196974119154012e-07, "loss": 0.9857, "step": 44636 }, { "epoch": 0.84, "learning_rate": 3.1962266930734203e-07, "loss": 1.1402, "step": 44637 }, { "epoch": 0.84, "learning_rate": 3.195479348407449e-07, "loss": 0.9056, "step": 44638 }, { "epoch": 0.84, "learning_rate": 3.1947320851588915e-07, "loss": 0.808, "step": 44639 }, { "epoch": 0.84, "learning_rate": 3.1939849033305324e-07, "loss": 0.792, "step": 44640 }, { "epoch": 0.84, "learning_rate": 3.193237802925167e-07, "loss": 0.6412, "step": 44641 }, { "epoch": 0.84, "learning_rate": 3.1924907839455816e-07, "loss": 0.7597, "step": 44642 }, { "epoch": 0.84, "learning_rate": 3.191743846394574e-07, "loss": 1.0619, "step": 44643 }, { "epoch": 0.84, "learning_rate": 3.190996990274917e-07, "loss": 1.0331, "step": 44644 }, { "epoch": 0.84, "learning_rate": 3.190250215589416e-07, "loss": 0.8976, "step": 44645 }, { "epoch": 0.84, "learning_rate": 3.189503522340848e-07, "loss": 0.9591, "step": 44646 }, { "epoch": 0.84, "learning_rate": 3.188756910531998e-07, "loss": 0.8207, "step": 44647 }, { "epoch": 0.84, "learning_rate": 3.1880103801656736e-07, "loss": 0.7064, "step": 44648 }, { "epoch": 0.84, "learning_rate": 3.187263931244644e-07, "loss": 0.9747, "step": 44649 }, { "epoch": 0.84, "learning_rate": 3.1865175637717014e-07, "loss": 1.1375, "step": 44650 }, { "epoch": 0.84, "learning_rate": 3.1857712777496356e-07, "loss": 0.6626, "step": 44651 }, { "epoch": 0.84, "learning_rate": 3.1850250731812306e-07, "loss": 0.677, "step": 44652 }, { "epoch": 0.84, "learning_rate": 3.1842789500692694e-07, "loss": 0.8556, "step": 44653 }, { "epoch": 0.84, "learning_rate": 3.183532908416545e-07, "loss": 0.7928, "step": 44654 }, { "epoch": 0.84, "learning_rate": 3.182786948225844e-07, "loss": 0.9007, "step": 44655 }, { "epoch": 0.84, "learning_rate": 3.182041069499939e-07, "loss": 1.2799, "step": 44656 }, { "epoch": 0.84, "learning_rate": 3.181295272241633e-07, "loss": 1.0588, "step": 44657 }, { "epoch": 0.84, "learning_rate": 3.180549556453694e-07, "loss": 0.7244, "step": 44658 }, { "epoch": 0.84, "learning_rate": 3.179803922138916e-07, "loss": 0.8185, "step": 44659 }, { "epoch": 0.84, "learning_rate": 3.179058369300081e-07, "loss": 0.7598, "step": 44660 }, { "epoch": 0.84, "learning_rate": 3.1783128979399725e-07, "loss": 0.9199, "step": 44661 }, { "epoch": 0.84, "learning_rate": 3.177567508061377e-07, "loss": 1.0953, "step": 44662 }, { "epoch": 0.84, "learning_rate": 3.1768221996670735e-07, "loss": 0.9964, "step": 44663 }, { "epoch": 0.84, "learning_rate": 3.1760769727598505e-07, "loss": 0.9863, "step": 44664 }, { "epoch": 0.84, "learning_rate": 3.175331827342479e-07, "loss": 0.7329, "step": 44665 }, { "epoch": 0.84, "learning_rate": 3.1745867634177584e-07, "loss": 0.7202, "step": 44666 }, { "epoch": 0.84, "learning_rate": 3.173841780988457e-07, "loss": 0.884, "step": 44667 }, { "epoch": 0.84, "learning_rate": 3.1730968800573553e-07, "loss": 0.7505, "step": 44668 }, { "epoch": 0.84, "learning_rate": 3.1723520606272515e-07, "loss": 0.9207, "step": 44669 }, { "epoch": 0.84, "learning_rate": 3.1716073227009093e-07, "loss": 0.8421, "step": 44670 }, { "epoch": 0.84, "learning_rate": 3.170862666281119e-07, "loss": 0.8514, "step": 44671 }, { "epoch": 0.84, "learning_rate": 3.1701180913706555e-07, "loss": 0.8621, "step": 44672 }, { "epoch": 0.84, "learning_rate": 3.169373597972303e-07, "loss": 0.6561, "step": 44673 }, { "epoch": 0.84, "learning_rate": 3.1686291860888396e-07, "loss": 0.9507, "step": 44674 }, { "epoch": 0.84, "learning_rate": 3.1678848557230467e-07, "loss": 1.0127, "step": 44675 }, { "epoch": 0.84, "learning_rate": 3.167140606877706e-07, "loss": 0.8314, "step": 44676 }, { "epoch": 0.84, "learning_rate": 3.166396439555583e-07, "loss": 0.9282, "step": 44677 }, { "epoch": 0.84, "learning_rate": 3.165652353759477e-07, "loss": 0.8864, "step": 44678 }, { "epoch": 0.84, "learning_rate": 3.164908349492149e-07, "loss": 1.0683, "step": 44679 }, { "epoch": 0.84, "learning_rate": 3.1641644267563856e-07, "loss": 1.0057, "step": 44680 }, { "epoch": 0.84, "learning_rate": 3.163420585554963e-07, "loss": 1.2001, "step": 44681 }, { "epoch": 0.84, "learning_rate": 3.1626768258906564e-07, "loss": 0.9785, "step": 44682 }, { "epoch": 0.84, "learning_rate": 3.161933147766247e-07, "loss": 0.8382, "step": 44683 }, { "epoch": 0.84, "learning_rate": 3.161189551184507e-07, "loss": 0.8852, "step": 44684 }, { "epoch": 0.84, "learning_rate": 3.1604460361482234e-07, "loss": 0.8538, "step": 44685 }, { "epoch": 0.84, "learning_rate": 3.159702602660153e-07, "loss": 0.9043, "step": 44686 }, { "epoch": 0.84, "learning_rate": 3.158959250723095e-07, "loss": 1.173, "step": 44687 }, { "epoch": 0.84, "learning_rate": 3.158215980339807e-07, "loss": 0.6877, "step": 44688 }, { "epoch": 0.84, "learning_rate": 3.1574727915130664e-07, "loss": 0.9703, "step": 44689 }, { "epoch": 0.84, "learning_rate": 3.156729684245663e-07, "loss": 0.836, "step": 44690 }, { "epoch": 0.84, "learning_rate": 3.1559866585403555e-07, "loss": 0.817, "step": 44691 }, { "epoch": 0.84, "learning_rate": 3.1552437143999246e-07, "loss": 0.826, "step": 44692 }, { "epoch": 0.84, "learning_rate": 3.154500851827144e-07, "loss": 0.872, "step": 44693 }, { "epoch": 0.84, "learning_rate": 3.1537580708247887e-07, "loss": 0.9495, "step": 44694 }, { "epoch": 0.84, "learning_rate": 3.153015371395629e-07, "loss": 0.9667, "step": 44695 }, { "epoch": 0.84, "learning_rate": 3.15227275354244e-07, "loss": 0.9596, "step": 44696 }, { "epoch": 0.84, "learning_rate": 3.151530217268001e-07, "loss": 0.8914, "step": 44697 }, { "epoch": 0.84, "learning_rate": 3.1507877625750664e-07, "loss": 0.7331, "step": 44698 }, { "epoch": 0.84, "learning_rate": 3.150045389466433e-07, "loss": 0.9742, "step": 44699 }, { "epoch": 0.84, "learning_rate": 3.149303097944853e-07, "loss": 1.1093, "step": 44700 }, { "epoch": 0.84, "learning_rate": 3.1485608880131053e-07, "loss": 0.6325, "step": 44701 }, { "epoch": 0.84, "learning_rate": 3.147818759673962e-07, "loss": 0.7622, "step": 44702 }, { "epoch": 0.84, "learning_rate": 3.147076712930194e-07, "loss": 0.9042, "step": 44703 }, { "epoch": 0.84, "learning_rate": 3.146334747784571e-07, "loss": 0.6926, "step": 44704 }, { "epoch": 0.84, "learning_rate": 3.145592864239863e-07, "loss": 0.8041, "step": 44705 }, { "epoch": 0.84, "learning_rate": 3.1448510622988484e-07, "loss": 0.9522, "step": 44706 }, { "epoch": 0.84, "learning_rate": 3.144109341964283e-07, "loss": 1.0061, "step": 44707 }, { "epoch": 0.84, "learning_rate": 3.1433677032389447e-07, "loss": 0.9946, "step": 44708 }, { "epoch": 0.84, "learning_rate": 3.142626146125599e-07, "loss": 0.8778, "step": 44709 }, { "epoch": 0.84, "learning_rate": 3.1418846706270186e-07, "loss": 0.8002, "step": 44710 }, { "epoch": 0.84, "learning_rate": 3.1411432767459697e-07, "loss": 0.9022, "step": 44711 }, { "epoch": 0.84, "learning_rate": 3.1404019644852236e-07, "loss": 0.9984, "step": 44712 }, { "epoch": 0.84, "learning_rate": 3.139660733847549e-07, "loss": 0.8179, "step": 44713 }, { "epoch": 0.84, "learning_rate": 3.1389195848357034e-07, "loss": 0.8032, "step": 44714 }, { "epoch": 0.84, "learning_rate": 3.138178517452464e-07, "loss": 0.9608, "step": 44715 }, { "epoch": 0.84, "learning_rate": 3.137437531700602e-07, "loss": 0.8243, "step": 44716 }, { "epoch": 0.84, "learning_rate": 3.1366966275828694e-07, "loss": 0.7956, "step": 44717 }, { "epoch": 0.84, "learning_rate": 3.135955805102048e-07, "loss": 1.0696, "step": 44718 }, { "epoch": 0.84, "learning_rate": 3.1352150642608963e-07, "loss": 0.8401, "step": 44719 }, { "epoch": 0.84, "learning_rate": 3.1344744050621767e-07, "loss": 1.0018, "step": 44720 }, { "epoch": 0.84, "learning_rate": 3.1337338275086617e-07, "loss": 0.9933, "step": 44721 }, { "epoch": 0.84, "learning_rate": 3.132993331603115e-07, "loss": 1.0891, "step": 44722 }, { "epoch": 0.84, "learning_rate": 3.1322529173482996e-07, "loss": 0.8754, "step": 44723 }, { "epoch": 0.84, "learning_rate": 3.131512584746982e-07, "loss": 0.8443, "step": 44724 }, { "epoch": 0.84, "learning_rate": 3.130772333801932e-07, "loss": 1.2783, "step": 44725 }, { "epoch": 0.84, "learning_rate": 3.130032164515895e-07, "loss": 0.8283, "step": 44726 }, { "epoch": 0.84, "learning_rate": 3.129292076891657e-07, "loss": 0.9795, "step": 44727 }, { "epoch": 0.84, "learning_rate": 3.12855207093197e-07, "loss": 0.7215, "step": 44728 }, { "epoch": 0.84, "learning_rate": 3.1278121466395973e-07, "loss": 0.9821, "step": 44729 }, { "epoch": 0.84, "learning_rate": 3.1270723040173005e-07, "loss": 0.8151, "step": 44730 }, { "epoch": 0.84, "learning_rate": 3.12633254306785e-07, "loss": 1.1802, "step": 44731 }, { "epoch": 0.84, "learning_rate": 3.1255928637939997e-07, "loss": 0.8335, "step": 44732 }, { "epoch": 0.84, "learning_rate": 3.124853266198516e-07, "loss": 0.9962, "step": 44733 }, { "epoch": 0.84, "learning_rate": 3.124113750284166e-07, "loss": 0.8551, "step": 44734 }, { "epoch": 0.84, "learning_rate": 3.1233743160536926e-07, "loss": 0.7762, "step": 44735 }, { "epoch": 0.84, "learning_rate": 3.122634963509874e-07, "loss": 0.9213, "step": 44736 }, { "epoch": 0.84, "learning_rate": 3.121895692655472e-07, "loss": 0.9217, "step": 44737 }, { "epoch": 0.84, "learning_rate": 3.1211565034932307e-07, "loss": 0.9467, "step": 44738 }, { "epoch": 0.84, "learning_rate": 3.1204173960259294e-07, "loss": 0.9165, "step": 44739 }, { "epoch": 0.84, "learning_rate": 3.1196783702563127e-07, "loss": 0.8874, "step": 44740 }, { "epoch": 0.84, "learning_rate": 3.118939426187145e-07, "loss": 0.7984, "step": 44741 }, { "epoch": 0.84, "learning_rate": 3.118200563821189e-07, "loss": 0.8096, "step": 44742 }, { "epoch": 0.84, "learning_rate": 3.117461783161202e-07, "loss": 1.0561, "step": 44743 }, { "epoch": 0.84, "learning_rate": 3.116723084209941e-07, "loss": 0.6922, "step": 44744 }, { "epoch": 0.84, "learning_rate": 3.115984466970165e-07, "loss": 0.9755, "step": 44745 }, { "epoch": 0.84, "learning_rate": 3.1152459314446354e-07, "loss": 0.9082, "step": 44746 }, { "epoch": 0.84, "learning_rate": 3.1145074776360974e-07, "loss": 0.8948, "step": 44747 }, { "epoch": 0.84, "learning_rate": 3.1137691055473293e-07, "loss": 0.8313, "step": 44748 }, { "epoch": 0.84, "learning_rate": 3.11303081518107e-07, "loss": 0.9012, "step": 44749 }, { "epoch": 0.84, "learning_rate": 3.112292606540082e-07, "loss": 1.0973, "step": 44750 }, { "epoch": 0.84, "learning_rate": 3.111554479627121e-07, "loss": 0.8642, "step": 44751 }, { "epoch": 0.84, "learning_rate": 3.1108164344449466e-07, "loss": 0.8661, "step": 44752 }, { "epoch": 0.84, "learning_rate": 3.110078470996311e-07, "loss": 0.84, "step": 44753 }, { "epoch": 0.84, "learning_rate": 3.109340589283974e-07, "loss": 0.6309, "step": 44754 }, { "epoch": 0.84, "learning_rate": 3.108602789310691e-07, "loss": 1.0518, "step": 44755 }, { "epoch": 0.84, "learning_rate": 3.1078650710792023e-07, "loss": 0.9136, "step": 44756 }, { "epoch": 0.84, "learning_rate": 3.107127434592283e-07, "loss": 0.7653, "step": 44757 }, { "epoch": 0.84, "learning_rate": 3.106389879852681e-07, "loss": 0.9683, "step": 44758 }, { "epoch": 0.84, "learning_rate": 3.1056524068631384e-07, "loss": 0.7878, "step": 44759 }, { "epoch": 0.84, "learning_rate": 3.104915015626431e-07, "loss": 0.7161, "step": 44760 }, { "epoch": 0.84, "learning_rate": 3.104177706145289e-07, "loss": 0.8148, "step": 44761 }, { "epoch": 0.84, "learning_rate": 3.1034404784224814e-07, "loss": 1.0278, "step": 44762 }, { "epoch": 0.84, "learning_rate": 3.102703332460755e-07, "loss": 1.0037, "step": 44763 }, { "epoch": 0.84, "learning_rate": 3.10196626826286e-07, "loss": 0.7441, "step": 44764 }, { "epoch": 0.84, "learning_rate": 3.101229285831553e-07, "loss": 1.1154, "step": 44765 }, { "epoch": 0.84, "learning_rate": 3.1004923851695844e-07, "loss": 0.9058, "step": 44766 }, { "epoch": 0.84, "learning_rate": 3.0997555662797106e-07, "loss": 0.7563, "step": 44767 }, { "epoch": 0.84, "learning_rate": 3.099018829164668e-07, "loss": 0.9333, "step": 44768 }, { "epoch": 0.84, "learning_rate": 3.09828217382723e-07, "loss": 1.1047, "step": 44769 }, { "epoch": 0.84, "learning_rate": 3.0975456002701273e-07, "loss": 0.9331, "step": 44770 }, { "epoch": 0.84, "learning_rate": 3.096809108496118e-07, "loss": 0.926, "step": 44771 }, { "epoch": 0.84, "learning_rate": 3.096072698507951e-07, "loss": 0.6632, "step": 44772 }, { "epoch": 0.84, "learning_rate": 3.09533637030838e-07, "loss": 0.7955, "step": 44773 }, { "epoch": 0.84, "learning_rate": 3.094600123900149e-07, "loss": 0.9635, "step": 44774 }, { "epoch": 0.84, "learning_rate": 3.0938639592860115e-07, "loss": 0.8741, "step": 44775 }, { "epoch": 0.84, "learning_rate": 3.093127876468718e-07, "loss": 0.8244, "step": 44776 }, { "epoch": 0.84, "learning_rate": 3.092391875451004e-07, "loss": 0.9446, "step": 44777 }, { "epoch": 0.84, "learning_rate": 3.0916559562356286e-07, "loss": 0.7462, "step": 44778 }, { "epoch": 0.84, "learning_rate": 3.090920118825347e-07, "loss": 0.7457, "step": 44779 }, { "epoch": 0.84, "learning_rate": 3.0901843632228867e-07, "loss": 0.8232, "step": 44780 }, { "epoch": 0.84, "learning_rate": 3.0894486894310156e-07, "loss": 0.9214, "step": 44781 }, { "epoch": 0.84, "learning_rate": 3.088713097452467e-07, "loss": 0.7221, "step": 44782 }, { "epoch": 0.84, "learning_rate": 3.087977587289992e-07, "loss": 0.89, "step": 44783 }, { "epoch": 0.84, "learning_rate": 3.087242158946338e-07, "loss": 0.8155, "step": 44784 }, { "epoch": 0.84, "learning_rate": 3.0865068124242473e-07, "loss": 0.6799, "step": 44785 }, { "epoch": 0.84, "learning_rate": 3.085771547726471e-07, "loss": 0.892, "step": 44786 }, { "epoch": 0.84, "learning_rate": 3.085036364855751e-07, "loss": 1.0563, "step": 44787 }, { "epoch": 0.85, "learning_rate": 3.0843012638148373e-07, "loss": 0.9556, "step": 44788 }, { "epoch": 0.85, "learning_rate": 3.083566244606459e-07, "loss": 0.9136, "step": 44789 }, { "epoch": 0.85, "learning_rate": 3.082831307233386e-07, "loss": 0.9467, "step": 44790 }, { "epoch": 0.85, "learning_rate": 3.0820964516983436e-07, "loss": 0.9249, "step": 44791 }, { "epoch": 0.85, "learning_rate": 3.08136167800408e-07, "loss": 0.8021, "step": 44792 }, { "epoch": 0.85, "learning_rate": 3.08062698615334e-07, "loss": 0.99, "step": 44793 }, { "epoch": 0.85, "learning_rate": 3.079892376148866e-07, "loss": 0.9434, "step": 44794 }, { "epoch": 0.85, "learning_rate": 3.0791578479934025e-07, "loss": 0.8226, "step": 44795 }, { "epoch": 0.85, "learning_rate": 3.07842340168969e-07, "loss": 0.9354, "step": 44796 }, { "epoch": 0.85, "learning_rate": 3.0776890372404805e-07, "loss": 0.6604, "step": 44797 }, { "epoch": 0.85, "learning_rate": 3.076954754648495e-07, "loss": 0.8219, "step": 44798 }, { "epoch": 0.85, "learning_rate": 3.0762205539164955e-07, "loss": 1.1075, "step": 44799 }, { "epoch": 0.85, "learning_rate": 3.07548643504722e-07, "loss": 1.071, "step": 44800 }, { "epoch": 0.85, "learning_rate": 3.0747523980433956e-07, "loss": 1.1362, "step": 44801 }, { "epoch": 0.85, "learning_rate": 3.0740184429077834e-07, "loss": 0.9271, "step": 44802 }, { "epoch": 0.85, "learning_rate": 3.073284569643109e-07, "loss": 1.0327, "step": 44803 }, { "epoch": 0.85, "learning_rate": 3.07255077825212e-07, "loss": 0.6, "step": 44804 }, { "epoch": 0.85, "learning_rate": 3.071817068737551e-07, "loss": 0.9207, "step": 44805 }, { "epoch": 0.85, "learning_rate": 3.0710834411021463e-07, "loss": 1.0552, "step": 44806 }, { "epoch": 0.85, "learning_rate": 3.0703498953486426e-07, "loss": 1.1018, "step": 44807 }, { "epoch": 0.85, "learning_rate": 3.0696164314797827e-07, "loss": 0.972, "step": 44808 }, { "epoch": 0.85, "learning_rate": 3.0688830494983057e-07, "loss": 0.9196, "step": 44809 }, { "epoch": 0.85, "learning_rate": 3.0681497494069374e-07, "loss": 0.7485, "step": 44810 }, { "epoch": 0.85, "learning_rate": 3.067416531208436e-07, "loss": 0.9136, "step": 44811 }, { "epoch": 0.85, "learning_rate": 3.066683394905523e-07, "loss": 1.0562, "step": 44812 }, { "epoch": 0.85, "learning_rate": 3.065950340500942e-07, "loss": 0.9615, "step": 44813 }, { "epoch": 0.85, "learning_rate": 3.065217367997428e-07, "loss": 0.8893, "step": 44814 }, { "epoch": 0.85, "learning_rate": 3.0644844773977224e-07, "loss": 1.0313, "step": 44815 }, { "epoch": 0.85, "learning_rate": 3.063751668704559e-07, "loss": 0.9396, "step": 44816 }, { "epoch": 0.85, "learning_rate": 3.063018941920673e-07, "loss": 0.7842, "step": 44817 }, { "epoch": 0.85, "learning_rate": 3.062286297048808e-07, "loss": 0.7338, "step": 44818 }, { "epoch": 0.85, "learning_rate": 3.0615537340916825e-07, "loss": 0.9827, "step": 44819 }, { "epoch": 0.85, "learning_rate": 3.0608212530520485e-07, "loss": 0.818, "step": 44820 }, { "epoch": 0.85, "learning_rate": 3.0600888539326385e-07, "loss": 0.9344, "step": 44821 }, { "epoch": 0.85, "learning_rate": 3.0593565367361746e-07, "loss": 0.8768, "step": 44822 }, { "epoch": 0.85, "learning_rate": 3.058624301465413e-07, "loss": 0.7992, "step": 44823 }, { "epoch": 0.85, "learning_rate": 3.0578921481230676e-07, "loss": 0.815, "step": 44824 }, { "epoch": 0.85, "learning_rate": 3.057160076711882e-07, "loss": 1.2707, "step": 44825 }, { "epoch": 0.85, "learning_rate": 3.056428087234586e-07, "loss": 1.15, "step": 44826 }, { "epoch": 0.85, "learning_rate": 3.0556961796939177e-07, "loss": 0.5857, "step": 44827 }, { "epoch": 0.85, "learning_rate": 3.0549643540926045e-07, "loss": 0.8335, "step": 44828 }, { "epoch": 0.85, "learning_rate": 3.054232610433383e-07, "loss": 0.902, "step": 44829 }, { "epoch": 0.85, "learning_rate": 3.0535009487189875e-07, "loss": 1.0084, "step": 44830 }, { "epoch": 0.85, "learning_rate": 3.052769368952138e-07, "loss": 1.0918, "step": 44831 }, { "epoch": 0.85, "learning_rate": 3.052037871135585e-07, "loss": 0.8358, "step": 44832 }, { "epoch": 0.85, "learning_rate": 3.0513064552720436e-07, "loss": 0.859, "step": 44833 }, { "epoch": 0.85, "learning_rate": 3.050575121364249e-07, "loss": 1.0406, "step": 44834 }, { "epoch": 0.85, "learning_rate": 3.049843869414937e-07, "loss": 0.923, "step": 44835 }, { "epoch": 0.85, "learning_rate": 3.0491126994268345e-07, "loss": 0.8528, "step": 44836 }, { "epoch": 0.85, "learning_rate": 3.048381611402673e-07, "loss": 1.0071, "step": 44837 }, { "epoch": 0.85, "learning_rate": 3.047650605345179e-07, "loss": 0.885, "step": 44838 }, { "epoch": 0.85, "learning_rate": 3.0469196812570906e-07, "loss": 0.8198, "step": 44839 }, { "epoch": 0.85, "learning_rate": 3.0461888391411204e-07, "loss": 0.8914, "step": 44840 }, { "epoch": 0.85, "learning_rate": 3.045458079000016e-07, "loss": 0.838, "step": 44841 }, { "epoch": 0.85, "learning_rate": 3.0447274008365e-07, "loss": 0.9421, "step": 44842 }, { "epoch": 0.85, "learning_rate": 3.0439968046532904e-07, "loss": 0.9289, "step": 44843 }, { "epoch": 0.85, "learning_rate": 3.043266290453131e-07, "loss": 1.1555, "step": 44844 }, { "epoch": 0.85, "learning_rate": 3.0425358582387403e-07, "loss": 1.0568, "step": 44845 }, { "epoch": 0.85, "learning_rate": 3.041805508012846e-07, "loss": 0.8032, "step": 44846 }, { "epoch": 0.85, "learning_rate": 3.041075239778177e-07, "loss": 0.851, "step": 44847 }, { "epoch": 0.85, "learning_rate": 3.040345053537458e-07, "loss": 1.0405, "step": 44848 }, { "epoch": 0.85, "learning_rate": 3.039614949293418e-07, "loss": 0.9, "step": 44849 }, { "epoch": 0.85, "learning_rate": 3.0388849270487825e-07, "loss": 1.0788, "step": 44850 }, { "epoch": 0.85, "learning_rate": 3.0381549868062856e-07, "loss": 0.9298, "step": 44851 }, { "epoch": 0.85, "learning_rate": 3.0374251285686303e-07, "loss": 0.7887, "step": 44852 }, { "epoch": 0.85, "learning_rate": 3.036695352338567e-07, "loss": 0.7866, "step": 44853 }, { "epoch": 0.85, "learning_rate": 3.035965658118806e-07, "loss": 0.8432, "step": 44854 }, { "epoch": 0.85, "learning_rate": 3.0352360459120767e-07, "loss": 1.0049, "step": 44855 }, { "epoch": 0.85, "learning_rate": 3.0345065157211e-07, "loss": 0.9016, "step": 44856 }, { "epoch": 0.85, "learning_rate": 3.0337770675486046e-07, "loss": 1.2029, "step": 44857 }, { "epoch": 0.85, "learning_rate": 3.0330477013973123e-07, "loss": 1.032, "step": 44858 }, { "epoch": 0.85, "learning_rate": 3.0323184172699446e-07, "loss": 0.9435, "step": 44859 }, { "epoch": 0.85, "learning_rate": 3.031589215169231e-07, "loss": 0.8735, "step": 44860 }, { "epoch": 0.85, "learning_rate": 3.030860095097882e-07, "loss": 0.881, "step": 44861 }, { "epoch": 0.85, "learning_rate": 3.030131057058633e-07, "loss": 0.9802, "step": 44862 }, { "epoch": 0.85, "learning_rate": 3.0294021010542046e-07, "loss": 0.9901, "step": 44863 }, { "epoch": 0.85, "learning_rate": 3.028673227087303e-07, "loss": 0.824, "step": 44864 }, { "epoch": 0.85, "learning_rate": 3.0279444351606763e-07, "loss": 0.9991, "step": 44865 }, { "epoch": 0.85, "learning_rate": 3.0272157252770246e-07, "loss": 1.0188, "step": 44866 }, { "epoch": 0.85, "learning_rate": 3.026487097439074e-07, "loss": 0.7599, "step": 44867 }, { "epoch": 0.85, "learning_rate": 3.025758551649549e-07, "loss": 0.9339, "step": 44868 }, { "epoch": 0.85, "learning_rate": 3.0250300879111657e-07, "loss": 0.7625, "step": 44869 }, { "epoch": 0.85, "learning_rate": 3.0243017062266485e-07, "loss": 0.9083, "step": 44870 }, { "epoch": 0.85, "learning_rate": 3.023573406598715e-07, "loss": 0.831, "step": 44871 }, { "epoch": 0.85, "learning_rate": 3.022845189030088e-07, "loss": 0.9455, "step": 44872 }, { "epoch": 0.85, "learning_rate": 3.022117053523474e-07, "loss": 0.7412, "step": 44873 }, { "epoch": 0.85, "learning_rate": 3.021389000081609e-07, "loss": 0.9886, "step": 44874 }, { "epoch": 0.85, "learning_rate": 3.020661028707203e-07, "loss": 0.9948, "step": 44875 }, { "epoch": 0.85, "learning_rate": 3.019933139402972e-07, "loss": 0.9634, "step": 44876 }, { "epoch": 0.85, "learning_rate": 3.0192053321716376e-07, "loss": 0.8752, "step": 44877 }, { "epoch": 0.85, "learning_rate": 3.0184776070159156e-07, "loss": 0.9677, "step": 44878 }, { "epoch": 0.85, "learning_rate": 3.0177499639385237e-07, "loss": 0.6852, "step": 44879 }, { "epoch": 0.85, "learning_rate": 3.01702240294218e-07, "loss": 0.9999, "step": 44880 }, { "epoch": 0.85, "learning_rate": 3.0162949240296056e-07, "loss": 1.1035, "step": 44881 }, { "epoch": 0.85, "learning_rate": 3.015567527203503e-07, "loss": 0.8907, "step": 44882 }, { "epoch": 0.85, "learning_rate": 3.0148402124666023e-07, "loss": 0.722, "step": 44883 }, { "epoch": 0.85, "learning_rate": 3.014112979821618e-07, "loss": 0.7982, "step": 44884 }, { "epoch": 0.85, "learning_rate": 3.013385829271254e-07, "loss": 0.8253, "step": 44885 }, { "epoch": 0.85, "learning_rate": 3.0126587608182404e-07, "loss": 0.8773, "step": 44886 }, { "epoch": 0.85, "learning_rate": 3.011931774465279e-07, "loss": 0.9453, "step": 44887 }, { "epoch": 0.85, "learning_rate": 3.0112048702150924e-07, "loss": 0.9444, "step": 44888 }, { "epoch": 0.85, "learning_rate": 3.010478048070392e-07, "loss": 0.7449, "step": 44889 }, { "epoch": 0.85, "learning_rate": 3.0097513080338926e-07, "loss": 0.9518, "step": 44890 }, { "epoch": 0.85, "learning_rate": 3.009024650108308e-07, "loss": 0.9572, "step": 44891 }, { "epoch": 0.85, "learning_rate": 3.008298074296351e-07, "loss": 0.6418, "step": 44892 }, { "epoch": 0.85, "learning_rate": 3.0075715806007403e-07, "loss": 0.7661, "step": 44893 }, { "epoch": 0.85, "learning_rate": 3.0068451690241724e-07, "loss": 1.0985, "step": 44894 }, { "epoch": 0.85, "learning_rate": 3.00611883956938e-07, "loss": 0.9907, "step": 44895 }, { "epoch": 0.85, "learning_rate": 3.0053925922390594e-07, "loss": 0.8925, "step": 44896 }, { "epoch": 0.85, "learning_rate": 3.0046664270359293e-07, "loss": 0.7255, "step": 44897 }, { "epoch": 0.85, "learning_rate": 3.0039403439627026e-07, "loss": 0.9283, "step": 44898 }, { "epoch": 0.85, "learning_rate": 3.0032143430220843e-07, "loss": 0.9828, "step": 44899 }, { "epoch": 0.85, "learning_rate": 3.002488424216793e-07, "loss": 1.0526, "step": 44900 }, { "epoch": 0.85, "learning_rate": 3.001762587549534e-07, "loss": 0.8524, "step": 44901 }, { "epoch": 0.85, "learning_rate": 3.0010368330230215e-07, "loss": 0.8962, "step": 44902 }, { "epoch": 0.85, "learning_rate": 3.000311160639957e-07, "loss": 0.8932, "step": 44903 }, { "epoch": 0.85, "learning_rate": 2.9995855704030575e-07, "loss": 0.8198, "step": 44904 }, { "epoch": 0.85, "learning_rate": 2.998860062315037e-07, "loss": 1.0395, "step": 44905 }, { "epoch": 0.85, "learning_rate": 2.998134636378591e-07, "loss": 1.1736, "step": 44906 }, { "epoch": 0.85, "learning_rate": 2.997409292596443e-07, "loss": 0.8163, "step": 44907 }, { "epoch": 0.85, "learning_rate": 2.996684030971289e-07, "loss": 0.9291, "step": 44908 }, { "epoch": 0.85, "learning_rate": 2.995958851505845e-07, "loss": 0.8367, "step": 44909 }, { "epoch": 0.85, "learning_rate": 2.9952337542028143e-07, "loss": 0.8452, "step": 44910 }, { "epoch": 0.85, "learning_rate": 2.994508739064905e-07, "loss": 0.7603, "step": 44911 }, { "epoch": 0.85, "learning_rate": 2.993783806094827e-07, "loss": 0.9097, "step": 44912 }, { "epoch": 0.85, "learning_rate": 2.9930589552952835e-07, "loss": 1.0251, "step": 44913 }, { "epoch": 0.85, "learning_rate": 2.992334186668991e-07, "loss": 0.9144, "step": 44914 }, { "epoch": 0.85, "learning_rate": 2.991609500218634e-07, "loss": 0.9229, "step": 44915 }, { "epoch": 0.85, "learning_rate": 2.9908848959469467e-07, "loss": 0.861, "step": 44916 }, { "epoch": 0.85, "learning_rate": 2.9901603738566126e-07, "loss": 0.8915, "step": 44917 }, { "epoch": 0.85, "learning_rate": 2.9894359339503463e-07, "loss": 0.9595, "step": 44918 }, { "epoch": 0.85, "learning_rate": 2.988711576230849e-07, "loss": 1.0125, "step": 44919 }, { "epoch": 0.85, "learning_rate": 2.9879873007008287e-07, "loss": 0.9757, "step": 44920 }, { "epoch": 0.85, "learning_rate": 2.987263107362992e-07, "loss": 0.8054, "step": 44921 }, { "epoch": 0.85, "learning_rate": 2.986538996220037e-07, "loss": 0.7729, "step": 44922 }, { "epoch": 0.85, "learning_rate": 2.985814967274675e-07, "loss": 0.9278, "step": 44923 }, { "epoch": 0.85, "learning_rate": 2.985091020529596e-07, "loss": 0.8032, "step": 44924 }, { "epoch": 0.85, "learning_rate": 2.9843671559875167e-07, "loss": 0.9991, "step": 44925 }, { "epoch": 0.85, "learning_rate": 2.9836433736511407e-07, "loss": 1.0139, "step": 44926 }, { "epoch": 0.85, "learning_rate": 2.9829196735231546e-07, "loss": 0.7362, "step": 44927 }, { "epoch": 0.85, "learning_rate": 2.982196055606285e-07, "loss": 0.9852, "step": 44928 }, { "epoch": 0.85, "learning_rate": 2.981472519903211e-07, "loss": 0.806, "step": 44929 }, { "epoch": 0.85, "learning_rate": 2.980749066416644e-07, "loss": 0.9279, "step": 44930 }, { "epoch": 0.85, "learning_rate": 2.980025695149286e-07, "loss": 1.1396, "step": 44931 }, { "epoch": 0.85, "learning_rate": 2.9793024061038374e-07, "loss": 0.8205, "step": 44932 }, { "epoch": 0.85, "learning_rate": 2.9785791992829963e-07, "loss": 0.8479, "step": 44933 }, { "epoch": 0.85, "learning_rate": 2.977856074689467e-07, "loss": 0.9438, "step": 44934 }, { "epoch": 0.85, "learning_rate": 2.9771330323259546e-07, "loss": 0.7629, "step": 44935 }, { "epoch": 0.85, "learning_rate": 2.9764100721951405e-07, "loss": 0.7305, "step": 44936 }, { "epoch": 0.85, "learning_rate": 2.975687194299745e-07, "loss": 1.0145, "step": 44937 }, { "epoch": 0.85, "learning_rate": 2.9749643986424546e-07, "loss": 1.075, "step": 44938 }, { "epoch": 0.85, "learning_rate": 2.9742416852259705e-07, "loss": 1.0102, "step": 44939 }, { "epoch": 0.85, "learning_rate": 2.9735190540529926e-07, "loss": 0.9479, "step": 44940 }, { "epoch": 0.85, "learning_rate": 2.9727965051262214e-07, "loss": 0.758, "step": 44941 }, { "epoch": 0.85, "learning_rate": 2.9720740384483553e-07, "loss": 0.9235, "step": 44942 }, { "epoch": 0.85, "learning_rate": 2.971351654022081e-07, "loss": 1.0176, "step": 44943 }, { "epoch": 0.85, "learning_rate": 2.9706293518501126e-07, "loss": 0.8512, "step": 44944 }, { "epoch": 0.85, "learning_rate": 2.9699071319351347e-07, "loss": 0.9768, "step": 44945 }, { "epoch": 0.85, "learning_rate": 2.969184994279842e-07, "loss": 0.8481, "step": 44946 }, { "epoch": 0.85, "learning_rate": 2.9684629388869486e-07, "loss": 0.7648, "step": 44947 }, { "epoch": 0.85, "learning_rate": 2.9677409657591333e-07, "loss": 0.7661, "step": 44948 }, { "epoch": 0.85, "learning_rate": 2.9670190748990965e-07, "loss": 0.8891, "step": 44949 }, { "epoch": 0.85, "learning_rate": 2.9662972663095367e-07, "loss": 0.954, "step": 44950 }, { "epoch": 0.85, "learning_rate": 2.9655755399931483e-07, "loss": 0.9257, "step": 44951 }, { "epoch": 0.85, "learning_rate": 2.964853895952624e-07, "loss": 0.9065, "step": 44952 }, { "epoch": 0.85, "learning_rate": 2.9641323341906586e-07, "loss": 0.8569, "step": 44953 }, { "epoch": 0.85, "learning_rate": 2.9634108547099557e-07, "loss": 0.7791, "step": 44954 }, { "epoch": 0.85, "learning_rate": 2.962689457513188e-07, "loss": 0.8, "step": 44955 }, { "epoch": 0.85, "learning_rate": 2.961968142603072e-07, "loss": 1.0993, "step": 44956 }, { "epoch": 0.85, "learning_rate": 2.9612469099822875e-07, "loss": 0.9315, "step": 44957 }, { "epoch": 0.85, "learning_rate": 2.960525759653532e-07, "loss": 0.6561, "step": 44958 }, { "epoch": 0.85, "learning_rate": 2.9598046916194946e-07, "loss": 0.9992, "step": 44959 }, { "epoch": 0.85, "learning_rate": 2.9590837058828733e-07, "loss": 0.7675, "step": 44960 }, { "epoch": 0.85, "learning_rate": 2.9583628024463575e-07, "loss": 0.8741, "step": 44961 }, { "epoch": 0.85, "learning_rate": 2.9576419813126393e-07, "loss": 1.04, "step": 44962 }, { "epoch": 0.85, "learning_rate": 2.956921242484415e-07, "loss": 0.8169, "step": 44963 }, { "epoch": 0.85, "learning_rate": 2.956200585964358e-07, "loss": 0.8161, "step": 44964 }, { "epoch": 0.85, "learning_rate": 2.9554800117551854e-07, "loss": 0.8929, "step": 44965 }, { "epoch": 0.85, "learning_rate": 2.954759519859568e-07, "loss": 1.0126, "step": 44966 }, { "epoch": 0.85, "learning_rate": 2.954039110280199e-07, "loss": 0.8438, "step": 44967 }, { "epoch": 0.85, "learning_rate": 2.9533187830197817e-07, "loss": 0.8896, "step": 44968 }, { "epoch": 0.85, "learning_rate": 2.952598538080992e-07, "loss": 0.4767, "step": 44969 }, { "epoch": 0.85, "learning_rate": 2.9518783754665217e-07, "loss": 0.8802, "step": 44970 }, { "epoch": 0.85, "learning_rate": 2.9511582951790604e-07, "loss": 0.7343, "step": 44971 }, { "epoch": 0.85, "learning_rate": 2.9504382972213004e-07, "loss": 0.928, "step": 44972 }, { "epoch": 0.85, "learning_rate": 2.9497183815959255e-07, "loss": 0.9007, "step": 44973 }, { "epoch": 0.85, "learning_rate": 2.948998548305629e-07, "loss": 0.7962, "step": 44974 }, { "epoch": 0.85, "learning_rate": 2.948278797353099e-07, "loss": 0.9978, "step": 44975 }, { "epoch": 0.85, "learning_rate": 2.947559128741009e-07, "loss": 1.0333, "step": 44976 }, { "epoch": 0.85, "learning_rate": 2.9468395424720687e-07, "loss": 0.9186, "step": 44977 }, { "epoch": 0.85, "learning_rate": 2.94612003854895e-07, "loss": 0.7997, "step": 44978 }, { "epoch": 0.85, "learning_rate": 2.9454006169743396e-07, "loss": 0.772, "step": 44979 }, { "epoch": 0.85, "learning_rate": 2.944681277750927e-07, "loss": 0.8842, "step": 44980 }, { "epoch": 0.85, "learning_rate": 2.9439620208813995e-07, "loss": 1.0339, "step": 44981 }, { "epoch": 0.85, "learning_rate": 2.9432428463684435e-07, "loss": 1.0273, "step": 44982 }, { "epoch": 0.85, "learning_rate": 2.942523754214741e-07, "loss": 0.9828, "step": 44983 }, { "epoch": 0.85, "learning_rate": 2.9418047444229824e-07, "loss": 0.9628, "step": 44984 }, { "epoch": 0.85, "learning_rate": 2.9410858169958396e-07, "loss": 0.8074, "step": 44985 }, { "epoch": 0.85, "learning_rate": 2.940366971936015e-07, "loss": 0.8071, "step": 44986 }, { "epoch": 0.85, "learning_rate": 2.939648209246179e-07, "loss": 1.0685, "step": 44987 }, { "epoch": 0.85, "learning_rate": 2.938929528929016e-07, "loss": 0.9271, "step": 44988 }, { "epoch": 0.85, "learning_rate": 2.938210930987223e-07, "loss": 0.6206, "step": 44989 }, { "epoch": 0.85, "learning_rate": 2.937492415423471e-07, "loss": 0.9312, "step": 44990 }, { "epoch": 0.85, "learning_rate": 2.936773982240443e-07, "loss": 0.6381, "step": 44991 }, { "epoch": 0.85, "learning_rate": 2.936055631440826e-07, "loss": 0.9283, "step": 44992 }, { "epoch": 0.85, "learning_rate": 2.935337363027299e-07, "loss": 0.8884, "step": 44993 }, { "epoch": 0.85, "learning_rate": 2.9346191770025484e-07, "loss": 0.8575, "step": 44994 }, { "epoch": 0.85, "learning_rate": 2.933901073369252e-07, "loss": 0.9622, "step": 44995 }, { "epoch": 0.85, "learning_rate": 2.933183052130098e-07, "loss": 0.8094, "step": 44996 }, { "epoch": 0.85, "learning_rate": 2.9324651132877494e-07, "loss": 0.9454, "step": 44997 }, { "epoch": 0.85, "learning_rate": 2.9317472568449136e-07, "loss": 0.7149, "step": 44998 }, { "epoch": 0.85, "learning_rate": 2.9310294828042487e-07, "loss": 0.8719, "step": 44999 }, { "epoch": 0.85, "learning_rate": 2.930311791168444e-07, "loss": 1.1319, "step": 45000 }, { "epoch": 0.85, "learning_rate": 2.9295941819401793e-07, "loss": 0.8676, "step": 45001 }, { "epoch": 0.85, "learning_rate": 2.9288766551221313e-07, "loss": 0.724, "step": 45002 }, { "epoch": 0.85, "learning_rate": 2.9281592107169824e-07, "loss": 0.9797, "step": 45003 }, { "epoch": 0.85, "learning_rate": 2.927441848727411e-07, "loss": 0.7671, "step": 45004 }, { "epoch": 0.85, "learning_rate": 2.9267245691561e-07, "loss": 1.0104, "step": 45005 }, { "epoch": 0.85, "learning_rate": 2.92600737200571e-07, "loss": 0.909, "step": 45006 }, { "epoch": 0.85, "learning_rate": 2.9252902572789453e-07, "loss": 0.77, "step": 45007 }, { "epoch": 0.85, "learning_rate": 2.924573224978461e-07, "loss": 0.8707, "step": 45008 }, { "epoch": 0.85, "learning_rate": 2.923856275106943e-07, "loss": 0.7411, "step": 45009 }, { "epoch": 0.85, "learning_rate": 2.923139407667075e-07, "loss": 0.685, "step": 45010 }, { "epoch": 0.85, "learning_rate": 2.922422622661525e-07, "loss": 0.9034, "step": 45011 }, { "epoch": 0.85, "learning_rate": 2.921705920092971e-07, "loss": 1.0518, "step": 45012 }, { "epoch": 0.85, "learning_rate": 2.9209892999640886e-07, "loss": 0.8638, "step": 45013 }, { "epoch": 0.85, "learning_rate": 2.920272762277557e-07, "loss": 1.0003, "step": 45014 }, { "epoch": 0.85, "learning_rate": 2.919556307036051e-07, "loss": 0.9057, "step": 45015 }, { "epoch": 0.85, "learning_rate": 2.918839934242243e-07, "loss": 0.9334, "step": 45016 }, { "epoch": 0.85, "learning_rate": 2.9181236438988155e-07, "loss": 0.7233, "step": 45017 }, { "epoch": 0.85, "learning_rate": 2.9174074360084265e-07, "loss": 1.2847, "step": 45018 }, { "epoch": 0.85, "learning_rate": 2.9166913105737715e-07, "loss": 1.0376, "step": 45019 }, { "epoch": 0.85, "learning_rate": 2.9159752675975093e-07, "loss": 0.7227, "step": 45020 }, { "epoch": 0.85, "learning_rate": 2.915259307082316e-07, "loss": 0.8912, "step": 45021 }, { "epoch": 0.85, "learning_rate": 2.9145434290308695e-07, "loss": 0.8707, "step": 45022 }, { "epoch": 0.85, "learning_rate": 2.91382763344584e-07, "loss": 0.7221, "step": 45023 }, { "epoch": 0.85, "learning_rate": 2.913111920329903e-07, "loss": 0.9934, "step": 45024 }, { "epoch": 0.85, "learning_rate": 2.912396289685726e-07, "loss": 1.1559, "step": 45025 }, { "epoch": 0.85, "learning_rate": 2.91168074151599e-07, "loss": 0.7395, "step": 45026 }, { "epoch": 0.85, "learning_rate": 2.910965275823352e-07, "loss": 0.9367, "step": 45027 }, { "epoch": 0.85, "learning_rate": 2.9102498926105033e-07, "loss": 0.7363, "step": 45028 }, { "epoch": 0.85, "learning_rate": 2.909534591880095e-07, "loss": 0.8614, "step": 45029 }, { "epoch": 0.85, "learning_rate": 2.9088193736348053e-07, "loss": 0.7941, "step": 45030 }, { "epoch": 0.85, "learning_rate": 2.9081042378773153e-07, "loss": 1.1564, "step": 45031 }, { "epoch": 0.85, "learning_rate": 2.9073891846102845e-07, "loss": 0.9355, "step": 45032 }, { "epoch": 0.85, "learning_rate": 2.906674213836383e-07, "loss": 0.8022, "step": 45033 }, { "epoch": 0.85, "learning_rate": 2.905959325558283e-07, "loss": 0.9641, "step": 45034 }, { "epoch": 0.85, "learning_rate": 2.905244519778652e-07, "loss": 0.7905, "step": 45035 }, { "epoch": 0.85, "learning_rate": 2.9045297965001633e-07, "loss": 0.9445, "step": 45036 }, { "epoch": 0.85, "learning_rate": 2.9038151557254814e-07, "loss": 0.7623, "step": 45037 }, { "epoch": 0.85, "learning_rate": 2.9031005974572814e-07, "loss": 0.9148, "step": 45038 }, { "epoch": 0.85, "learning_rate": 2.902386121698214e-07, "loss": 0.8705, "step": 45039 }, { "epoch": 0.85, "learning_rate": 2.9016717284509723e-07, "loss": 0.9588, "step": 45040 }, { "epoch": 0.85, "learning_rate": 2.900957417718206e-07, "loss": 0.7131, "step": 45041 }, { "epoch": 0.85, "learning_rate": 2.9002431895025857e-07, "loss": 0.7952, "step": 45042 }, { "epoch": 0.85, "learning_rate": 2.8995290438067786e-07, "loss": 1.0537, "step": 45043 }, { "epoch": 0.85, "learning_rate": 2.898814980633455e-07, "loss": 1.1231, "step": 45044 }, { "epoch": 0.85, "learning_rate": 2.898100999985276e-07, "loss": 0.8093, "step": 45045 }, { "epoch": 0.85, "learning_rate": 2.897387101864912e-07, "loss": 0.9252, "step": 45046 }, { "epoch": 0.85, "learning_rate": 2.896673286275034e-07, "loss": 0.8315, "step": 45047 }, { "epoch": 0.85, "learning_rate": 2.895959553218286e-07, "loss": 0.7294, "step": 45048 }, { "epoch": 0.85, "learning_rate": 2.895245902697355e-07, "loss": 0.7563, "step": 45049 }, { "epoch": 0.85, "learning_rate": 2.8945323347149027e-07, "loss": 0.9866, "step": 45050 }, { "epoch": 0.85, "learning_rate": 2.8938188492735774e-07, "loss": 0.8828, "step": 45051 }, { "epoch": 0.85, "learning_rate": 2.8931054463760654e-07, "loss": 0.7795, "step": 45052 }, { "epoch": 0.85, "learning_rate": 2.892392126025015e-07, "loss": 0.9358, "step": 45053 }, { "epoch": 0.85, "learning_rate": 2.8916788882230954e-07, "loss": 1.0571, "step": 45054 }, { "epoch": 0.85, "learning_rate": 2.890965732972967e-07, "loss": 1.0393, "step": 45055 }, { "epoch": 0.85, "learning_rate": 2.8902526602772987e-07, "loss": 0.9762, "step": 45056 }, { "epoch": 0.85, "learning_rate": 2.889539670138744e-07, "loss": 0.833, "step": 45057 }, { "epoch": 0.85, "learning_rate": 2.888826762559974e-07, "loss": 0.6947, "step": 45058 }, { "epoch": 0.85, "learning_rate": 2.888113937543649e-07, "loss": 0.8377, "step": 45059 }, { "epoch": 0.85, "learning_rate": 2.8874011950924207e-07, "loss": 0.9477, "step": 45060 }, { "epoch": 0.85, "learning_rate": 2.8866885352089675e-07, "loss": 0.9885, "step": 45061 }, { "epoch": 0.85, "learning_rate": 2.8859759578959367e-07, "loss": 0.8757, "step": 45062 }, { "epoch": 0.85, "learning_rate": 2.885263463155993e-07, "loss": 0.9709, "step": 45063 }, { "epoch": 0.85, "learning_rate": 2.884551050991799e-07, "loss": 0.9313, "step": 45064 }, { "epoch": 0.85, "learning_rate": 2.883838721406013e-07, "loss": 0.9823, "step": 45065 }, { "epoch": 0.85, "learning_rate": 2.883126474401293e-07, "loss": 0.8004, "step": 45066 }, { "epoch": 0.85, "learning_rate": 2.8824143099803027e-07, "loss": 0.7408, "step": 45067 }, { "epoch": 0.85, "learning_rate": 2.8817022281457023e-07, "loss": 0.8071, "step": 45068 }, { "epoch": 0.85, "learning_rate": 2.880990228900141e-07, "loss": 1.0164, "step": 45069 }, { "epoch": 0.85, "learning_rate": 2.8802783122462846e-07, "loss": 0.9057, "step": 45070 }, { "epoch": 0.85, "learning_rate": 2.879566478186799e-07, "loss": 0.8596, "step": 45071 }, { "epoch": 0.85, "learning_rate": 2.8788547267243225e-07, "loss": 0.8969, "step": 45072 }, { "epoch": 0.85, "learning_rate": 2.878143057861535e-07, "loss": 0.9684, "step": 45073 }, { "epoch": 0.85, "learning_rate": 2.8774314716010774e-07, "loss": 1.1737, "step": 45074 }, { "epoch": 0.85, "learning_rate": 2.8767199679456124e-07, "loss": 1.0309, "step": 45075 }, { "epoch": 0.85, "learning_rate": 2.876008546897799e-07, "loss": 1.0244, "step": 45076 }, { "epoch": 0.85, "learning_rate": 2.8752972084602897e-07, "loss": 0.7829, "step": 45077 }, { "epoch": 0.85, "learning_rate": 2.8745859526357415e-07, "loss": 0.9603, "step": 45078 }, { "epoch": 0.85, "learning_rate": 2.8738747794268106e-07, "loss": 0.8768, "step": 45079 }, { "epoch": 0.85, "learning_rate": 2.8731636888361584e-07, "loss": 0.934, "step": 45080 }, { "epoch": 0.85, "learning_rate": 2.872452680866425e-07, "loss": 0.9314, "step": 45081 }, { "epoch": 0.85, "learning_rate": 2.871741755520285e-07, "loss": 0.7801, "step": 45082 }, { "epoch": 0.85, "learning_rate": 2.871030912800377e-07, "loss": 1.0658, "step": 45083 }, { "epoch": 0.85, "learning_rate": 2.870320152709363e-07, "loss": 0.9169, "step": 45084 }, { "epoch": 0.85, "learning_rate": 2.8696094752498934e-07, "loss": 0.8813, "step": 45085 }, { "epoch": 0.85, "learning_rate": 2.8688988804246225e-07, "loss": 0.9774, "step": 45086 }, { "epoch": 0.85, "learning_rate": 2.868188368236208e-07, "loss": 1.0998, "step": 45087 }, { "epoch": 0.85, "learning_rate": 2.8674779386872963e-07, "loss": 0.9409, "step": 45088 }, { "epoch": 0.85, "learning_rate": 2.8667675917805503e-07, "loss": 0.9644, "step": 45089 }, { "epoch": 0.85, "learning_rate": 2.8660573275186035e-07, "loss": 0.935, "step": 45090 }, { "epoch": 0.85, "learning_rate": 2.8653471459041263e-07, "loss": 0.9563, "step": 45091 }, { "epoch": 0.85, "learning_rate": 2.8646370469397693e-07, "loss": 0.9805, "step": 45092 }, { "epoch": 0.85, "learning_rate": 2.863927030628169e-07, "loss": 1.0035, "step": 45093 }, { "epoch": 0.85, "learning_rate": 2.863217096971996e-07, "loss": 1.0184, "step": 45094 }, { "epoch": 0.85, "learning_rate": 2.862507245973886e-07, "loss": 0.9595, "step": 45095 }, { "epoch": 0.85, "learning_rate": 2.8617974776364967e-07, "loss": 0.8726, "step": 45096 }, { "epoch": 0.85, "learning_rate": 2.861087791962477e-07, "loss": 1.0475, "step": 45097 }, { "epoch": 0.85, "learning_rate": 2.860378188954474e-07, "loss": 0.9285, "step": 45098 }, { "epoch": 0.85, "learning_rate": 2.8596686686151427e-07, "loss": 0.8658, "step": 45099 }, { "epoch": 0.85, "learning_rate": 2.858959230947128e-07, "loss": 0.9605, "step": 45100 }, { "epoch": 0.85, "learning_rate": 2.8582498759530866e-07, "loss": 0.855, "step": 45101 }, { "epoch": 0.85, "learning_rate": 2.8575406036356527e-07, "loss": 0.7937, "step": 45102 }, { "epoch": 0.85, "learning_rate": 2.8568314139974906e-07, "loss": 0.8741, "step": 45103 }, { "epoch": 0.85, "learning_rate": 2.856122307041237e-07, "loss": 0.8024, "step": 45104 }, { "epoch": 0.85, "learning_rate": 2.855413282769545e-07, "loss": 0.7242, "step": 45105 }, { "epoch": 0.85, "learning_rate": 2.8547043411850606e-07, "loss": 0.9049, "step": 45106 }, { "epoch": 0.85, "learning_rate": 2.853995482290431e-07, "loss": 0.8464, "step": 45107 }, { "epoch": 0.85, "learning_rate": 2.8532867060883015e-07, "loss": 0.939, "step": 45108 }, { "epoch": 0.85, "learning_rate": 2.8525780125813225e-07, "loss": 0.9907, "step": 45109 }, { "epoch": 0.85, "learning_rate": 2.851869401772142e-07, "loss": 0.7412, "step": 45110 }, { "epoch": 0.85, "learning_rate": 2.8511608736633915e-07, "loss": 0.9742, "step": 45111 }, { "epoch": 0.85, "learning_rate": 2.850452428257733e-07, "loss": 1.0731, "step": 45112 }, { "epoch": 0.85, "learning_rate": 2.849744065557811e-07, "loss": 0.9254, "step": 45113 }, { "epoch": 0.85, "learning_rate": 2.8490357855662566e-07, "loss": 0.9528, "step": 45114 }, { "epoch": 0.85, "learning_rate": 2.848327588285732e-07, "loss": 0.9961, "step": 45115 }, { "epoch": 0.85, "learning_rate": 2.8476194737188684e-07, "loss": 0.8486, "step": 45116 }, { "epoch": 0.85, "learning_rate": 2.8469114418683134e-07, "loss": 0.95, "step": 45117 }, { "epoch": 0.85, "learning_rate": 2.8462034927367154e-07, "loss": 0.9493, "step": 45118 }, { "epoch": 0.85, "learning_rate": 2.845495626326711e-07, "loss": 0.9566, "step": 45119 }, { "epoch": 0.85, "learning_rate": 2.8447878426409476e-07, "loss": 0.899, "step": 45120 }, { "epoch": 0.85, "learning_rate": 2.844080141682068e-07, "loss": 0.8677, "step": 45121 }, { "epoch": 0.85, "learning_rate": 2.843372523452717e-07, "loss": 0.9417, "step": 45122 }, { "epoch": 0.85, "learning_rate": 2.8426649879555234e-07, "loss": 0.8265, "step": 45123 }, { "epoch": 0.85, "learning_rate": 2.841957535193152e-07, "loss": 0.8052, "step": 45124 }, { "epoch": 0.85, "learning_rate": 2.8412501651682246e-07, "loss": 1.1935, "step": 45125 }, { "epoch": 0.85, "learning_rate": 2.84054287788339e-07, "loss": 0.8381, "step": 45126 }, { "epoch": 0.85, "learning_rate": 2.8398356733412904e-07, "loss": 0.9128, "step": 45127 }, { "epoch": 0.85, "learning_rate": 2.8391285515445623e-07, "loss": 0.9804, "step": 45128 }, { "epoch": 0.85, "learning_rate": 2.838421512495851e-07, "loss": 0.9533, "step": 45129 }, { "epoch": 0.85, "learning_rate": 2.837714556197793e-07, "loss": 0.8769, "step": 45130 }, { "epoch": 0.85, "learning_rate": 2.837007682653034e-07, "loss": 1.0355, "step": 45131 }, { "epoch": 0.85, "learning_rate": 2.836300891864202e-07, "loss": 0.7908, "step": 45132 }, { "epoch": 0.85, "learning_rate": 2.835594183833945e-07, "loss": 0.8903, "step": 45133 }, { "epoch": 0.85, "learning_rate": 2.8348875585649054e-07, "loss": 0.7143, "step": 45134 }, { "epoch": 0.85, "learning_rate": 2.834181016059706e-07, "loss": 0.9432, "step": 45135 }, { "epoch": 0.85, "learning_rate": 2.8334745563210033e-07, "loss": 0.9633, "step": 45136 }, { "epoch": 0.85, "learning_rate": 2.832768179351425e-07, "loss": 0.8794, "step": 45137 }, { "epoch": 0.85, "learning_rate": 2.8320618851536083e-07, "loss": 1.0338, "step": 45138 }, { "epoch": 0.85, "learning_rate": 2.8313556737301933e-07, "loss": 0.973, "step": 45139 }, { "epoch": 0.85, "learning_rate": 2.830649545083819e-07, "loss": 0.9764, "step": 45140 }, { "epoch": 0.85, "learning_rate": 2.8299434992171163e-07, "loss": 0.8522, "step": 45141 }, { "epoch": 0.85, "learning_rate": 2.8292375361327256e-07, "loss": 0.7648, "step": 45142 }, { "epoch": 0.85, "learning_rate": 2.828531655833289e-07, "loss": 0.9323, "step": 45143 }, { "epoch": 0.85, "learning_rate": 2.827825858321423e-07, "loss": 0.9581, "step": 45144 }, { "epoch": 0.85, "learning_rate": 2.8271201435997875e-07, "loss": 1.0386, "step": 45145 }, { "epoch": 0.85, "learning_rate": 2.826414511671e-07, "loss": 0.76, "step": 45146 }, { "epoch": 0.85, "learning_rate": 2.825708962537699e-07, "loss": 0.9218, "step": 45147 }, { "epoch": 0.85, "learning_rate": 2.8250034962025247e-07, "loss": 1.0021, "step": 45148 }, { "epoch": 0.85, "learning_rate": 2.824298112668103e-07, "loss": 0.8924, "step": 45149 }, { "epoch": 0.85, "learning_rate": 2.823592811937076e-07, "loss": 1.0316, "step": 45150 }, { "epoch": 0.85, "learning_rate": 2.822887594012072e-07, "loss": 0.8428, "step": 45151 }, { "epoch": 0.85, "learning_rate": 2.8221824588957283e-07, "loss": 0.8022, "step": 45152 }, { "epoch": 0.85, "learning_rate": 2.82147740659067e-07, "loss": 0.8134, "step": 45153 }, { "epoch": 0.85, "learning_rate": 2.8207724370995363e-07, "loss": 0.7511, "step": 45154 }, { "epoch": 0.85, "learning_rate": 2.8200675504249655e-07, "loss": 0.8105, "step": 45155 }, { "epoch": 0.85, "learning_rate": 2.8193627465695704e-07, "loss": 1.1737, "step": 45156 }, { "epoch": 0.85, "learning_rate": 2.8186580255360055e-07, "loss": 0.983, "step": 45157 }, { "epoch": 0.85, "learning_rate": 2.817953387326888e-07, "loss": 0.8032, "step": 45158 }, { "epoch": 0.85, "learning_rate": 2.8172488319448495e-07, "loss": 0.8461, "step": 45159 }, { "epoch": 0.85, "learning_rate": 2.816544359392526e-07, "loss": 0.6246, "step": 45160 }, { "epoch": 0.85, "learning_rate": 2.8158399696725456e-07, "loss": 1.0505, "step": 45161 }, { "epoch": 0.85, "learning_rate": 2.8151356627875383e-07, "loss": 1.0218, "step": 45162 }, { "epoch": 0.85, "learning_rate": 2.814431438740134e-07, "loss": 0.966, "step": 45163 }, { "epoch": 0.85, "learning_rate": 2.813727297532967e-07, "loss": 0.8358, "step": 45164 }, { "epoch": 0.85, "learning_rate": 2.813023239168652e-07, "loss": 0.7809, "step": 45165 }, { "epoch": 0.85, "learning_rate": 2.8123192636498404e-07, "loss": 0.8472, "step": 45166 }, { "epoch": 0.85, "learning_rate": 2.81161537097914e-07, "loss": 0.7141, "step": 45167 }, { "epoch": 0.85, "learning_rate": 2.810911561159191e-07, "loss": 1.0378, "step": 45168 }, { "epoch": 0.85, "learning_rate": 2.810207834192616e-07, "loss": 0.9725, "step": 45169 }, { "epoch": 0.85, "learning_rate": 2.8095041900820433e-07, "loss": 0.7511, "step": 45170 }, { "epoch": 0.85, "learning_rate": 2.808800628830102e-07, "loss": 0.8781, "step": 45171 }, { "epoch": 0.85, "learning_rate": 2.8080971504394207e-07, "loss": 1.0112, "step": 45172 }, { "epoch": 0.85, "learning_rate": 2.8073937549126267e-07, "loss": 0.751, "step": 45173 }, { "epoch": 0.85, "learning_rate": 2.8066904422523354e-07, "loss": 0.9967, "step": 45174 }, { "epoch": 0.85, "learning_rate": 2.8059872124611864e-07, "loss": 1.1524, "step": 45175 }, { "epoch": 0.85, "learning_rate": 2.805284065541805e-07, "loss": 0.7242, "step": 45176 }, { "epoch": 0.85, "learning_rate": 2.804581001496809e-07, "loss": 0.8804, "step": 45177 }, { "epoch": 0.85, "learning_rate": 2.803878020328826e-07, "loss": 0.7709, "step": 45178 }, { "epoch": 0.85, "learning_rate": 2.803175122040483e-07, "loss": 0.9303, "step": 45179 }, { "epoch": 0.85, "learning_rate": 2.802472306634402e-07, "loss": 1.0232, "step": 45180 }, { "epoch": 0.85, "learning_rate": 2.801769574113208e-07, "loss": 0.9355, "step": 45181 }, { "epoch": 0.85, "learning_rate": 2.8010669244795285e-07, "loss": 0.8827, "step": 45182 }, { "epoch": 0.85, "learning_rate": 2.800364357735988e-07, "loss": 1.0388, "step": 45183 }, { "epoch": 0.85, "learning_rate": 2.7996618738851985e-07, "loss": 0.8285, "step": 45184 }, { "epoch": 0.85, "learning_rate": 2.798959472929796e-07, "loss": 0.8156, "step": 45185 }, { "epoch": 0.85, "learning_rate": 2.7982571548723967e-07, "loss": 0.8224, "step": 45186 }, { "epoch": 0.85, "learning_rate": 2.7975549197156253e-07, "loss": 0.9819, "step": 45187 }, { "epoch": 0.85, "learning_rate": 2.796852767462102e-07, "loss": 0.9084, "step": 45188 }, { "epoch": 0.85, "learning_rate": 2.796150698114447e-07, "loss": 0.9224, "step": 45189 }, { "epoch": 0.85, "learning_rate": 2.795448711675289e-07, "loss": 0.9561, "step": 45190 }, { "epoch": 0.85, "learning_rate": 2.794746808147242e-07, "loss": 0.8289, "step": 45191 }, { "epoch": 0.85, "learning_rate": 2.7940449875329344e-07, "loss": 0.8204, "step": 45192 }, { "epoch": 0.85, "learning_rate": 2.7933432498349733e-07, "loss": 1.2048, "step": 45193 }, { "epoch": 0.85, "learning_rate": 2.7926415950559976e-07, "loss": 1.0703, "step": 45194 }, { "epoch": 0.85, "learning_rate": 2.791940023198611e-07, "loss": 0.9145, "step": 45195 }, { "epoch": 0.85, "learning_rate": 2.791238534265434e-07, "loss": 0.8933, "step": 45196 }, { "epoch": 0.85, "learning_rate": 2.790537128259102e-07, "loss": 0.8199, "step": 45197 }, { "epoch": 0.85, "learning_rate": 2.78983580518222e-07, "loss": 0.8791, "step": 45198 }, { "epoch": 0.85, "learning_rate": 2.7891345650374075e-07, "loss": 0.8157, "step": 45199 }, { "epoch": 0.85, "learning_rate": 2.788433407827287e-07, "loss": 1.0545, "step": 45200 }, { "epoch": 0.85, "learning_rate": 2.787732333554477e-07, "loss": 0.9243, "step": 45201 }, { "epoch": 0.85, "learning_rate": 2.7870313422215913e-07, "loss": 0.792, "step": 45202 }, { "epoch": 0.85, "learning_rate": 2.78633043383125e-07, "loss": 0.7909, "step": 45203 }, { "epoch": 0.85, "learning_rate": 2.7856296083860726e-07, "loss": 0.6811, "step": 45204 }, { "epoch": 0.85, "learning_rate": 2.784928865888667e-07, "loss": 0.984, "step": 45205 }, { "epoch": 0.85, "learning_rate": 2.784228206341663e-07, "loss": 1.1594, "step": 45206 }, { "epoch": 0.85, "learning_rate": 2.7835276297476675e-07, "loss": 0.9562, "step": 45207 }, { "epoch": 0.85, "learning_rate": 2.782827136109295e-07, "loss": 0.8274, "step": 45208 }, { "epoch": 0.85, "learning_rate": 2.7821267254291684e-07, "loss": 0.7741, "step": 45209 }, { "epoch": 0.85, "learning_rate": 2.7814263977098963e-07, "loss": 0.7714, "step": 45210 }, { "epoch": 0.85, "learning_rate": 2.7807261529540995e-07, "loss": 0.5791, "step": 45211 }, { "epoch": 0.85, "learning_rate": 2.780025991164387e-07, "loss": 1.0245, "step": 45212 }, { "epoch": 0.85, "learning_rate": 2.7793259123433836e-07, "loss": 0.9768, "step": 45213 }, { "epoch": 0.85, "learning_rate": 2.778625916493685e-07, "loss": 0.9124, "step": 45214 }, { "epoch": 0.85, "learning_rate": 2.7779260036179256e-07, "loss": 0.8706, "step": 45215 }, { "epoch": 0.85, "learning_rate": 2.7772261737187054e-07, "loss": 0.8813, "step": 45216 }, { "epoch": 0.85, "learning_rate": 2.7765264267986343e-07, "loss": 0.7407, "step": 45217 }, { "epoch": 0.85, "learning_rate": 2.7758267628603455e-07, "loss": 0.9938, "step": 45218 }, { "epoch": 0.85, "learning_rate": 2.7751271819064283e-07, "loss": 1.0294, "step": 45219 }, { "epoch": 0.85, "learning_rate": 2.7744276839395096e-07, "loss": 0.9859, "step": 45220 }, { "epoch": 0.85, "learning_rate": 2.773728268962195e-07, "loss": 0.9853, "step": 45221 }, { "epoch": 0.85, "learning_rate": 2.7730289369770955e-07, "loss": 0.8376, "step": 45222 }, { "epoch": 0.85, "learning_rate": 2.7723296879868274e-07, "loss": 0.6936, "step": 45223 }, { "epoch": 0.85, "learning_rate": 2.7716305219939953e-07, "loss": 0.9373, "step": 45224 }, { "epoch": 0.85, "learning_rate": 2.7709314390012203e-07, "loss": 0.8001, "step": 45225 }, { "epoch": 0.85, "learning_rate": 2.7702324390110974e-07, "loss": 0.9076, "step": 45226 }, { "epoch": 0.85, "learning_rate": 2.769533522026252e-07, "loss": 0.8771, "step": 45227 }, { "epoch": 0.85, "learning_rate": 2.768834688049282e-07, "loss": 0.8959, "step": 45228 }, { "epoch": 0.85, "learning_rate": 2.768135937082803e-07, "loss": 0.778, "step": 45229 }, { "epoch": 0.85, "learning_rate": 2.767437269129422e-07, "loss": 1.0518, "step": 45230 }, { "epoch": 0.85, "learning_rate": 2.76673868419175e-07, "loss": 0.9436, "step": 45231 }, { "epoch": 0.85, "learning_rate": 2.766040182272395e-07, "loss": 0.7525, "step": 45232 }, { "epoch": 0.85, "learning_rate": 2.7653417633739605e-07, "loss": 0.9694, "step": 45233 }, { "epoch": 0.85, "learning_rate": 2.764643427499067e-07, "loss": 1.0134, "step": 45234 }, { "epoch": 0.85, "learning_rate": 2.763945174650301e-07, "loss": 0.8629, "step": 45235 }, { "epoch": 0.85, "learning_rate": 2.763247004830291e-07, "loss": 0.8462, "step": 45236 }, { "epoch": 0.85, "learning_rate": 2.76254891804163e-07, "loss": 1.0729, "step": 45237 }, { "epoch": 0.85, "learning_rate": 2.761850914286926e-07, "loss": 1.1541, "step": 45238 }, { "epoch": 0.85, "learning_rate": 2.7611529935688e-07, "loss": 0.9006, "step": 45239 }, { "epoch": 0.85, "learning_rate": 2.760455155889838e-07, "loss": 0.8531, "step": 45240 }, { "epoch": 0.85, "learning_rate": 2.759757401252658e-07, "loss": 0.9839, "step": 45241 }, { "epoch": 0.85, "learning_rate": 2.7590597296598606e-07, "loss": 0.8183, "step": 45242 }, { "epoch": 0.85, "learning_rate": 2.7583621411140515e-07, "loss": 0.9729, "step": 45243 }, { "epoch": 0.85, "learning_rate": 2.7576646356178377e-07, "loss": 1.1483, "step": 45244 }, { "epoch": 0.85, "learning_rate": 2.756967213173822e-07, "loss": 0.9244, "step": 45245 }, { "epoch": 0.85, "learning_rate": 2.7562698737846143e-07, "loss": 0.8792, "step": 45246 }, { "epoch": 0.85, "learning_rate": 2.755572617452801e-07, "loss": 0.9381, "step": 45247 }, { "epoch": 0.85, "learning_rate": 2.75487544418101e-07, "loss": 1.0275, "step": 45248 }, { "epoch": 0.85, "learning_rate": 2.754178353971826e-07, "loss": 0.7942, "step": 45249 }, { "epoch": 0.85, "learning_rate": 2.7534813468278547e-07, "loss": 1.0628, "step": 45250 }, { "epoch": 0.85, "learning_rate": 2.752784422751706e-07, "loss": 0.8845, "step": 45251 }, { "epoch": 0.85, "learning_rate": 2.7520875817459767e-07, "loss": 0.844, "step": 45252 }, { "epoch": 0.85, "learning_rate": 2.7513908238132716e-07, "loss": 0.7845, "step": 45253 }, { "epoch": 0.85, "learning_rate": 2.75069414895619e-07, "loss": 0.8499, "step": 45254 }, { "epoch": 0.85, "learning_rate": 2.749997557177339e-07, "loss": 0.8759, "step": 45255 }, { "epoch": 0.85, "learning_rate": 2.7493010484793053e-07, "loss": 0.9838, "step": 45256 }, { "epoch": 0.85, "learning_rate": 2.748604622864709e-07, "loss": 0.8931, "step": 45257 }, { "epoch": 0.85, "learning_rate": 2.747908280336134e-07, "loss": 0.9295, "step": 45258 }, { "epoch": 0.85, "learning_rate": 2.747212020896184e-07, "loss": 0.9233, "step": 45259 }, { "epoch": 0.85, "learning_rate": 2.7465158445474734e-07, "loss": 0.8217, "step": 45260 }, { "epoch": 0.85, "learning_rate": 2.745819751292583e-07, "loss": 0.7816, "step": 45261 }, { "epoch": 0.85, "learning_rate": 2.74512374113412e-07, "loss": 1.0805, "step": 45262 }, { "epoch": 0.85, "learning_rate": 2.7444278140746847e-07, "loss": 0.9744, "step": 45263 }, { "epoch": 0.85, "learning_rate": 2.74373197011687e-07, "loss": 1.0189, "step": 45264 }, { "epoch": 0.85, "learning_rate": 2.7430362092632806e-07, "loss": 0.9137, "step": 45265 }, { "epoch": 0.85, "learning_rate": 2.74234053151651e-07, "loss": 0.92, "step": 45266 }, { "epoch": 0.85, "learning_rate": 2.741644936879162e-07, "loss": 0.7659, "step": 45267 }, { "epoch": 0.85, "learning_rate": 2.740949425353823e-07, "loss": 1.0406, "step": 45268 }, { "epoch": 0.85, "learning_rate": 2.740253996943101e-07, "loss": 1.0729, "step": 45269 }, { "epoch": 0.85, "learning_rate": 2.7395586516495875e-07, "loss": 0.9505, "step": 45270 }, { "epoch": 0.85, "learning_rate": 2.7388633894758765e-07, "loss": 0.8716, "step": 45271 }, { "epoch": 0.85, "learning_rate": 2.738168210424569e-07, "loss": 0.9374, "step": 45272 }, { "epoch": 0.85, "learning_rate": 2.737473114498257e-07, "loss": 0.9413, "step": 45273 }, { "epoch": 0.85, "learning_rate": 2.736778101699539e-07, "loss": 1.2177, "step": 45274 }, { "epoch": 0.85, "learning_rate": 2.7360831720310093e-07, "loss": 0.9071, "step": 45275 }, { "epoch": 0.85, "learning_rate": 2.735388325495267e-07, "loss": 1.0536, "step": 45276 }, { "epoch": 0.85, "learning_rate": 2.734693562094892e-07, "loss": 0.9536, "step": 45277 }, { "epoch": 0.85, "learning_rate": 2.7339988818324977e-07, "loss": 1.0149, "step": 45278 }, { "epoch": 0.85, "learning_rate": 2.7333042847106667e-07, "loss": 0.7583, "step": 45279 }, { "epoch": 0.85, "learning_rate": 2.732609770731987e-07, "loss": 0.8389, "step": 45280 }, { "epoch": 0.85, "learning_rate": 2.7319153398990716e-07, "loss": 1.1595, "step": 45281 }, { "epoch": 0.85, "learning_rate": 2.731220992214495e-07, "loss": 1.0103, "step": 45282 }, { "epoch": 0.85, "learning_rate": 2.7305267276808575e-07, "loss": 0.9686, "step": 45283 }, { "epoch": 0.85, "learning_rate": 2.729832546300748e-07, "loss": 0.8198, "step": 45284 }, { "epoch": 0.85, "learning_rate": 2.7291384480767624e-07, "loss": 1.0424, "step": 45285 }, { "epoch": 0.85, "learning_rate": 2.728444433011493e-07, "loss": 0.6892, "step": 45286 }, { "epoch": 0.85, "learning_rate": 2.727750501107526e-07, "loss": 1.0689, "step": 45287 }, { "epoch": 0.85, "learning_rate": 2.727056652367463e-07, "loss": 0.8926, "step": 45288 }, { "epoch": 0.85, "learning_rate": 2.726362886793876e-07, "loss": 0.9591, "step": 45289 }, { "epoch": 0.85, "learning_rate": 2.7256692043893804e-07, "loss": 0.9402, "step": 45290 }, { "epoch": 0.85, "learning_rate": 2.7249756051565436e-07, "loss": 0.8186, "step": 45291 }, { "epoch": 0.85, "learning_rate": 2.7242820890979684e-07, "loss": 0.7707, "step": 45292 }, { "epoch": 0.85, "learning_rate": 2.7235886562162387e-07, "loss": 0.9237, "step": 45293 }, { "epoch": 0.85, "learning_rate": 2.722895306513948e-07, "loss": 1.1964, "step": 45294 }, { "epoch": 0.85, "learning_rate": 2.722202039993682e-07, "loss": 0.6478, "step": 45295 }, { "epoch": 0.85, "learning_rate": 2.7215088566580283e-07, "loss": 0.9147, "step": 45296 }, { "epoch": 0.85, "learning_rate": 2.7208157565095846e-07, "loss": 1.0131, "step": 45297 }, { "epoch": 0.85, "learning_rate": 2.7201227395509233e-07, "loss": 0.8263, "step": 45298 }, { "epoch": 0.85, "learning_rate": 2.7194298057846484e-07, "loss": 0.7415, "step": 45299 }, { "epoch": 0.85, "learning_rate": 2.7187369552133355e-07, "loss": 1.1029, "step": 45300 }, { "epoch": 0.85, "learning_rate": 2.718044187839569e-07, "loss": 0.8928, "step": 45301 }, { "epoch": 0.85, "learning_rate": 2.717351503665955e-07, "loss": 0.9448, "step": 45302 }, { "epoch": 0.85, "learning_rate": 2.71665890269506e-07, "loss": 0.8152, "step": 45303 }, { "epoch": 0.85, "learning_rate": 2.7159663849294777e-07, "loss": 0.7621, "step": 45304 }, { "epoch": 0.85, "learning_rate": 2.715273950371794e-07, "loss": 1.1111, "step": 45305 }, { "epoch": 0.85, "learning_rate": 2.714581599024596e-07, "loss": 1.0332, "step": 45306 }, { "epoch": 0.85, "learning_rate": 2.713889330890465e-07, "loss": 1.0164, "step": 45307 }, { "epoch": 0.85, "learning_rate": 2.713197145971988e-07, "loss": 0.9614, "step": 45308 }, { "epoch": 0.85, "learning_rate": 2.712505044271754e-07, "loss": 0.8413, "step": 45309 }, { "epoch": 0.85, "learning_rate": 2.711813025792334e-07, "loss": 0.8236, "step": 45310 }, { "epoch": 0.85, "learning_rate": 2.711121090536331e-07, "loss": 0.7308, "step": 45311 }, { "epoch": 0.85, "learning_rate": 2.7104292385063123e-07, "loss": 1.2384, "step": 45312 }, { "epoch": 0.85, "learning_rate": 2.7097374697048676e-07, "loss": 1.0366, "step": 45313 }, { "epoch": 0.85, "learning_rate": 2.709045784134581e-07, "loss": 0.8747, "step": 45314 }, { "epoch": 0.85, "learning_rate": 2.708354181798034e-07, "loss": 0.9022, "step": 45315 }, { "epoch": 0.85, "learning_rate": 2.707662662697808e-07, "loss": 0.8926, "step": 45316 }, { "epoch": 0.85, "learning_rate": 2.7069712268364855e-07, "loss": 1.0172, "step": 45317 }, { "epoch": 0.86, "learning_rate": 2.7062798742166553e-07, "loss": 0.9243, "step": 45318 }, { "epoch": 0.86, "learning_rate": 2.7055886048408807e-07, "loss": 1.0681, "step": 45319 }, { "epoch": 0.86, "learning_rate": 2.704897418711766e-07, "loss": 0.7692, "step": 45320 }, { "epoch": 0.86, "learning_rate": 2.7042063158318755e-07, "loss": 0.9384, "step": 45321 }, { "epoch": 0.86, "learning_rate": 2.70351529620379e-07, "loss": 0.8604, "step": 45322 }, { "epoch": 0.86, "learning_rate": 2.702824359830106e-07, "loss": 0.8005, "step": 45323 }, { "epoch": 0.86, "learning_rate": 2.7021335067133863e-07, "loss": 0.8721, "step": 45324 }, { "epoch": 0.86, "learning_rate": 2.701442736856216e-07, "loss": 1.1017, "step": 45325 }, { "epoch": 0.86, "learning_rate": 2.700752050261174e-07, "loss": 0.8598, "step": 45326 }, { "epoch": 0.86, "learning_rate": 2.7000614469308435e-07, "loss": 1.091, "step": 45327 }, { "epoch": 0.86, "learning_rate": 2.6993709268677975e-07, "loss": 0.8353, "step": 45328 }, { "epoch": 0.86, "learning_rate": 2.698680490074615e-07, "loss": 0.7523, "step": 45329 }, { "epoch": 0.86, "learning_rate": 2.6979901365538826e-07, "loss": 0.8425, "step": 45330 }, { "epoch": 0.86, "learning_rate": 2.6972998663081616e-07, "loss": 1.2112, "step": 45331 }, { "epoch": 0.86, "learning_rate": 2.696609679340048e-07, "loss": 1.1354, "step": 45332 }, { "epoch": 0.86, "learning_rate": 2.695919575652106e-07, "loss": 0.8374, "step": 45333 }, { "epoch": 0.86, "learning_rate": 2.695229555246917e-07, "loss": 0.8287, "step": 45334 }, { "epoch": 0.86, "learning_rate": 2.6945396181270566e-07, "loss": 0.7081, "step": 45335 }, { "epoch": 0.86, "learning_rate": 2.6938497642951007e-07, "loss": 0.8208, "step": 45336 }, { "epoch": 0.86, "learning_rate": 2.6931599937536246e-07, "loss": 1.0136, "step": 45337 }, { "epoch": 0.86, "learning_rate": 2.692470306505207e-07, "loss": 1.0982, "step": 45338 }, { "epoch": 0.86, "learning_rate": 2.6917807025524265e-07, "loss": 0.8647, "step": 45339 }, { "epoch": 0.86, "learning_rate": 2.691091181897842e-07, "loss": 1.1426, "step": 45340 }, { "epoch": 0.86, "learning_rate": 2.6904017445440493e-07, "loss": 0.8984, "step": 45341 }, { "epoch": 0.86, "learning_rate": 2.689712390493607e-07, "loss": 0.8344, "step": 45342 }, { "epoch": 0.86, "learning_rate": 2.6890231197490903e-07, "loss": 1.078, "step": 45343 }, { "epoch": 0.86, "learning_rate": 2.6883339323130864e-07, "loss": 1.0066, "step": 45344 }, { "epoch": 0.86, "learning_rate": 2.6876448281881546e-07, "loss": 0.8043, "step": 45345 }, { "epoch": 0.86, "learning_rate": 2.686955807376873e-07, "loss": 0.8643, "step": 45346 }, { "epoch": 0.86, "learning_rate": 2.686266869881815e-07, "loss": 0.9926, "step": 45347 }, { "epoch": 0.86, "learning_rate": 2.6855780157055534e-07, "loss": 0.8846, "step": 45348 }, { "epoch": 0.86, "learning_rate": 2.684889244850658e-07, "loss": 1.0801, "step": 45349 }, { "epoch": 0.86, "learning_rate": 2.6842005573196993e-07, "loss": 0.9207, "step": 45350 }, { "epoch": 0.86, "learning_rate": 2.6835119531152616e-07, "loss": 0.864, "step": 45351 }, { "epoch": 0.86, "learning_rate": 2.6828234322398923e-07, "loss": 1.0327, "step": 45352 }, { "epoch": 0.86, "learning_rate": 2.6821349946961866e-07, "loss": 0.578, "step": 45353 }, { "epoch": 0.86, "learning_rate": 2.6814466404867014e-07, "loss": 0.9607, "step": 45354 }, { "epoch": 0.86, "learning_rate": 2.6807583696140086e-07, "loss": 1.1583, "step": 45355 }, { "epoch": 0.86, "learning_rate": 2.6800701820806794e-07, "loss": 0.899, "step": 45356 }, { "epoch": 0.86, "learning_rate": 2.6793820778892835e-07, "loss": 1.0769, "step": 45357 }, { "epoch": 0.86, "learning_rate": 2.678694057042391e-07, "loss": 0.7465, "step": 45358 }, { "epoch": 0.86, "learning_rate": 2.6780061195425726e-07, "loss": 0.7347, "step": 45359 }, { "epoch": 0.86, "learning_rate": 2.677318265392398e-07, "loss": 0.8173, "step": 45360 }, { "epoch": 0.86, "learning_rate": 2.676630494594423e-07, "loss": 0.8159, "step": 45361 }, { "epoch": 0.86, "learning_rate": 2.6759428071512354e-07, "loss": 1.0616, "step": 45362 }, { "epoch": 0.86, "learning_rate": 2.6752552030653886e-07, "loss": 0.9136, "step": 45363 }, { "epoch": 0.86, "learning_rate": 2.6745676823394464e-07, "loss": 0.9686, "step": 45364 }, { "epoch": 0.86, "learning_rate": 2.673880244975996e-07, "loss": 0.8697, "step": 45365 }, { "epoch": 0.86, "learning_rate": 2.6731928909775883e-07, "loss": 0.7577, "step": 45366 }, { "epoch": 0.86, "learning_rate": 2.672505620346791e-07, "loss": 0.6736, "step": 45367 }, { "epoch": 0.86, "learning_rate": 2.671818433086176e-07, "loss": 1.1074, "step": 45368 }, { "epoch": 0.86, "learning_rate": 2.6711313291983066e-07, "loss": 1.0761, "step": 45369 }, { "epoch": 0.86, "learning_rate": 2.670444308685746e-07, "loss": 1.0173, "step": 45370 }, { "epoch": 0.86, "learning_rate": 2.6697573715510626e-07, "loss": 0.6914, "step": 45371 }, { "epoch": 0.86, "learning_rate": 2.6690705177968234e-07, "loss": 0.8657, "step": 45372 }, { "epoch": 0.86, "learning_rate": 2.668383747425585e-07, "loss": 0.9849, "step": 45373 }, { "epoch": 0.86, "learning_rate": 2.6676970604399224e-07, "loss": 1.098, "step": 45374 }, { "epoch": 0.86, "learning_rate": 2.667010456842392e-07, "loss": 0.9406, "step": 45375 }, { "epoch": 0.86, "learning_rate": 2.666323936635559e-07, "loss": 0.8429, "step": 45376 }, { "epoch": 0.86, "learning_rate": 2.665637499821988e-07, "loss": 0.9452, "step": 45377 }, { "epoch": 0.86, "learning_rate": 2.6649511464042406e-07, "loss": 0.9869, "step": 45378 }, { "epoch": 0.86, "learning_rate": 2.664264876384881e-07, "loss": 0.8185, "step": 45379 }, { "epoch": 0.86, "learning_rate": 2.6635786897664715e-07, "loss": 0.9859, "step": 45380 }, { "epoch": 0.86, "learning_rate": 2.6628925865515795e-07, "loss": 0.9772, "step": 45381 }, { "epoch": 0.86, "learning_rate": 2.6622065667427534e-07, "loss": 0.9257, "step": 45382 }, { "epoch": 0.86, "learning_rate": 2.6615206303425703e-07, "loss": 0.9086, "step": 45383 }, { "epoch": 0.86, "learning_rate": 2.6608347773535824e-07, "loss": 0.9665, "step": 45384 }, { "epoch": 0.86, "learning_rate": 2.6601490077783456e-07, "loss": 0.8051, "step": 45385 }, { "epoch": 0.86, "learning_rate": 2.6594633216194376e-07, "loss": 0.7265, "step": 45386 }, { "epoch": 0.86, "learning_rate": 2.6587777188794047e-07, "loss": 1.4364, "step": 45387 }, { "epoch": 0.86, "learning_rate": 2.6580921995608076e-07, "loss": 0.8019, "step": 45388 }, { "epoch": 0.86, "learning_rate": 2.6574067636662123e-07, "loss": 1.0214, "step": 45389 }, { "epoch": 0.86, "learning_rate": 2.6567214111981737e-07, "loss": 1.0783, "step": 45390 }, { "epoch": 0.86, "learning_rate": 2.6560361421592546e-07, "loss": 0.7671, "step": 45391 }, { "epoch": 0.86, "learning_rate": 2.655350956552008e-07, "loss": 0.8859, "step": 45392 }, { "epoch": 0.86, "learning_rate": 2.654665854379004e-07, "loss": 1.0585, "step": 45393 }, { "epoch": 0.86, "learning_rate": 2.6539808356427807e-07, "loss": 1.022, "step": 45394 }, { "epoch": 0.86, "learning_rate": 2.6532959003459177e-07, "loss": 0.8922, "step": 45395 }, { "epoch": 0.86, "learning_rate": 2.652611048490958e-07, "loss": 0.8365, "step": 45396 }, { "epoch": 0.86, "learning_rate": 2.6519262800804635e-07, "loss": 1.0139, "step": 45397 }, { "epoch": 0.86, "learning_rate": 2.6512415951169904e-07, "loss": 0.8093, "step": 45398 }, { "epoch": 0.86, "learning_rate": 2.6505569936030985e-07, "loss": 0.7828, "step": 45399 }, { "epoch": 0.86, "learning_rate": 2.6498724755413373e-07, "loss": 0.951, "step": 45400 }, { "epoch": 0.86, "learning_rate": 2.6491880409342696e-07, "loss": 0.9079, "step": 45401 }, { "epoch": 0.86, "learning_rate": 2.648503689784454e-07, "loss": 0.8356, "step": 45402 }, { "epoch": 0.86, "learning_rate": 2.6478194220944305e-07, "loss": 1.1192, "step": 45403 }, { "epoch": 0.86, "learning_rate": 2.6471352378667715e-07, "loss": 0.8515, "step": 45404 }, { "epoch": 0.86, "learning_rate": 2.6464511371040223e-07, "loss": 0.8802, "step": 45405 }, { "epoch": 0.86, "learning_rate": 2.6457671198087314e-07, "loss": 1.0768, "step": 45406 }, { "epoch": 0.86, "learning_rate": 2.645083185983474e-07, "loss": 0.9045, "step": 45407 }, { "epoch": 0.86, "learning_rate": 2.644399335630782e-07, "loss": 0.7324, "step": 45408 }, { "epoch": 0.86, "learning_rate": 2.6437155687532243e-07, "loss": 0.9744, "step": 45409 }, { "epoch": 0.86, "learning_rate": 2.6430318853533364e-07, "loss": 0.8756, "step": 45410 }, { "epoch": 0.86, "learning_rate": 2.642348285433688e-07, "loss": 0.7943, "step": 45411 }, { "epoch": 0.86, "learning_rate": 2.641664768996829e-07, "loss": 1.2132, "step": 45412 }, { "epoch": 0.86, "learning_rate": 2.6409813360453005e-07, "loss": 0.8337, "step": 45413 }, { "epoch": 0.86, "learning_rate": 2.640297986581669e-07, "loss": 0.9957, "step": 45414 }, { "epoch": 0.86, "learning_rate": 2.639614720608477e-07, "loss": 0.7648, "step": 45415 }, { "epoch": 0.86, "learning_rate": 2.638931538128278e-07, "loss": 0.9224, "step": 45416 }, { "epoch": 0.86, "learning_rate": 2.6382484391436204e-07, "loss": 0.821, "step": 45417 }, { "epoch": 0.86, "learning_rate": 2.63756542365706e-07, "loss": 1.1455, "step": 45418 }, { "epoch": 0.86, "learning_rate": 2.636882491671144e-07, "loss": 1.1208, "step": 45419 }, { "epoch": 0.86, "learning_rate": 2.6361996431884226e-07, "loss": 0.8461, "step": 45420 }, { "epoch": 0.86, "learning_rate": 2.6355168782114527e-07, "loss": 0.778, "step": 45421 }, { "epoch": 0.86, "learning_rate": 2.6348341967427665e-07, "loss": 0.9229, "step": 45422 }, { "epoch": 0.86, "learning_rate": 2.6341515987849315e-07, "loss": 0.7394, "step": 45423 }, { "epoch": 0.86, "learning_rate": 2.633469084340487e-07, "loss": 0.8511, "step": 45424 }, { "epoch": 0.86, "learning_rate": 2.632786653411981e-07, "loss": 1.0234, "step": 45425 }, { "epoch": 0.86, "learning_rate": 2.6321043060019644e-07, "loss": 0.8966, "step": 45426 }, { "epoch": 0.86, "learning_rate": 2.6314220421129826e-07, "loss": 0.8271, "step": 45427 }, { "epoch": 0.86, "learning_rate": 2.630739861747589e-07, "loss": 0.8393, "step": 45428 }, { "epoch": 0.86, "learning_rate": 2.6300577649083225e-07, "loss": 0.8624, "step": 45429 }, { "epoch": 0.86, "learning_rate": 2.6293757515977433e-07, "loss": 0.8253, "step": 45430 }, { "epoch": 0.86, "learning_rate": 2.628693821818376e-07, "loss": 1.1841, "step": 45431 }, { "epoch": 0.86, "learning_rate": 2.6280119755727864e-07, "loss": 1.1219, "step": 45432 }, { "epoch": 0.86, "learning_rate": 2.6273302128635185e-07, "loss": 0.8036, "step": 45433 }, { "epoch": 0.86, "learning_rate": 2.6266485336931047e-07, "loss": 0.8351, "step": 45434 }, { "epoch": 0.86, "learning_rate": 2.625966938064109e-07, "loss": 0.8247, "step": 45435 }, { "epoch": 0.86, "learning_rate": 2.625285425979063e-07, "loss": 0.8126, "step": 45436 }, { "epoch": 0.86, "learning_rate": 2.624603997440514e-07, "loss": 1.17, "step": 45437 }, { "epoch": 0.86, "learning_rate": 2.623922652451008e-07, "loss": 0.951, "step": 45438 }, { "epoch": 0.86, "learning_rate": 2.623241391013087e-07, "loss": 0.8894, "step": 45439 }, { "epoch": 0.86, "learning_rate": 2.6225602131292996e-07, "loss": 0.7253, "step": 45440 }, { "epoch": 0.86, "learning_rate": 2.621879118802184e-07, "loss": 0.8707, "step": 45441 }, { "epoch": 0.86, "learning_rate": 2.62119810803429e-07, "loss": 0.8816, "step": 45442 }, { "epoch": 0.86, "learning_rate": 2.620517180828147e-07, "loss": 0.9969, "step": 45443 }, { "epoch": 0.86, "learning_rate": 2.619836337186318e-07, "loss": 1.0647, "step": 45444 }, { "epoch": 0.86, "learning_rate": 2.6191555771113263e-07, "loss": 0.8837, "step": 45445 }, { "epoch": 0.86, "learning_rate": 2.6184749006057247e-07, "loss": 0.7475, "step": 45446 }, { "epoch": 0.86, "learning_rate": 2.61779430767205e-07, "loss": 0.9348, "step": 45447 }, { "epoch": 0.86, "learning_rate": 2.6171137983128455e-07, "loss": 1.0038, "step": 45448 }, { "epoch": 0.86, "learning_rate": 2.6164333725306495e-07, "loss": 0.9704, "step": 45449 }, { "epoch": 0.86, "learning_rate": 2.615753030328008e-07, "loss": 1.1248, "step": 45450 }, { "epoch": 0.86, "learning_rate": 2.615072771707461e-07, "loss": 0.9828, "step": 45451 }, { "epoch": 0.86, "learning_rate": 2.614392596671539e-07, "loss": 0.8007, "step": 45452 }, { "epoch": 0.86, "learning_rate": 2.6137125052227903e-07, "loss": 0.8217, "step": 45453 }, { "epoch": 0.86, "learning_rate": 2.61303249736376e-07, "loss": 0.7838, "step": 45454 }, { "epoch": 0.86, "learning_rate": 2.612352573096968e-07, "loss": 0.8268, "step": 45455 }, { "epoch": 0.86, "learning_rate": 2.6116727324249776e-07, "loss": 0.9731, "step": 45456 }, { "epoch": 0.86, "learning_rate": 2.610992975350307e-07, "loss": 0.8627, "step": 45457 }, { "epoch": 0.86, "learning_rate": 2.610313301875506e-07, "loss": 0.9008, "step": 45458 }, { "epoch": 0.86, "learning_rate": 2.609633712003104e-07, "loss": 0.6711, "step": 45459 }, { "epoch": 0.86, "learning_rate": 2.608954205735648e-07, "loss": 0.8252, "step": 45460 }, { "epoch": 0.86, "learning_rate": 2.6082747830756677e-07, "loss": 0.849, "step": 45461 }, { "epoch": 0.86, "learning_rate": 2.6075954440257014e-07, "loss": 1.1173, "step": 45462 }, { "epoch": 0.86, "learning_rate": 2.6069161885882934e-07, "loss": 0.8355, "step": 45463 }, { "epoch": 0.86, "learning_rate": 2.606237016765964e-07, "loss": 0.8655, "step": 45464 }, { "epoch": 0.86, "learning_rate": 2.60555792856127e-07, "loss": 0.9096, "step": 45465 }, { "epoch": 0.86, "learning_rate": 2.604878923976731e-07, "loss": 0.6844, "step": 45466 }, { "epoch": 0.86, "learning_rate": 2.6042000030148867e-07, "loss": 0.7807, "step": 45467 }, { "epoch": 0.86, "learning_rate": 2.6035211656782714e-07, "loss": 0.8679, "step": 45468 }, { "epoch": 0.86, "learning_rate": 2.6028424119694223e-07, "loss": 1.0507, "step": 45469 }, { "epoch": 0.86, "learning_rate": 2.6021637418908757e-07, "loss": 0.8941, "step": 45470 }, { "epoch": 0.86, "learning_rate": 2.6014851554451605e-07, "loss": 0.8037, "step": 45471 }, { "epoch": 0.86, "learning_rate": 2.6008066526348184e-07, "loss": 0.7658, "step": 45472 }, { "epoch": 0.86, "learning_rate": 2.6001282334623677e-07, "loss": 0.8531, "step": 45473 }, { "epoch": 0.86, "learning_rate": 2.5994498979303563e-07, "loss": 1.0181, "step": 45474 }, { "epoch": 0.86, "learning_rate": 2.598771646041315e-07, "loss": 0.8853, "step": 45475 }, { "epoch": 0.86, "learning_rate": 2.598093477797767e-07, "loss": 1.0359, "step": 45476 }, { "epoch": 0.86, "learning_rate": 2.597415393202257e-07, "loss": 0.9496, "step": 45477 }, { "epoch": 0.86, "learning_rate": 2.596737392257309e-07, "loss": 0.9103, "step": 45478 }, { "epoch": 0.86, "learning_rate": 2.5960594749654564e-07, "loss": 0.807, "step": 45479 }, { "epoch": 0.86, "learning_rate": 2.595381641329231e-07, "loss": 0.7961, "step": 45480 }, { "epoch": 0.86, "learning_rate": 2.5947038913511633e-07, "loss": 0.9528, "step": 45481 }, { "epoch": 0.86, "learning_rate": 2.5940262250337854e-07, "loss": 0.987, "step": 45482 }, { "epoch": 0.86, "learning_rate": 2.5933486423796257e-07, "loss": 0.9932, "step": 45483 }, { "epoch": 0.86, "learning_rate": 2.592671143391218e-07, "loss": 0.9505, "step": 45484 }, { "epoch": 0.86, "learning_rate": 2.591993728071082e-07, "loss": 0.9026, "step": 45485 }, { "epoch": 0.86, "learning_rate": 2.591316396421764e-07, "loss": 0.9623, "step": 45486 }, { "epoch": 0.86, "learning_rate": 2.590639148445778e-07, "loss": 1.1796, "step": 45487 }, { "epoch": 0.86, "learning_rate": 2.589961984145659e-07, "loss": 0.9054, "step": 45488 }, { "epoch": 0.86, "learning_rate": 2.5892849035239337e-07, "loss": 0.7348, "step": 45489 }, { "epoch": 0.86, "learning_rate": 2.5886079065831293e-07, "loss": 0.9741, "step": 45490 }, { "epoch": 0.86, "learning_rate": 2.58793099332578e-07, "loss": 0.7377, "step": 45491 }, { "epoch": 0.86, "learning_rate": 2.587254163754407e-07, "loss": 0.8031, "step": 45492 }, { "epoch": 0.86, "learning_rate": 2.586577417871547e-07, "loss": 1.0982, "step": 45493 }, { "epoch": 0.86, "learning_rate": 2.5859007556797074e-07, "loss": 1.12, "step": 45494 }, { "epoch": 0.86, "learning_rate": 2.585224177181433e-07, "loss": 0.8773, "step": 45495 }, { "epoch": 0.86, "learning_rate": 2.5845476823792486e-07, "loss": 0.9375, "step": 45496 }, { "epoch": 0.86, "learning_rate": 2.5838712712756674e-07, "loss": 0.996, "step": 45497 }, { "epoch": 0.86, "learning_rate": 2.5831949438732325e-07, "loss": 0.9649, "step": 45498 }, { "epoch": 0.86, "learning_rate": 2.582518700174455e-07, "loss": 0.9767, "step": 45499 }, { "epoch": 0.86, "learning_rate": 2.581842540181864e-07, "loss": 1.0081, "step": 45500 }, { "epoch": 0.86, "learning_rate": 2.5811664638979884e-07, "loss": 0.8896, "step": 45501 }, { "epoch": 0.86, "learning_rate": 2.5804904713253503e-07, "loss": 0.8362, "step": 45502 }, { "epoch": 0.86, "learning_rate": 2.5798145624664707e-07, "loss": 0.6548, "step": 45503 }, { "epoch": 0.86, "learning_rate": 2.5791387373238776e-07, "loss": 0.8666, "step": 45504 }, { "epoch": 0.86, "learning_rate": 2.5784629959000966e-07, "loss": 1.1141, "step": 45505 }, { "epoch": 0.86, "learning_rate": 2.57778733819764e-07, "loss": 1.174, "step": 45506 }, { "epoch": 0.86, "learning_rate": 2.5771117642190454e-07, "loss": 1.0252, "step": 45507 }, { "epoch": 0.86, "learning_rate": 2.5764362739668257e-07, "loss": 0.8722, "step": 45508 }, { "epoch": 0.86, "learning_rate": 2.5757608674435026e-07, "loss": 1.0383, "step": 45509 }, { "epoch": 0.86, "learning_rate": 2.575085544651601e-07, "loss": 0.7094, "step": 45510 }, { "epoch": 0.86, "learning_rate": 2.5744103055936445e-07, "loss": 0.832, "step": 45511 }, { "epoch": 0.86, "learning_rate": 2.5737351502721525e-07, "loss": 1.0862, "step": 45512 }, { "epoch": 0.86, "learning_rate": 2.573060078689643e-07, "loss": 0.9199, "step": 45513 }, { "epoch": 0.86, "learning_rate": 2.5723850908486474e-07, "loss": 0.8177, "step": 45514 }, { "epoch": 0.86, "learning_rate": 2.5717101867516663e-07, "loss": 0.8501, "step": 45515 }, { "epoch": 0.86, "learning_rate": 2.5710353664012366e-07, "loss": 0.8766, "step": 45516 }, { "epoch": 0.86, "learning_rate": 2.5703606297998783e-07, "loss": 0.7761, "step": 45517 }, { "epoch": 0.86, "learning_rate": 2.569685976950098e-07, "loss": 0.9911, "step": 45518 }, { "epoch": 0.86, "learning_rate": 2.56901140785443e-07, "loss": 0.9836, "step": 45519 }, { "epoch": 0.86, "learning_rate": 2.5683369225153824e-07, "loss": 0.9293, "step": 45520 }, { "epoch": 0.86, "learning_rate": 2.5676625209354764e-07, "loss": 0.8444, "step": 45521 }, { "epoch": 0.86, "learning_rate": 2.566988203117229e-07, "loss": 0.8727, "step": 45522 }, { "epoch": 0.86, "learning_rate": 2.566313969063161e-07, "loss": 0.7887, "step": 45523 }, { "epoch": 0.86, "learning_rate": 2.565639818775792e-07, "loss": 0.9723, "step": 45524 }, { "epoch": 0.86, "learning_rate": 2.564965752257631e-07, "loss": 1.1277, "step": 45525 }, { "epoch": 0.86, "learning_rate": 2.564291769511207e-07, "loss": 1.0369, "step": 45526 }, { "epoch": 0.86, "learning_rate": 2.56361787053902e-07, "loss": 0.7801, "step": 45527 }, { "epoch": 0.86, "learning_rate": 2.5629440553436055e-07, "loss": 0.8056, "step": 45528 }, { "epoch": 0.86, "learning_rate": 2.5622703239274656e-07, "loss": 0.8384, "step": 45529 }, { "epoch": 0.86, "learning_rate": 2.561596676293121e-07, "loss": 1.0452, "step": 45530 }, { "epoch": 0.86, "learning_rate": 2.5609231124430837e-07, "loss": 1.0142, "step": 45531 }, { "epoch": 0.86, "learning_rate": 2.5602496323798745e-07, "loss": 0.7699, "step": 45532 }, { "epoch": 0.86, "learning_rate": 2.559576236106004e-07, "loss": 0.9926, "step": 45533 }, { "epoch": 0.86, "learning_rate": 2.5589029236239876e-07, "loss": 0.896, "step": 45534 }, { "epoch": 0.86, "learning_rate": 2.5582296949363454e-07, "loss": 0.9756, "step": 45535 }, { "epoch": 0.86, "learning_rate": 2.5575565500455727e-07, "loss": 0.7872, "step": 45536 }, { "epoch": 0.86, "learning_rate": 2.5568834889542036e-07, "loss": 0.9077, "step": 45537 }, { "epoch": 0.86, "learning_rate": 2.5562105116647475e-07, "loss": 0.866, "step": 45538 }, { "epoch": 0.86, "learning_rate": 2.555537618179704e-07, "loss": 0.6959, "step": 45539 }, { "epoch": 0.86, "learning_rate": 2.554864808501603e-07, "loss": 0.8986, "step": 45540 }, { "epoch": 0.86, "learning_rate": 2.5541920826329445e-07, "loss": 0.9622, "step": 45541 }, { "epoch": 0.86, "learning_rate": 2.5535194405762464e-07, "loss": 0.8276, "step": 45542 }, { "epoch": 0.86, "learning_rate": 2.5528468823340173e-07, "loss": 0.8907, "step": 45543 }, { "epoch": 0.86, "learning_rate": 2.5521744079087695e-07, "loss": 0.9179, "step": 45544 }, { "epoch": 0.86, "learning_rate": 2.551502017303015e-07, "loss": 0.8208, "step": 45545 }, { "epoch": 0.86, "learning_rate": 2.550829710519262e-07, "loss": 0.8428, "step": 45546 }, { "epoch": 0.86, "learning_rate": 2.550157487560029e-07, "loss": 1.045, "step": 45547 }, { "epoch": 0.86, "learning_rate": 2.5494853484278075e-07, "loss": 0.8627, "step": 45548 }, { "epoch": 0.86, "learning_rate": 2.54881329312513e-07, "loss": 0.874, "step": 45549 }, { "epoch": 0.86, "learning_rate": 2.548141321654493e-07, "loss": 0.9119, "step": 45550 }, { "epoch": 0.86, "learning_rate": 2.5474694340184043e-07, "loss": 0.9987, "step": 45551 }, { "epoch": 0.86, "learning_rate": 2.5467976302193777e-07, "loss": 1.0305, "step": 45552 }, { "epoch": 0.86, "learning_rate": 2.546125910259922e-07, "loss": 0.9701, "step": 45553 }, { "epoch": 0.86, "learning_rate": 2.545454274142542e-07, "loss": 0.8628, "step": 45554 }, { "epoch": 0.86, "learning_rate": 2.5447827218697486e-07, "loss": 0.8792, "step": 45555 }, { "epoch": 0.86, "learning_rate": 2.544111253444051e-07, "loss": 1.03, "step": 45556 }, { "epoch": 0.86, "learning_rate": 2.5434398688679447e-07, "loss": 0.9609, "step": 45557 }, { "epoch": 0.86, "learning_rate": 2.5427685681439497e-07, "loss": 0.7278, "step": 45558 }, { "epoch": 0.86, "learning_rate": 2.542097351274575e-07, "loss": 0.957, "step": 45559 }, { "epoch": 0.86, "learning_rate": 2.541426218262308e-07, "loss": 0.9392, "step": 45560 }, { "epoch": 0.86, "learning_rate": 2.540755169109677e-07, "loss": 0.8206, "step": 45561 }, { "epoch": 0.86, "learning_rate": 2.540084203819174e-07, "loss": 0.9174, "step": 45562 }, { "epoch": 0.86, "learning_rate": 2.539413322393308e-07, "loss": 0.94, "step": 45563 }, { "epoch": 0.86, "learning_rate": 2.5387425248345835e-07, "loss": 0.859, "step": 45564 }, { "epoch": 0.86, "learning_rate": 2.538071811145507e-07, "loss": 1.0431, "step": 45565 }, { "epoch": 0.86, "learning_rate": 2.5374011813285775e-07, "loss": 0.8188, "step": 45566 }, { "epoch": 0.86, "learning_rate": 2.5367306353863086e-07, "loss": 0.823, "step": 45567 }, { "epoch": 0.86, "learning_rate": 2.5360601733212004e-07, "loss": 0.9054, "step": 45568 }, { "epoch": 0.86, "learning_rate": 2.5353897951357453e-07, "loss": 0.9025, "step": 45569 }, { "epoch": 0.86, "learning_rate": 2.5347195008324665e-07, "loss": 0.9355, "step": 45570 }, { "epoch": 0.86, "learning_rate": 2.534049290413851e-07, "loss": 0.8788, "step": 45571 }, { "epoch": 0.86, "learning_rate": 2.5333791638824076e-07, "loss": 0.7988, "step": 45572 }, { "epoch": 0.86, "learning_rate": 2.5327091212406366e-07, "loss": 0.879, "step": 45573 }, { "epoch": 0.86, "learning_rate": 2.53203916249104e-07, "loss": 1.158, "step": 45574 }, { "epoch": 0.86, "learning_rate": 2.531369287636121e-07, "loss": 1.1385, "step": 45575 }, { "epoch": 0.86, "learning_rate": 2.5306994966783794e-07, "loss": 0.753, "step": 45576 }, { "epoch": 0.86, "learning_rate": 2.530029789620325e-07, "loss": 0.8209, "step": 45577 }, { "epoch": 0.86, "learning_rate": 2.529360166464437e-07, "loss": 0.8345, "step": 45578 }, { "epoch": 0.86, "learning_rate": 2.5286906272132373e-07, "loss": 0.7642, "step": 45579 }, { "epoch": 0.86, "learning_rate": 2.528021171869219e-07, "loss": 0.8758, "step": 45580 }, { "epoch": 0.86, "learning_rate": 2.527351800434874e-07, "loss": 1.0271, "step": 45581 }, { "epoch": 0.86, "learning_rate": 2.5266825129127177e-07, "loss": 0.8845, "step": 45582 }, { "epoch": 0.86, "learning_rate": 2.526013309305234e-07, "loss": 0.8502, "step": 45583 }, { "epoch": 0.86, "learning_rate": 2.5253441896149255e-07, "loss": 0.9791, "step": 45584 }, { "epoch": 0.86, "learning_rate": 2.524675153844297e-07, "loss": 0.8627, "step": 45585 }, { "epoch": 0.86, "learning_rate": 2.524006201995841e-07, "loss": 0.7137, "step": 45586 }, { "epoch": 0.86, "learning_rate": 2.523337334072054e-07, "loss": 1.0983, "step": 45587 }, { "epoch": 0.86, "learning_rate": 2.5226685500754383e-07, "loss": 0.9619, "step": 45588 }, { "epoch": 0.86, "learning_rate": 2.521999850008494e-07, "loss": 0.6909, "step": 45589 }, { "epoch": 0.86, "learning_rate": 2.5213312338737026e-07, "loss": 0.7419, "step": 45590 }, { "epoch": 0.86, "learning_rate": 2.520662701673582e-07, "loss": 0.8735, "step": 45591 }, { "epoch": 0.86, "learning_rate": 2.5199942534106127e-07, "loss": 0.7422, "step": 45592 }, { "epoch": 0.86, "learning_rate": 2.519325889087296e-07, "loss": 0.8891, "step": 45593 }, { "epoch": 0.86, "learning_rate": 2.5186576087061267e-07, "loss": 1.2023, "step": 45594 }, { "epoch": 0.86, "learning_rate": 2.5179894122696003e-07, "loss": 1.0359, "step": 45595 }, { "epoch": 0.86, "learning_rate": 2.517321299780209e-07, "loss": 0.7354, "step": 45596 }, { "epoch": 0.86, "learning_rate": 2.5166532712404545e-07, "loss": 0.9601, "step": 45597 }, { "epoch": 0.86, "learning_rate": 2.515985326652831e-07, "loss": 0.8635, "step": 45598 }, { "epoch": 0.86, "learning_rate": 2.5153174660198204e-07, "loss": 1.0147, "step": 45599 }, { "epoch": 0.86, "learning_rate": 2.514649689343929e-07, "loss": 1.0333, "step": 45600 }, { "epoch": 0.86, "learning_rate": 2.5139819966276513e-07, "loss": 0.9774, "step": 45601 }, { "epoch": 0.86, "learning_rate": 2.5133143878734665e-07, "loss": 0.7923, "step": 45602 }, { "epoch": 0.86, "learning_rate": 2.512646863083884e-07, "loss": 0.7555, "step": 45603 }, { "epoch": 0.86, "learning_rate": 2.5119794222613845e-07, "loss": 0.701, "step": 45604 }, { "epoch": 0.86, "learning_rate": 2.5113120654084666e-07, "loss": 0.9591, "step": 45605 }, { "epoch": 0.86, "learning_rate": 2.510644792527617e-07, "loss": 1.0604, "step": 45606 }, { "epoch": 0.86, "learning_rate": 2.5099776036213304e-07, "loss": 0.6724, "step": 45607 }, { "epoch": 0.86, "learning_rate": 2.5093104986920994e-07, "loss": 0.8647, "step": 45608 }, { "epoch": 0.86, "learning_rate": 2.5086434777424116e-07, "loss": 0.8284, "step": 45609 }, { "epoch": 0.86, "learning_rate": 2.5079765407747674e-07, "loss": 0.8122, "step": 45610 }, { "epoch": 0.86, "learning_rate": 2.507309687791637e-07, "loss": 1.0411, "step": 45611 }, { "epoch": 0.86, "learning_rate": 2.506642918795532e-07, "loss": 1.0872, "step": 45612 }, { "epoch": 0.86, "learning_rate": 2.5059762337889286e-07, "loss": 0.9897, "step": 45613 }, { "epoch": 0.86, "learning_rate": 2.5053096327743194e-07, "loss": 0.8041, "step": 45614 }, { "epoch": 0.86, "learning_rate": 2.504643115754196e-07, "loss": 0.9678, "step": 45615 }, { "epoch": 0.86, "learning_rate": 2.5039766827310463e-07, "loss": 0.8406, "step": 45616 }, { "epoch": 0.86, "learning_rate": 2.503310333707354e-07, "loss": 0.8337, "step": 45617 }, { "epoch": 0.86, "learning_rate": 2.502644068685614e-07, "loss": 1.119, "step": 45618 }, { "epoch": 0.86, "learning_rate": 2.5019778876683166e-07, "loss": 0.7676, "step": 45619 }, { "epoch": 0.86, "learning_rate": 2.5013117906579314e-07, "loss": 0.8996, "step": 45620 }, { "epoch": 0.86, "learning_rate": 2.5006457776569654e-07, "loss": 0.9878, "step": 45621 }, { "epoch": 0.86, "learning_rate": 2.4999798486679024e-07, "loss": 1.0338, "step": 45622 }, { "epoch": 0.86, "learning_rate": 2.499314003693215e-07, "loss": 0.7796, "step": 45623 }, { "epoch": 0.86, "learning_rate": 2.4986482427354105e-07, "loss": 0.9482, "step": 45624 }, { "epoch": 0.86, "learning_rate": 2.4979825657969553e-07, "loss": 0.973, "step": 45625 }, { "epoch": 0.86, "learning_rate": 2.497316972880345e-07, "loss": 1.0622, "step": 45626 }, { "epoch": 0.86, "learning_rate": 2.4966514639880646e-07, "loss": 0.7263, "step": 45627 }, { "epoch": 0.86, "learning_rate": 2.495986039122597e-07, "loss": 0.8472, "step": 45628 }, { "epoch": 0.86, "learning_rate": 2.495320698286427e-07, "loss": 0.7542, "step": 45629 }, { "epoch": 0.86, "learning_rate": 2.494655441482038e-07, "loss": 0.8864, "step": 45630 }, { "epoch": 0.86, "learning_rate": 2.493990268711924e-07, "loss": 1.1603, "step": 45631 }, { "epoch": 0.86, "learning_rate": 2.493325179978548e-07, "loss": 0.7847, "step": 45632 }, { "epoch": 0.86, "learning_rate": 2.492660175284417e-07, "loss": 0.8986, "step": 45633 }, { "epoch": 0.86, "learning_rate": 2.491995254631996e-07, "loss": 1.162, "step": 45634 }, { "epoch": 0.86, "learning_rate": 2.491330418023774e-07, "loss": 0.9368, "step": 45635 }, { "epoch": 0.86, "learning_rate": 2.4906656654622357e-07, "loss": 0.9855, "step": 45636 }, { "epoch": 0.86, "learning_rate": 2.4900009969498625e-07, "loss": 0.9807, "step": 45637 }, { "epoch": 0.86, "learning_rate": 2.489336412489135e-07, "loss": 0.8482, "step": 45638 }, { "epoch": 0.86, "learning_rate": 2.4886719120825354e-07, "loss": 0.9481, "step": 45639 }, { "epoch": 0.86, "learning_rate": 2.488007495732547e-07, "loss": 0.6904, "step": 45640 }, { "epoch": 0.86, "learning_rate": 2.487343163441641e-07, "loss": 0.7903, "step": 45641 }, { "epoch": 0.86, "learning_rate": 2.486678915212309e-07, "loss": 0.7899, "step": 45642 }, { "epoch": 0.86, "learning_rate": 2.486014751047033e-07, "loss": 0.9633, "step": 45643 }, { "epoch": 0.86, "learning_rate": 2.4853506709482833e-07, "loss": 0.8851, "step": 45644 }, { "epoch": 0.86, "learning_rate": 2.4846866749185433e-07, "loss": 1.0475, "step": 45645 }, { "epoch": 0.86, "learning_rate": 2.4840227629602946e-07, "loss": 0.8271, "step": 45646 }, { "epoch": 0.86, "learning_rate": 2.483358935076013e-07, "loss": 0.861, "step": 45647 }, { "epoch": 0.86, "learning_rate": 2.482695191268178e-07, "loss": 0.8567, "step": 45648 }, { "epoch": 0.86, "learning_rate": 2.4820315315392697e-07, "loss": 0.7797, "step": 45649 }, { "epoch": 0.86, "learning_rate": 2.4813679558917697e-07, "loss": 1.2795, "step": 45650 }, { "epoch": 0.86, "learning_rate": 2.480704464328143e-07, "loss": 0.7539, "step": 45651 }, { "epoch": 0.86, "learning_rate": 2.480041056850882e-07, "loss": 0.8032, "step": 45652 }, { "epoch": 0.86, "learning_rate": 2.479377733462457e-07, "loss": 0.8651, "step": 45653 }, { "epoch": 0.86, "learning_rate": 2.478714494165341e-07, "loss": 0.8741, "step": 45654 }, { "epoch": 0.86, "learning_rate": 2.478051338962015e-07, "loss": 0.7908, "step": 45655 }, { "epoch": 0.86, "learning_rate": 2.477388267854958e-07, "loss": 1.0432, "step": 45656 }, { "epoch": 0.86, "learning_rate": 2.4767252808466397e-07, "loss": 0.9852, "step": 45657 }, { "epoch": 0.86, "learning_rate": 2.4760623779395393e-07, "loss": 0.9097, "step": 45658 }, { "epoch": 0.86, "learning_rate": 2.475399559136135e-07, "loss": 0.8579, "step": 45659 }, { "epoch": 0.86, "learning_rate": 2.4747368244388893e-07, "loss": 0.9919, "step": 45660 }, { "epoch": 0.86, "learning_rate": 2.474074173850291e-07, "loss": 0.8588, "step": 45661 }, { "epoch": 0.86, "learning_rate": 2.4734116073728137e-07, "loss": 1.0049, "step": 45662 }, { "epoch": 0.86, "learning_rate": 2.472749125008919e-07, "loss": 1.0396, "step": 45663 }, { "epoch": 0.86, "learning_rate": 2.4720867267610943e-07, "loss": 1.0504, "step": 45664 }, { "epoch": 0.86, "learning_rate": 2.471424412631804e-07, "loss": 0.9648, "step": 45665 }, { "epoch": 0.86, "learning_rate": 2.4707621826235263e-07, "loss": 0.8752, "step": 45666 }, { "epoch": 0.86, "learning_rate": 2.470100036738729e-07, "loss": 0.7915, "step": 45667 }, { "epoch": 0.86, "learning_rate": 2.469437974979888e-07, "loss": 0.965, "step": 45668 }, { "epoch": 0.86, "learning_rate": 2.4687759973494764e-07, "loss": 1.0157, "step": 45669 }, { "epoch": 0.86, "learning_rate": 2.468114103849961e-07, "loss": 1.0408, "step": 45670 }, { "epoch": 0.86, "learning_rate": 2.467452294483824e-07, "loss": 0.7561, "step": 45671 }, { "epoch": 0.86, "learning_rate": 2.466790569253519e-07, "loss": 0.9735, "step": 45672 }, { "epoch": 0.86, "learning_rate": 2.4661289281615374e-07, "loss": 0.6609, "step": 45673 }, { "epoch": 0.86, "learning_rate": 2.465467371210334e-07, "loss": 0.8227, "step": 45674 }, { "epoch": 0.86, "learning_rate": 2.4648058984023867e-07, "loss": 1.0122, "step": 45675 }, { "epoch": 0.86, "learning_rate": 2.46414450974016e-07, "loss": 0.8056, "step": 45676 }, { "epoch": 0.86, "learning_rate": 2.4634832052261274e-07, "loss": 1.0758, "step": 45677 }, { "epoch": 0.86, "learning_rate": 2.4628219848627594e-07, "loss": 0.8119, "step": 45678 }, { "epoch": 0.86, "learning_rate": 2.46216084865252e-07, "loss": 0.8801, "step": 45679 }, { "epoch": 0.86, "learning_rate": 2.4614997965978884e-07, "loss": 1.1497, "step": 45680 }, { "epoch": 0.86, "learning_rate": 2.4608388287013147e-07, "loss": 1.1198, "step": 45681 }, { "epoch": 0.86, "learning_rate": 2.4601779449652835e-07, "loss": 0.9464, "step": 45682 }, { "epoch": 0.86, "learning_rate": 2.4595171453922623e-07, "loss": 0.9163, "step": 45683 }, { "epoch": 0.86, "learning_rate": 2.4588564299847016e-07, "loss": 0.7766, "step": 45684 }, { "epoch": 0.86, "learning_rate": 2.4581957987450886e-07, "loss": 0.7469, "step": 45685 }, { "epoch": 0.86, "learning_rate": 2.457535251675877e-07, "loss": 0.9078, "step": 45686 }, { "epoch": 0.86, "learning_rate": 2.4568747887795397e-07, "loss": 0.9139, "step": 45687 }, { "epoch": 0.86, "learning_rate": 2.456214410058541e-07, "loss": 0.8607, "step": 45688 }, { "epoch": 0.86, "learning_rate": 2.4555541155153435e-07, "loss": 0.8739, "step": 45689 }, { "epoch": 0.86, "learning_rate": 2.454893905152417e-07, "loss": 0.83, "step": 45690 }, { "epoch": 0.86, "learning_rate": 2.454233778972226e-07, "loss": 0.8844, "step": 45691 }, { "epoch": 0.86, "learning_rate": 2.453573736977238e-07, "loss": 0.7508, "step": 45692 }, { "epoch": 0.86, "learning_rate": 2.4529137791699074e-07, "loss": 0.9344, "step": 45693 }, { "epoch": 0.86, "learning_rate": 2.452253905552715e-07, "loss": 0.9278, "step": 45694 }, { "epoch": 0.86, "learning_rate": 2.4515941161281085e-07, "loss": 0.8345, "step": 45695 }, { "epoch": 0.86, "learning_rate": 2.4509344108985587e-07, "loss": 0.7767, "step": 45696 }, { "epoch": 0.86, "learning_rate": 2.4502747898665275e-07, "loss": 0.8362, "step": 45697 }, { "epoch": 0.86, "learning_rate": 2.449615253034482e-07, "loss": 0.6442, "step": 45698 }, { "epoch": 0.86, "learning_rate": 2.4489558004048784e-07, "loss": 1.0745, "step": 45699 }, { "epoch": 0.86, "learning_rate": 2.4482964319801823e-07, "loss": 1.0778, "step": 45700 }, { "epoch": 0.86, "learning_rate": 2.447637147762863e-07, "loss": 0.8745, "step": 45701 }, { "epoch": 0.86, "learning_rate": 2.4469779477553633e-07, "loss": 1.0199, "step": 45702 }, { "epoch": 0.86, "learning_rate": 2.446318831960165e-07, "loss": 0.8873, "step": 45703 }, { "epoch": 0.86, "learning_rate": 2.445659800379721e-07, "loss": 0.9034, "step": 45704 }, { "epoch": 0.86, "learning_rate": 2.4450008530164854e-07, "loss": 0.5624, "step": 45705 }, { "epoch": 0.86, "learning_rate": 2.4443419898729335e-07, "loss": 0.8727, "step": 45706 }, { "epoch": 0.86, "learning_rate": 2.4436832109515114e-07, "loss": 0.7547, "step": 45707 }, { "epoch": 0.86, "learning_rate": 2.4430245162546854e-07, "loss": 0.7329, "step": 45708 }, { "epoch": 0.86, "learning_rate": 2.442365905784913e-07, "loss": 0.8164, "step": 45709 }, { "epoch": 0.86, "learning_rate": 2.441707379544658e-07, "loss": 0.822, "step": 45710 }, { "epoch": 0.86, "learning_rate": 2.441048937536372e-07, "loss": 0.899, "step": 45711 }, { "epoch": 0.86, "learning_rate": 2.4403905797625193e-07, "loss": 0.9393, "step": 45712 }, { "epoch": 0.86, "learning_rate": 2.439732306225562e-07, "loss": 0.8404, "step": 45713 }, { "epoch": 0.86, "learning_rate": 2.439074116927942e-07, "loss": 0.7881, "step": 45714 }, { "epoch": 0.86, "learning_rate": 2.4384160118721385e-07, "loss": 0.8218, "step": 45715 }, { "epoch": 0.86, "learning_rate": 2.437757991060591e-07, "loss": 0.8374, "step": 45716 }, { "epoch": 0.86, "learning_rate": 2.437100054495764e-07, "loss": 0.9249, "step": 45717 }, { "epoch": 0.86, "learning_rate": 2.4364422021801144e-07, "loss": 1.0269, "step": 45718 }, { "epoch": 0.86, "learning_rate": 2.435784434116098e-07, "loss": 1.1546, "step": 45719 }, { "epoch": 0.86, "learning_rate": 2.435126750306172e-07, "loss": 0.9821, "step": 45720 }, { "epoch": 0.86, "learning_rate": 2.4344691507527884e-07, "loss": 0.7315, "step": 45721 }, { "epoch": 0.86, "learning_rate": 2.433811635458411e-07, "loss": 0.9622, "step": 45722 }, { "epoch": 0.86, "learning_rate": 2.433154204425478e-07, "loss": 0.6698, "step": 45723 }, { "epoch": 0.86, "learning_rate": 2.432496857656461e-07, "loss": 0.907, "step": 45724 }, { "epoch": 0.86, "learning_rate": 2.431839595153812e-07, "loss": 0.9729, "step": 45725 }, { "epoch": 0.86, "learning_rate": 2.431182416919975e-07, "loss": 1.1414, "step": 45726 }, { "epoch": 0.86, "learning_rate": 2.4305253229574195e-07, "loss": 0.8265, "step": 45727 }, { "epoch": 0.86, "learning_rate": 2.429868313268585e-07, "loss": 0.8417, "step": 45728 }, { "epoch": 0.86, "learning_rate": 2.4292113878559315e-07, "loss": 1.0085, "step": 45729 }, { "epoch": 0.86, "learning_rate": 2.428554546721909e-07, "loss": 0.7372, "step": 45730 }, { "epoch": 0.86, "learning_rate": 2.427897789868974e-07, "loss": 0.9904, "step": 45731 }, { "epoch": 0.86, "learning_rate": 2.427241117299575e-07, "loss": 0.9389, "step": 45732 }, { "epoch": 0.86, "learning_rate": 2.4265845290161657e-07, "loss": 0.876, "step": 45733 }, { "epoch": 0.86, "learning_rate": 2.425928025021204e-07, "loss": 0.8731, "step": 45734 }, { "epoch": 0.86, "learning_rate": 2.425271605317123e-07, "loss": 0.7855, "step": 45735 }, { "epoch": 0.86, "learning_rate": 2.424615269906397e-07, "loss": 0.9689, "step": 45736 }, { "epoch": 0.86, "learning_rate": 2.423959018791458e-07, "loss": 1.1746, "step": 45737 }, { "epoch": 0.86, "learning_rate": 2.423302851974768e-07, "loss": 0.9865, "step": 45738 }, { "epoch": 0.86, "learning_rate": 2.4226467694587695e-07, "loss": 0.6959, "step": 45739 }, { "epoch": 0.86, "learning_rate": 2.4219907712459164e-07, "loss": 0.9574, "step": 45740 }, { "epoch": 0.86, "learning_rate": 2.4213348573386585e-07, "loss": 1.0526, "step": 45741 }, { "epoch": 0.86, "learning_rate": 2.4206790277394423e-07, "loss": 0.9541, "step": 45742 }, { "epoch": 0.86, "learning_rate": 2.4200232824507257e-07, "loss": 0.9938, "step": 45743 }, { "epoch": 0.86, "learning_rate": 2.4193676214749386e-07, "loss": 1.0496, "step": 45744 }, { "epoch": 0.86, "learning_rate": 2.4187120448145444e-07, "loss": 0.7058, "step": 45745 }, { "epoch": 0.86, "learning_rate": 2.418056552471995e-07, "loss": 0.8331, "step": 45746 }, { "epoch": 0.86, "learning_rate": 2.4174011444497185e-07, "loss": 0.9108, "step": 45747 }, { "epoch": 0.86, "learning_rate": 2.416745820750183e-07, "loss": 0.7201, "step": 45748 }, { "epoch": 0.86, "learning_rate": 2.416090581375821e-07, "loss": 0.9304, "step": 45749 }, { "epoch": 0.86, "learning_rate": 2.4154354263290854e-07, "loss": 1.0436, "step": 45750 }, { "epoch": 0.86, "learning_rate": 2.41478035561242e-07, "loss": 0.7767, "step": 45751 }, { "epoch": 0.86, "learning_rate": 2.4141253692282734e-07, "loss": 0.784, "step": 45752 }, { "epoch": 0.86, "learning_rate": 2.413470467179091e-07, "loss": 0.9535, "step": 45753 }, { "epoch": 0.86, "learning_rate": 2.412815649467315e-07, "loss": 0.797, "step": 45754 }, { "epoch": 0.86, "learning_rate": 2.412160916095399e-07, "loss": 0.7877, "step": 45755 }, { "epoch": 0.86, "learning_rate": 2.411506267065772e-07, "loss": 1.0593, "step": 45756 }, { "epoch": 0.86, "learning_rate": 2.410851702380898e-07, "loss": 1.071, "step": 45757 }, { "epoch": 0.86, "learning_rate": 2.410197222043206e-07, "loss": 0.8502, "step": 45758 }, { "epoch": 0.86, "learning_rate": 2.4095428260551444e-07, "loss": 0.7459, "step": 45759 }, { "epoch": 0.86, "learning_rate": 2.408888514419158e-07, "loss": 0.7684, "step": 45760 }, { "epoch": 0.86, "learning_rate": 2.4082342871376894e-07, "loss": 0.9281, "step": 45761 }, { "epoch": 0.86, "learning_rate": 2.4075801442131815e-07, "loss": 1.1364, "step": 45762 }, { "epoch": 0.86, "learning_rate": 2.406926085648076e-07, "loss": 1.0764, "step": 45763 }, { "epoch": 0.86, "learning_rate": 2.406272111444821e-07, "loss": 1.0424, "step": 45764 }, { "epoch": 0.86, "learning_rate": 2.4056182216058434e-07, "loss": 0.7893, "step": 45765 }, { "epoch": 0.86, "learning_rate": 2.404964416133598e-07, "loss": 0.8779, "step": 45766 }, { "epoch": 0.86, "learning_rate": 2.4043106950305287e-07, "loss": 0.8085, "step": 45767 }, { "epoch": 0.86, "learning_rate": 2.403657058299061e-07, "loss": 1.008, "step": 45768 }, { "epoch": 0.86, "learning_rate": 2.4030035059416534e-07, "loss": 0.9346, "step": 45769 }, { "epoch": 0.86, "learning_rate": 2.402350037960735e-07, "loss": 0.7707, "step": 45770 }, { "epoch": 0.86, "learning_rate": 2.4016966543587486e-07, "loss": 0.865, "step": 45771 }, { "epoch": 0.86, "learning_rate": 2.401043355138133e-07, "loss": 0.9863, "step": 45772 }, { "epoch": 0.86, "learning_rate": 2.400390140301329e-07, "loss": 0.6069, "step": 45773 }, { "epoch": 0.86, "learning_rate": 2.399737009850775e-07, "loss": 0.9611, "step": 45774 }, { "epoch": 0.86, "learning_rate": 2.399083963788909e-07, "loss": 0.8977, "step": 45775 }, { "epoch": 0.86, "learning_rate": 2.398431002118176e-07, "loss": 0.853, "step": 45776 }, { "epoch": 0.86, "learning_rate": 2.397778124841002e-07, "loss": 0.9606, "step": 45777 }, { "epoch": 0.86, "learning_rate": 2.397125331959838e-07, "loss": 0.8437, "step": 45778 }, { "epoch": 0.86, "learning_rate": 2.3964726234771113e-07, "loss": 0.853, "step": 45779 }, { "epoch": 0.86, "learning_rate": 2.395819999395263e-07, "loss": 1.0051, "step": 45780 }, { "epoch": 0.86, "learning_rate": 2.395167459716727e-07, "loss": 1.1065, "step": 45781 }, { "epoch": 0.86, "learning_rate": 2.3945150044439454e-07, "loss": 1.1364, "step": 45782 }, { "epoch": 0.86, "learning_rate": 2.3938626335793524e-07, "loss": 0.7443, "step": 45783 }, { "epoch": 0.86, "learning_rate": 2.39321034712538e-07, "loss": 0.9132, "step": 45784 }, { "epoch": 0.86, "learning_rate": 2.3925581450844756e-07, "loss": 0.8086, "step": 45785 }, { "epoch": 0.86, "learning_rate": 2.391906027459054e-07, "loss": 0.6756, "step": 45786 }, { "epoch": 0.86, "learning_rate": 2.3912539942515663e-07, "loss": 0.9144, "step": 45787 }, { "epoch": 0.86, "learning_rate": 2.390602045464449e-07, "loss": 0.9959, "step": 45788 }, { "epoch": 0.86, "learning_rate": 2.3899501811001205e-07, "loss": 0.8643, "step": 45789 }, { "epoch": 0.86, "learning_rate": 2.389298401161036e-07, "loss": 0.9287, "step": 45790 }, { "epoch": 0.86, "learning_rate": 2.388646705649611e-07, "loss": 0.7808, "step": 45791 }, { "epoch": 0.86, "learning_rate": 2.387995094568285e-07, "loss": 0.8534, "step": 45792 }, { "epoch": 0.86, "learning_rate": 2.387343567919495e-07, "loss": 1.221, "step": 45793 }, { "epoch": 0.86, "learning_rate": 2.3866921257056696e-07, "loss": 0.8443, "step": 45794 }, { "epoch": 0.86, "learning_rate": 2.386040767929243e-07, "loss": 0.934, "step": 45795 }, { "epoch": 0.86, "learning_rate": 2.3853894945926467e-07, "loss": 0.9566, "step": 45796 }, { "epoch": 0.86, "learning_rate": 2.384738305698314e-07, "loss": 0.9986, "step": 45797 }, { "epoch": 0.86, "learning_rate": 2.3840872012486694e-07, "loss": 0.8931, "step": 45798 }, { "epoch": 0.86, "learning_rate": 2.38343618124616e-07, "loss": 0.7422, "step": 45799 }, { "epoch": 0.86, "learning_rate": 2.3827852456931978e-07, "loss": 1.0642, "step": 45800 }, { "epoch": 0.86, "learning_rate": 2.3821343945922253e-07, "loss": 1.0448, "step": 45801 }, { "epoch": 0.86, "learning_rate": 2.381483627945669e-07, "loss": 0.8035, "step": 45802 }, { "epoch": 0.86, "learning_rate": 2.3808329457559593e-07, "loss": 0.757, "step": 45803 }, { "epoch": 0.86, "learning_rate": 2.3801823480255253e-07, "loss": 0.8146, "step": 45804 }, { "epoch": 0.86, "learning_rate": 2.3795318347567958e-07, "loss": 1.0208, "step": 45805 }, { "epoch": 0.86, "learning_rate": 2.3788814059522074e-07, "loss": 1.2026, "step": 45806 }, { "epoch": 0.86, "learning_rate": 2.3782310616141723e-07, "loss": 1.0911, "step": 45807 }, { "epoch": 0.86, "learning_rate": 2.377580801745133e-07, "loss": 0.8579, "step": 45808 }, { "epoch": 0.86, "learning_rate": 2.3769306263475177e-07, "loss": 0.7145, "step": 45809 }, { "epoch": 0.86, "learning_rate": 2.3762805354237417e-07, "loss": 0.8724, "step": 45810 }, { "epoch": 0.86, "learning_rate": 2.3756305289762498e-07, "loss": 0.8608, "step": 45811 }, { "epoch": 0.86, "learning_rate": 2.3749806070074544e-07, "loss": 1.0427, "step": 45812 }, { "epoch": 0.86, "learning_rate": 2.3743307695197865e-07, "loss": 0.8835, "step": 45813 }, { "epoch": 0.86, "learning_rate": 2.3736810165156777e-07, "loss": 0.8456, "step": 45814 }, { "epoch": 0.86, "learning_rate": 2.3730313479975453e-07, "loss": 0.8293, "step": 45815 }, { "epoch": 0.86, "learning_rate": 2.3723817639678237e-07, "loss": 0.9478, "step": 45816 }, { "epoch": 0.86, "learning_rate": 2.371732264428933e-07, "loss": 0.825, "step": 45817 }, { "epoch": 0.86, "learning_rate": 2.3710828493833077e-07, "loss": 0.8354, "step": 45818 }, { "epoch": 0.86, "learning_rate": 2.370433518833354e-07, "loss": 0.8819, "step": 45819 }, { "epoch": 0.86, "learning_rate": 2.3697842727815168e-07, "loss": 0.8298, "step": 45820 }, { "epoch": 0.86, "learning_rate": 2.3691351112302058e-07, "loss": 0.8934, "step": 45821 }, { "epoch": 0.86, "learning_rate": 2.3684860341818522e-07, "loss": 0.6777, "step": 45822 }, { "epoch": 0.86, "learning_rate": 2.3678370416388764e-07, "loss": 0.8774, "step": 45823 }, { "epoch": 0.86, "learning_rate": 2.3671881336037038e-07, "loss": 0.9969, "step": 45824 }, { "epoch": 0.86, "learning_rate": 2.3665393100787554e-07, "loss": 1.177, "step": 45825 }, { "epoch": 0.86, "learning_rate": 2.3658905710664565e-07, "loss": 0.9718, "step": 45826 }, { "epoch": 0.86, "learning_rate": 2.365241916569233e-07, "loss": 0.8861, "step": 45827 }, { "epoch": 0.86, "learning_rate": 2.3645933465894945e-07, "loss": 1.0258, "step": 45828 }, { "epoch": 0.86, "learning_rate": 2.3639448611296718e-07, "loss": 0.685, "step": 45829 }, { "epoch": 0.86, "learning_rate": 2.3632964601921908e-07, "loss": 1.0323, "step": 45830 }, { "epoch": 0.86, "learning_rate": 2.3626481437794585e-07, "loss": 1.0605, "step": 45831 }, { "epoch": 0.86, "learning_rate": 2.3619999118939112e-07, "loss": 1.051, "step": 45832 }, { "epoch": 0.86, "learning_rate": 2.3613517645379612e-07, "loss": 0.8634, "step": 45833 }, { "epoch": 0.86, "learning_rate": 2.360703701714026e-07, "loss": 0.9163, "step": 45834 }, { "epoch": 0.86, "learning_rate": 2.3600557234245313e-07, "loss": 0.7262, "step": 45835 }, { "epoch": 0.86, "learning_rate": 2.359407829671892e-07, "loss": 0.7724, "step": 45836 }, { "epoch": 0.86, "learning_rate": 2.358760020458531e-07, "loss": 0.9701, "step": 45837 }, { "epoch": 0.86, "learning_rate": 2.3581122957868659e-07, "loss": 0.8553, "step": 45838 }, { "epoch": 0.86, "learning_rate": 2.3574646556593195e-07, "loss": 0.6324, "step": 45839 }, { "epoch": 0.86, "learning_rate": 2.3568171000782985e-07, "loss": 0.9767, "step": 45840 }, { "epoch": 0.86, "learning_rate": 2.3561696290462344e-07, "loss": 0.8618, "step": 45841 }, { "epoch": 0.86, "learning_rate": 2.355522242565536e-07, "loss": 0.7748, "step": 45842 }, { "epoch": 0.86, "learning_rate": 2.354874940638624e-07, "loss": 0.7602, "step": 45843 }, { "epoch": 0.86, "learning_rate": 2.354227723267913e-07, "loss": 0.9748, "step": 45844 }, { "epoch": 0.86, "learning_rate": 2.353580590455823e-07, "loss": 0.908, "step": 45845 }, { "epoch": 0.86, "learning_rate": 2.3529335422047662e-07, "loss": 0.8067, "step": 45846 }, { "epoch": 0.86, "learning_rate": 2.352286578517163e-07, "loss": 0.8495, "step": 45847 }, { "epoch": 0.87, "learning_rate": 2.3516396993954305e-07, "loss": 0.8464, "step": 45848 }, { "epoch": 0.87, "learning_rate": 2.3509929048419728e-07, "loss": 1.1516, "step": 45849 }, { "epoch": 0.87, "learning_rate": 2.3503461948592182e-07, "loss": 0.9637, "step": 45850 }, { "epoch": 0.87, "learning_rate": 2.3496995694495815e-07, "loss": 1.0117, "step": 45851 }, { "epoch": 0.87, "learning_rate": 2.3490530286154612e-07, "loss": 0.7356, "step": 45852 }, { "epoch": 0.87, "learning_rate": 2.3484065723592936e-07, "loss": 1.0865, "step": 45853 }, { "epoch": 0.87, "learning_rate": 2.3477602006834744e-07, "loss": 0.7852, "step": 45854 }, { "epoch": 0.87, "learning_rate": 2.3471139135904263e-07, "loss": 0.8929, "step": 45855 }, { "epoch": 0.87, "learning_rate": 2.346467711082559e-07, "loss": 1.0865, "step": 45856 }, { "epoch": 0.87, "learning_rate": 2.3458215931622868e-07, "loss": 0.856, "step": 45857 }, { "epoch": 0.87, "learning_rate": 2.3451755598320219e-07, "loss": 0.9341, "step": 45858 }, { "epoch": 0.87, "learning_rate": 2.3445296110941763e-07, "loss": 0.7805, "step": 45859 }, { "epoch": 0.87, "learning_rate": 2.34388374695117e-07, "loss": 0.7874, "step": 45860 }, { "epoch": 0.87, "learning_rate": 2.3432379674053957e-07, "loss": 0.8727, "step": 45861 }, { "epoch": 0.87, "learning_rate": 2.3425922724592848e-07, "loss": 1.0797, "step": 45862 }, { "epoch": 0.87, "learning_rate": 2.3419466621152355e-07, "loss": 0.9706, "step": 45863 }, { "epoch": 0.87, "learning_rate": 2.341301136375662e-07, "loss": 0.9529, "step": 45864 }, { "epoch": 0.87, "learning_rate": 2.340655695242977e-07, "loss": 0.7972, "step": 45865 }, { "epoch": 0.87, "learning_rate": 2.3400103387195895e-07, "loss": 0.8253, "step": 45866 }, { "epoch": 0.87, "learning_rate": 2.3393650668079055e-07, "loss": 0.9799, "step": 45867 }, { "epoch": 0.87, "learning_rate": 2.33871987951034e-07, "loss": 0.9715, "step": 45868 }, { "epoch": 0.87, "learning_rate": 2.3380747768293049e-07, "loss": 0.8018, "step": 45869 }, { "epoch": 0.87, "learning_rate": 2.337429758767193e-07, "loss": 1.0034, "step": 45870 }, { "epoch": 0.87, "learning_rate": 2.336784825326427e-07, "loss": 0.7784, "step": 45871 }, { "epoch": 0.87, "learning_rate": 2.336139976509419e-07, "loss": 0.748, "step": 45872 }, { "epoch": 0.87, "learning_rate": 2.3354952123185587e-07, "loss": 0.8063, "step": 45873 }, { "epoch": 0.87, "learning_rate": 2.334850532756275e-07, "loss": 1.1448, "step": 45874 }, { "epoch": 0.87, "learning_rate": 2.334205937824957e-07, "loss": 1.1639, "step": 45875 }, { "epoch": 0.87, "learning_rate": 2.33356142752702e-07, "loss": 0.7168, "step": 45876 }, { "epoch": 0.87, "learning_rate": 2.3329170018648705e-07, "loss": 0.9212, "step": 45877 }, { "epoch": 0.87, "learning_rate": 2.3322726608409146e-07, "loss": 0.8175, "step": 45878 }, { "epoch": 0.87, "learning_rate": 2.3316284044575615e-07, "loss": 0.7354, "step": 45879 }, { "epoch": 0.87, "learning_rate": 2.3309842327172037e-07, "loss": 0.9894, "step": 45880 }, { "epoch": 0.87, "learning_rate": 2.3303401456222648e-07, "loss": 0.9661, "step": 45881 }, { "epoch": 0.87, "learning_rate": 2.3296961431751364e-07, "loss": 0.6933, "step": 45882 }, { "epoch": 0.87, "learning_rate": 2.3290522253782256e-07, "loss": 1.0317, "step": 45883 }, { "epoch": 0.87, "learning_rate": 2.3284083922339413e-07, "loss": 0.9178, "step": 45884 }, { "epoch": 0.87, "learning_rate": 2.3277646437446843e-07, "loss": 0.9395, "step": 45885 }, { "epoch": 0.87, "learning_rate": 2.3271209799128587e-07, "loss": 0.8018, "step": 45886 }, { "epoch": 0.87, "learning_rate": 2.3264774007408676e-07, "loss": 0.9821, "step": 45887 }, { "epoch": 0.87, "learning_rate": 2.3258339062311203e-07, "loss": 0.9863, "step": 45888 }, { "epoch": 0.87, "learning_rate": 2.3251904963860038e-07, "loss": 0.922, "step": 45889 }, { "epoch": 0.87, "learning_rate": 2.3245471712079416e-07, "loss": 0.8416, "step": 45890 }, { "epoch": 0.87, "learning_rate": 2.32390393069932e-07, "loss": 0.999, "step": 45891 }, { "epoch": 0.87, "learning_rate": 2.32326077486254e-07, "loss": 0.73, "step": 45892 }, { "epoch": 0.87, "learning_rate": 2.322617703700017e-07, "loss": 0.9441, "step": 45893 }, { "epoch": 0.87, "learning_rate": 2.3219747172141427e-07, "loss": 0.9407, "step": 45894 }, { "epoch": 0.87, "learning_rate": 2.3213318154073183e-07, "loss": 0.9827, "step": 45895 }, { "epoch": 0.87, "learning_rate": 2.3206889982819447e-07, "loss": 1.0441, "step": 45896 }, { "epoch": 0.87, "learning_rate": 2.3200462658404228e-07, "loss": 0.9435, "step": 45897 }, { "epoch": 0.87, "learning_rate": 2.319403618085156e-07, "loss": 0.8627, "step": 45898 }, { "epoch": 0.87, "learning_rate": 2.318761055018537e-07, "loss": 0.7378, "step": 45899 }, { "epoch": 0.87, "learning_rate": 2.3181185766429747e-07, "loss": 1.1166, "step": 45900 }, { "epoch": 0.87, "learning_rate": 2.3174761829608538e-07, "loss": 0.882, "step": 45901 }, { "epoch": 0.87, "learning_rate": 2.3168338739745888e-07, "loss": 0.8812, "step": 45902 }, { "epoch": 0.87, "learning_rate": 2.3161916496865665e-07, "loss": 0.8105, "step": 45903 }, { "epoch": 0.87, "learning_rate": 2.315549510099191e-07, "loss": 0.8146, "step": 45904 }, { "epoch": 0.87, "learning_rate": 2.314907455214857e-07, "loss": 0.7657, "step": 45905 }, { "epoch": 0.87, "learning_rate": 2.314265485035963e-07, "loss": 1.1638, "step": 45906 }, { "epoch": 0.87, "learning_rate": 2.3136235995649042e-07, "loss": 0.8619, "step": 45907 }, { "epoch": 0.87, "learning_rate": 2.3129817988040813e-07, "loss": 0.6929, "step": 45908 }, { "epoch": 0.87, "learning_rate": 2.3123400827558928e-07, "loss": 0.8571, "step": 45909 }, { "epoch": 0.87, "learning_rate": 2.3116984514227225e-07, "loss": 0.9822, "step": 45910 }, { "epoch": 0.87, "learning_rate": 2.3110569048069826e-07, "loss": 0.8943, "step": 45911 }, { "epoch": 0.87, "learning_rate": 2.3104154429110571e-07, "loss": 0.9534, "step": 45912 }, { "epoch": 0.87, "learning_rate": 2.3097740657373386e-07, "loss": 0.8478, "step": 45913 }, { "epoch": 0.87, "learning_rate": 2.309132773288239e-07, "loss": 0.9183, "step": 45914 }, { "epoch": 0.87, "learning_rate": 2.3084915655661371e-07, "loss": 0.9711, "step": 45915 }, { "epoch": 0.87, "learning_rate": 2.307850442573431e-07, "loss": 0.817, "step": 45916 }, { "epoch": 0.87, "learning_rate": 2.307209404312516e-07, "loss": 1.0115, "step": 45917 }, { "epoch": 0.87, "learning_rate": 2.3065684507857844e-07, "loss": 1.0116, "step": 45918 }, { "epoch": 0.87, "learning_rate": 2.3059275819956316e-07, "loss": 1.1937, "step": 45919 }, { "epoch": 0.87, "learning_rate": 2.3052867979444476e-07, "loss": 0.8882, "step": 45920 }, { "epoch": 0.87, "learning_rate": 2.304646098634633e-07, "loss": 0.7702, "step": 45921 }, { "epoch": 0.87, "learning_rate": 2.3040054840685666e-07, "loss": 0.6617, "step": 45922 }, { "epoch": 0.87, "learning_rate": 2.3033649542486548e-07, "loss": 0.7373, "step": 45923 }, { "epoch": 0.87, "learning_rate": 2.302724509177276e-07, "loss": 1.0124, "step": 45924 }, { "epoch": 0.87, "learning_rate": 2.3020841488568313e-07, "loss": 1.0312, "step": 45925 }, { "epoch": 0.87, "learning_rate": 2.3014438732897076e-07, "loss": 0.9876, "step": 45926 }, { "epoch": 0.87, "learning_rate": 2.3008036824782947e-07, "loss": 1.0435, "step": 45927 }, { "epoch": 0.87, "learning_rate": 2.300163576424988e-07, "loss": 0.7624, "step": 45928 }, { "epoch": 0.87, "learning_rate": 2.2995235551321714e-07, "loss": 0.9341, "step": 45929 }, { "epoch": 0.87, "learning_rate": 2.2988836186022433e-07, "loss": 0.7383, "step": 45930 }, { "epoch": 0.87, "learning_rate": 2.2982437668375794e-07, "loss": 1.0335, "step": 45931 }, { "epoch": 0.87, "learning_rate": 2.2976039998405864e-07, "loss": 0.8815, "step": 45932 }, { "epoch": 0.87, "learning_rate": 2.2969643176136398e-07, "loss": 0.9615, "step": 45933 }, { "epoch": 0.87, "learning_rate": 2.2963247201591264e-07, "loss": 0.8722, "step": 45934 }, { "epoch": 0.87, "learning_rate": 2.2956852074794506e-07, "loss": 0.897, "step": 45935 }, { "epoch": 0.87, "learning_rate": 2.2950457795769848e-07, "loss": 0.7506, "step": 45936 }, { "epoch": 0.87, "learning_rate": 2.2944064364541218e-07, "loss": 1.0674, "step": 45937 }, { "epoch": 0.87, "learning_rate": 2.2937671781132488e-07, "loss": 1.2863, "step": 45938 }, { "epoch": 0.87, "learning_rate": 2.293128004556755e-07, "loss": 0.9225, "step": 45939 }, { "epoch": 0.87, "learning_rate": 2.2924889157870222e-07, "loss": 0.8652, "step": 45940 }, { "epoch": 0.87, "learning_rate": 2.291849911806443e-07, "loss": 0.8275, "step": 45941 }, { "epoch": 0.87, "learning_rate": 2.2912109926174013e-07, "loss": 0.9065, "step": 45942 }, { "epoch": 0.87, "learning_rate": 2.2905721582222735e-07, "loss": 1.0157, "step": 45943 }, { "epoch": 0.87, "learning_rate": 2.2899334086234625e-07, "loss": 0.9949, "step": 45944 }, { "epoch": 0.87, "learning_rate": 2.2892947438233391e-07, "loss": 1.0323, "step": 45945 }, { "epoch": 0.87, "learning_rate": 2.2886561638242933e-07, "loss": 0.9497, "step": 45946 }, { "epoch": 0.87, "learning_rate": 2.2880176686287086e-07, "loss": 0.9291, "step": 45947 }, { "epoch": 0.87, "learning_rate": 2.287379258238967e-07, "loss": 0.9214, "step": 45948 }, { "epoch": 0.87, "learning_rate": 2.286740932657458e-07, "loss": 0.941, "step": 45949 }, { "epoch": 0.87, "learning_rate": 2.2861026918865603e-07, "loss": 0.9454, "step": 45950 }, { "epoch": 0.87, "learning_rate": 2.2854645359286665e-07, "loss": 0.9876, "step": 45951 }, { "epoch": 0.87, "learning_rate": 2.2848264647861386e-07, "loss": 0.9055, "step": 45952 }, { "epoch": 0.87, "learning_rate": 2.2841884784613827e-07, "loss": 0.8798, "step": 45953 }, { "epoch": 0.87, "learning_rate": 2.283550576956767e-07, "loss": 0.9184, "step": 45954 }, { "epoch": 0.87, "learning_rate": 2.282912760274672e-07, "loss": 1.0787, "step": 45955 }, { "epoch": 0.87, "learning_rate": 2.2822750284174938e-07, "loss": 1.0023, "step": 45956 }, { "epoch": 0.87, "learning_rate": 2.281637381387597e-07, "loss": 0.8278, "step": 45957 }, { "epoch": 0.87, "learning_rate": 2.2809998191873711e-07, "loss": 0.6857, "step": 45958 }, { "epoch": 0.87, "learning_rate": 2.280362341819195e-07, "loss": 0.6401, "step": 45959 }, { "epoch": 0.87, "learning_rate": 2.27972494928545e-07, "loss": 0.9612, "step": 45960 }, { "epoch": 0.87, "learning_rate": 2.2790876415885176e-07, "loss": 0.75, "step": 45961 }, { "epoch": 0.87, "learning_rate": 2.278450418730771e-07, "loss": 0.9641, "step": 45962 }, { "epoch": 0.87, "learning_rate": 2.2778132807146024e-07, "loss": 0.8725, "step": 45963 }, { "epoch": 0.87, "learning_rate": 2.2771762275423713e-07, "loss": 0.9322, "step": 45964 }, { "epoch": 0.87, "learning_rate": 2.2765392592164758e-07, "loss": 1.0518, "step": 45965 }, { "epoch": 0.87, "learning_rate": 2.2759023757392806e-07, "loss": 0.7321, "step": 45966 }, { "epoch": 0.87, "learning_rate": 2.2752655771131726e-07, "loss": 0.7738, "step": 45967 }, { "epoch": 0.87, "learning_rate": 2.274628863340525e-07, "loss": 1.0975, "step": 45968 }, { "epoch": 0.87, "learning_rate": 2.2739922344237137e-07, "loss": 1.0393, "step": 45969 }, { "epoch": 0.87, "learning_rate": 2.2733556903651227e-07, "loss": 0.8867, "step": 45970 }, { "epoch": 0.87, "learning_rate": 2.2727192311671226e-07, "loss": 0.9987, "step": 45971 }, { "epoch": 0.87, "learning_rate": 2.2720828568320945e-07, "loss": 0.7976, "step": 45972 }, { "epoch": 0.87, "learning_rate": 2.2714465673624065e-07, "loss": 0.9452, "step": 45973 }, { "epoch": 0.87, "learning_rate": 2.2708103627604477e-07, "loss": 0.9102, "step": 45974 }, { "epoch": 0.87, "learning_rate": 2.2701742430285833e-07, "loss": 1.0847, "step": 45975 }, { "epoch": 0.87, "learning_rate": 2.2695382081691835e-07, "loss": 0.8794, "step": 45976 }, { "epoch": 0.87, "learning_rate": 2.2689022581846436e-07, "loss": 0.7427, "step": 45977 }, { "epoch": 0.87, "learning_rate": 2.2682663930773203e-07, "loss": 0.8025, "step": 45978 }, { "epoch": 0.87, "learning_rate": 2.2676306128495918e-07, "loss": 0.8165, "step": 45979 }, { "epoch": 0.87, "learning_rate": 2.266994917503834e-07, "loss": 0.9435, "step": 45980 }, { "epoch": 0.87, "learning_rate": 2.2663593070424207e-07, "loss": 1.3894, "step": 45981 }, { "epoch": 0.87, "learning_rate": 2.265723781467724e-07, "loss": 0.8221, "step": 45982 }, { "epoch": 0.87, "learning_rate": 2.2650883407821207e-07, "loss": 0.8953, "step": 45983 }, { "epoch": 0.87, "learning_rate": 2.2644529849879805e-07, "loss": 0.7954, "step": 45984 }, { "epoch": 0.87, "learning_rate": 2.263817714087671e-07, "loss": 0.7625, "step": 45985 }, { "epoch": 0.87, "learning_rate": 2.2631825280835739e-07, "loss": 0.8262, "step": 45986 }, { "epoch": 0.87, "learning_rate": 2.2625474269780538e-07, "loss": 0.9047, "step": 45987 }, { "epoch": 0.87, "learning_rate": 2.2619124107734842e-07, "loss": 0.907, "step": 45988 }, { "epoch": 0.87, "learning_rate": 2.2612774794722374e-07, "loss": 0.8986, "step": 45989 }, { "epoch": 0.87, "learning_rate": 2.2606426330766818e-07, "loss": 1.0092, "step": 45990 }, { "epoch": 0.87, "learning_rate": 2.2600078715891898e-07, "loss": 0.9164, "step": 45991 }, { "epoch": 0.87, "learning_rate": 2.2593731950121323e-07, "loss": 0.8058, "step": 45992 }, { "epoch": 0.87, "learning_rate": 2.258738603347882e-07, "loss": 0.981, "step": 45993 }, { "epoch": 0.87, "learning_rate": 2.2581040965987954e-07, "loss": 1.0207, "step": 45994 }, { "epoch": 0.87, "learning_rate": 2.2574696747672597e-07, "loss": 0.9714, "step": 45995 }, { "epoch": 0.87, "learning_rate": 2.2568353378556313e-07, "loss": 0.8484, "step": 45996 }, { "epoch": 0.87, "learning_rate": 2.2562010858662746e-07, "loss": 0.8863, "step": 45997 }, { "epoch": 0.87, "learning_rate": 2.25556691880158e-07, "loss": 0.8393, "step": 45998 }, { "epoch": 0.87, "learning_rate": 2.2549328366638924e-07, "loss": 1.0873, "step": 45999 }, { "epoch": 0.87, "learning_rate": 2.2542988394555903e-07, "loss": 1.1556, "step": 46000 }, { "epoch": 0.87, "learning_rate": 2.253664927179039e-07, "loss": 1.0182, "step": 46001 }, { "epoch": 0.87, "learning_rate": 2.2530310998366028e-07, "loss": 0.8045, "step": 46002 }, { "epoch": 0.87, "learning_rate": 2.2523973574306523e-07, "loss": 0.9406, "step": 46003 }, { "epoch": 0.87, "learning_rate": 2.251763699963555e-07, "loss": 0.6934, "step": 46004 }, { "epoch": 0.87, "learning_rate": 2.2511301274376756e-07, "loss": 0.8192, "step": 46005 }, { "epoch": 0.87, "learning_rate": 2.2504966398553735e-07, "loss": 0.9394, "step": 46006 }, { "epoch": 0.87, "learning_rate": 2.2498632372190244e-07, "loss": 0.7875, "step": 46007 }, { "epoch": 0.87, "learning_rate": 2.2492299195309876e-07, "loss": 0.8291, "step": 46008 }, { "epoch": 0.87, "learning_rate": 2.2485966867936275e-07, "loss": 0.9184, "step": 46009 }, { "epoch": 0.87, "learning_rate": 2.2479635390093096e-07, "loss": 0.9154, "step": 46010 }, { "epoch": 0.87, "learning_rate": 2.2473304761803983e-07, "loss": 0.803, "step": 46011 }, { "epoch": 0.87, "learning_rate": 2.2466974983092553e-07, "loss": 1.0781, "step": 46012 }, { "epoch": 0.87, "learning_rate": 2.2460646053982486e-07, "loss": 0.932, "step": 46013 }, { "epoch": 0.87, "learning_rate": 2.245431797449743e-07, "loss": 0.8008, "step": 46014 }, { "epoch": 0.87, "learning_rate": 2.244799074466089e-07, "loss": 0.8529, "step": 46015 }, { "epoch": 0.87, "learning_rate": 2.2441664364496656e-07, "loss": 0.8097, "step": 46016 }, { "epoch": 0.87, "learning_rate": 2.2435338834028236e-07, "loss": 1.0154, "step": 46017 }, { "epoch": 0.87, "learning_rate": 2.242901415327922e-07, "loss": 0.913, "step": 46018 }, { "epoch": 0.87, "learning_rate": 2.24226903222734e-07, "loss": 1.1353, "step": 46019 }, { "epoch": 0.87, "learning_rate": 2.2416367341034223e-07, "loss": 0.8353, "step": 46020 }, { "epoch": 0.87, "learning_rate": 2.241004520958534e-07, "loss": 0.7861, "step": 46021 }, { "epoch": 0.87, "learning_rate": 2.2403723927950372e-07, "loss": 0.8603, "step": 46022 }, { "epoch": 0.87, "learning_rate": 2.2397403496152936e-07, "loss": 0.7215, "step": 46023 }, { "epoch": 0.87, "learning_rate": 2.2391083914216598e-07, "loss": 0.7152, "step": 46024 }, { "epoch": 0.87, "learning_rate": 2.2384765182165008e-07, "loss": 0.9369, "step": 46025 }, { "epoch": 0.87, "learning_rate": 2.2378447300021727e-07, "loss": 1.0697, "step": 46026 }, { "epoch": 0.87, "learning_rate": 2.2372130267810293e-07, "loss": 0.7404, "step": 46027 }, { "epoch": 0.87, "learning_rate": 2.236581408555441e-07, "loss": 0.763, "step": 46028 }, { "epoch": 0.87, "learning_rate": 2.235949875327756e-07, "loss": 0.8288, "step": 46029 }, { "epoch": 0.87, "learning_rate": 2.2353184271003358e-07, "loss": 0.9018, "step": 46030 }, { "epoch": 0.87, "learning_rate": 2.2346870638755402e-07, "loss": 0.9881, "step": 46031 }, { "epoch": 0.87, "learning_rate": 2.2340557856557228e-07, "loss": 0.8533, "step": 46032 }, { "epoch": 0.87, "learning_rate": 2.2334245924432452e-07, "loss": 0.7695, "step": 46033 }, { "epoch": 0.87, "learning_rate": 2.2327934842404615e-07, "loss": 0.7539, "step": 46034 }, { "epoch": 0.87, "learning_rate": 2.2321624610497332e-07, "loss": 0.9556, "step": 46035 }, { "epoch": 0.87, "learning_rate": 2.2315315228734035e-07, "loss": 1.0018, "step": 46036 }, { "epoch": 0.87, "learning_rate": 2.2309006697138453e-07, "loss": 1.0908, "step": 46037 }, { "epoch": 0.87, "learning_rate": 2.230269901573401e-07, "loss": 0.9699, "step": 46038 }, { "epoch": 0.87, "learning_rate": 2.2296392184544268e-07, "loss": 0.997, "step": 46039 }, { "epoch": 0.87, "learning_rate": 2.229008620359291e-07, "loss": 0.9962, "step": 46040 }, { "epoch": 0.87, "learning_rate": 2.2283781072903355e-07, "loss": 0.8003, "step": 46041 }, { "epoch": 0.87, "learning_rate": 2.227747679249917e-07, "loss": 0.5953, "step": 46042 }, { "epoch": 0.87, "learning_rate": 2.2271173362403892e-07, "loss": 0.9921, "step": 46043 }, { "epoch": 0.87, "learning_rate": 2.2264870782641084e-07, "loss": 1.1814, "step": 46044 }, { "epoch": 0.87, "learning_rate": 2.2258569053234257e-07, "loss": 0.7187, "step": 46045 }, { "epoch": 0.87, "learning_rate": 2.225226817420695e-07, "loss": 1.0229, "step": 46046 }, { "epoch": 0.87, "learning_rate": 2.2245968145582747e-07, "loss": 0.8447, "step": 46047 }, { "epoch": 0.87, "learning_rate": 2.2239668967384998e-07, "loss": 1.0033, "step": 46048 }, { "epoch": 0.87, "learning_rate": 2.2233370639637458e-07, "loss": 0.8502, "step": 46049 }, { "epoch": 0.87, "learning_rate": 2.22270731623635e-07, "loss": 1.0272, "step": 46050 }, { "epoch": 0.87, "learning_rate": 2.222077653558663e-07, "loss": 0.83, "step": 46051 }, { "epoch": 0.87, "learning_rate": 2.2214480759330414e-07, "loss": 0.9349, "step": 46052 }, { "epoch": 0.87, "learning_rate": 2.2208185833618333e-07, "loss": 0.901, "step": 46053 }, { "epoch": 0.87, "learning_rate": 2.2201891758473926e-07, "loss": 0.8578, "step": 46054 }, { "epoch": 0.87, "learning_rate": 2.2195598533920642e-07, "loss": 1.0805, "step": 46055 }, { "epoch": 0.87, "learning_rate": 2.2189306159982077e-07, "loss": 0.9355, "step": 46056 }, { "epoch": 0.87, "learning_rate": 2.2183014636681545e-07, "loss": 1.056, "step": 46057 }, { "epoch": 0.87, "learning_rate": 2.2176723964042745e-07, "loss": 0.8457, "step": 46058 }, { "epoch": 0.87, "learning_rate": 2.2170434142089054e-07, "loss": 0.771, "step": 46059 }, { "epoch": 0.87, "learning_rate": 2.2164145170843892e-07, "loss": 0.7006, "step": 46060 }, { "epoch": 0.87, "learning_rate": 2.215785705033094e-07, "loss": 0.9529, "step": 46061 }, { "epoch": 0.87, "learning_rate": 2.2151569780573535e-07, "loss": 1.1277, "step": 46062 }, { "epoch": 0.87, "learning_rate": 2.214528336159516e-07, "loss": 1.1374, "step": 46063 }, { "epoch": 0.87, "learning_rate": 2.2138997793419298e-07, "loss": 0.8509, "step": 46064 }, { "epoch": 0.87, "learning_rate": 2.2132713076069456e-07, "loss": 0.7828, "step": 46065 }, { "epoch": 0.87, "learning_rate": 2.2126429209569062e-07, "loss": 0.8694, "step": 46066 }, { "epoch": 0.87, "learning_rate": 2.212014619394162e-07, "loss": 0.9635, "step": 46067 }, { "epoch": 0.87, "learning_rate": 2.211386402921059e-07, "loss": 1.1343, "step": 46068 }, { "epoch": 0.87, "learning_rate": 2.2107582715399313e-07, "loss": 0.9991, "step": 46069 }, { "epoch": 0.87, "learning_rate": 2.2101302252531432e-07, "loss": 0.7869, "step": 46070 }, { "epoch": 0.87, "learning_rate": 2.2095022640630236e-07, "loss": 0.9674, "step": 46071 }, { "epoch": 0.87, "learning_rate": 2.2088743879719267e-07, "loss": 0.788, "step": 46072 }, { "epoch": 0.87, "learning_rate": 2.2082465969821916e-07, "loss": 0.8746, "step": 46073 }, { "epoch": 0.87, "learning_rate": 2.2076188910961665e-07, "loss": 1.0207, "step": 46074 }, { "epoch": 0.87, "learning_rate": 2.2069912703161944e-07, "loss": 1.0502, "step": 46075 }, { "epoch": 0.87, "learning_rate": 2.2063637346446148e-07, "loss": 0.9236, "step": 46076 }, { "epoch": 0.87, "learning_rate": 2.2057362840837814e-07, "loss": 0.7, "step": 46077 }, { "epoch": 0.87, "learning_rate": 2.2051089186360203e-07, "loss": 1.0149, "step": 46078 }, { "epoch": 0.87, "learning_rate": 2.2044816383036932e-07, "loss": 0.6833, "step": 46079 }, { "epoch": 0.87, "learning_rate": 2.2038544430891262e-07, "loss": 0.9766, "step": 46080 }, { "epoch": 0.87, "learning_rate": 2.2032273329946645e-07, "loss": 1.3305, "step": 46081 }, { "epoch": 0.87, "learning_rate": 2.2026003080226622e-07, "loss": 0.9601, "step": 46082 }, { "epoch": 0.87, "learning_rate": 2.2019733681754474e-07, "loss": 0.8596, "step": 46083 }, { "epoch": 0.87, "learning_rate": 2.201346513455363e-07, "loss": 0.9994, "step": 46084 }, { "epoch": 0.87, "learning_rate": 2.2007197438647543e-07, "loss": 0.6572, "step": 46085 }, { "epoch": 0.87, "learning_rate": 2.2000930594059556e-07, "loss": 0.9359, "step": 46086 }, { "epoch": 0.87, "learning_rate": 2.1994664600813148e-07, "loss": 1.0001, "step": 46087 }, { "epoch": 0.87, "learning_rate": 2.1988399458931636e-07, "loss": 1.062, "step": 46088 }, { "epoch": 0.87, "learning_rate": 2.1982135168438502e-07, "loss": 1.154, "step": 46089 }, { "epoch": 0.87, "learning_rate": 2.1975871729357e-07, "loss": 0.9401, "step": 46090 }, { "epoch": 0.87, "learning_rate": 2.1969609141710702e-07, "loss": 0.843, "step": 46091 }, { "epoch": 0.87, "learning_rate": 2.1963347405522834e-07, "loss": 0.8501, "step": 46092 }, { "epoch": 0.87, "learning_rate": 2.1957086520816823e-07, "loss": 1.2137, "step": 46093 }, { "epoch": 0.87, "learning_rate": 2.1950826487616068e-07, "loss": 1.0895, "step": 46094 }, { "epoch": 0.87, "learning_rate": 2.1944567305943937e-07, "loss": 0.8914, "step": 46095 }, { "epoch": 0.87, "learning_rate": 2.19383089758238e-07, "loss": 0.721, "step": 46096 }, { "epoch": 0.87, "learning_rate": 2.1932051497279033e-07, "loss": 0.9116, "step": 46097 }, { "epoch": 0.87, "learning_rate": 2.1925794870333027e-07, "loss": 0.9374, "step": 46098 }, { "epoch": 0.87, "learning_rate": 2.1919539095009019e-07, "loss": 0.6965, "step": 46099 }, { "epoch": 0.87, "learning_rate": 2.1913284171330568e-07, "loss": 0.777, "step": 46100 }, { "epoch": 0.87, "learning_rate": 2.1907030099320854e-07, "loss": 0.7146, "step": 46101 }, { "epoch": 0.87, "learning_rate": 2.1900776879003272e-07, "loss": 0.9716, "step": 46102 }, { "epoch": 0.87, "learning_rate": 2.1894524510401278e-07, "loss": 0.9297, "step": 46103 }, { "epoch": 0.87, "learning_rate": 2.1888272993538075e-07, "loss": 0.8188, "step": 46104 }, { "epoch": 0.87, "learning_rate": 2.1882022328437086e-07, "loss": 1.0089, "step": 46105 }, { "epoch": 0.87, "learning_rate": 2.1875772515121602e-07, "loss": 1.0209, "step": 46106 }, { "epoch": 0.87, "learning_rate": 2.186952355361502e-07, "loss": 0.9232, "step": 46107 }, { "epoch": 0.87, "learning_rate": 2.1863275443940623e-07, "loss": 0.8509, "step": 46108 }, { "epoch": 0.87, "learning_rate": 2.185702818612176e-07, "loss": 0.7833, "step": 46109 }, { "epoch": 0.87, "learning_rate": 2.1850781780181823e-07, "loss": 0.7433, "step": 46110 }, { "epoch": 0.87, "learning_rate": 2.184453622614402e-07, "loss": 1.028, "step": 46111 }, { "epoch": 0.87, "learning_rate": 2.1838291524031718e-07, "loss": 1.1727, "step": 46112 }, { "epoch": 0.87, "learning_rate": 2.1832047673868234e-07, "loss": 0.8137, "step": 46113 }, { "epoch": 0.87, "learning_rate": 2.182580467567691e-07, "loss": 0.8828, "step": 46114 }, { "epoch": 0.87, "learning_rate": 2.1819562529481002e-07, "loss": 0.8441, "step": 46115 }, { "epoch": 0.87, "learning_rate": 2.1813321235303887e-07, "loss": 1.0146, "step": 46116 }, { "epoch": 0.87, "learning_rate": 2.1807080793168845e-07, "loss": 0.915, "step": 46117 }, { "epoch": 0.87, "learning_rate": 2.180084120309911e-07, "loss": 0.9061, "step": 46118 }, { "epoch": 0.87, "learning_rate": 2.1794602465118108e-07, "loss": 1.0862, "step": 46119 }, { "epoch": 0.87, "learning_rate": 2.1788364579249017e-07, "loss": 0.7706, "step": 46120 }, { "epoch": 0.87, "learning_rate": 2.1782127545515175e-07, "loss": 1.0227, "step": 46121 }, { "epoch": 0.87, "learning_rate": 2.1775891363939872e-07, "loss": 0.631, "step": 46122 }, { "epoch": 0.87, "learning_rate": 2.1769656034546423e-07, "loss": 0.9089, "step": 46123 }, { "epoch": 0.87, "learning_rate": 2.1763421557358055e-07, "loss": 1.0008, "step": 46124 }, { "epoch": 0.87, "learning_rate": 2.175718793239806e-07, "loss": 1.1978, "step": 46125 }, { "epoch": 0.87, "learning_rate": 2.175095515968978e-07, "loss": 0.8173, "step": 46126 }, { "epoch": 0.87, "learning_rate": 2.174472323925636e-07, "loss": 0.8848, "step": 46127 }, { "epoch": 0.87, "learning_rate": 2.1738492171121173e-07, "loss": 0.874, "step": 46128 }, { "epoch": 0.87, "learning_rate": 2.1732261955307505e-07, "loss": 0.7537, "step": 46129 }, { "epoch": 0.87, "learning_rate": 2.1726032591838503e-07, "loss": 0.9887, "step": 46130 }, { "epoch": 0.87, "learning_rate": 2.1719804080737566e-07, "loss": 1.0629, "step": 46131 }, { "epoch": 0.87, "learning_rate": 2.1713576422027845e-07, "loss": 0.8043, "step": 46132 }, { "epoch": 0.87, "learning_rate": 2.170734961573262e-07, "loss": 0.7265, "step": 46133 }, { "epoch": 0.87, "learning_rate": 2.1701123661875155e-07, "loss": 0.9848, "step": 46134 }, { "epoch": 0.87, "learning_rate": 2.169489856047871e-07, "loss": 0.786, "step": 46135 }, { "epoch": 0.87, "learning_rate": 2.1688674311566489e-07, "loss": 0.7579, "step": 46136 }, { "epoch": 0.87, "learning_rate": 2.1682450915161774e-07, "loss": 1.1187, "step": 46137 }, { "epoch": 0.87, "learning_rate": 2.1676228371287827e-07, "loss": 0.7463, "step": 46138 }, { "epoch": 0.87, "learning_rate": 2.167000667996777e-07, "loss": 0.661, "step": 46139 }, { "epoch": 0.87, "learning_rate": 2.1663785841224972e-07, "loss": 1.1066, "step": 46140 }, { "epoch": 0.87, "learning_rate": 2.1657565855082552e-07, "loss": 0.8414, "step": 46141 }, { "epoch": 0.87, "learning_rate": 2.16513467215638e-07, "loss": 0.7799, "step": 46142 }, { "epoch": 0.87, "learning_rate": 2.1645128440691914e-07, "loss": 1.1991, "step": 46143 }, { "epoch": 0.87, "learning_rate": 2.1638911012490104e-07, "loss": 1.0571, "step": 46144 }, { "epoch": 0.87, "learning_rate": 2.16326944369816e-07, "loss": 0.9099, "step": 46145 }, { "epoch": 0.87, "learning_rate": 2.1626478714189602e-07, "loss": 0.6499, "step": 46146 }, { "epoch": 0.87, "learning_rate": 2.1620263844137402e-07, "loss": 0.6914, "step": 46147 }, { "epoch": 0.87, "learning_rate": 2.1614049826848034e-07, "loss": 0.8132, "step": 46148 }, { "epoch": 0.87, "learning_rate": 2.160783666234484e-07, "loss": 1.0132, "step": 46149 }, { "epoch": 0.87, "learning_rate": 2.160162435065105e-07, "loss": 1.0262, "step": 46150 }, { "epoch": 0.87, "learning_rate": 2.159541289178968e-07, "loss": 0.8759, "step": 46151 }, { "epoch": 0.87, "learning_rate": 2.1589202285784123e-07, "loss": 0.8773, "step": 46152 }, { "epoch": 0.87, "learning_rate": 2.1582992532657444e-07, "loss": 0.9187, "step": 46153 }, { "epoch": 0.87, "learning_rate": 2.1576783632432875e-07, "loss": 0.7639, "step": 46154 }, { "epoch": 0.87, "learning_rate": 2.1570575585133563e-07, "loss": 0.7309, "step": 46155 }, { "epoch": 0.87, "learning_rate": 2.1564368390782742e-07, "loss": 1.0459, "step": 46156 }, { "epoch": 0.87, "learning_rate": 2.1558162049403557e-07, "loss": 0.9107, "step": 46157 }, { "epoch": 0.87, "learning_rate": 2.1551956561019216e-07, "loss": 0.8252, "step": 46158 }, { "epoch": 0.87, "learning_rate": 2.154575192565289e-07, "loss": 0.8846, "step": 46159 }, { "epoch": 0.87, "learning_rate": 2.153954814332762e-07, "loss": 0.783, "step": 46160 }, { "epoch": 0.87, "learning_rate": 2.1533345214066775e-07, "loss": 0.9766, "step": 46161 }, { "epoch": 0.87, "learning_rate": 2.1527143137893363e-07, "loss": 1.2962, "step": 46162 }, { "epoch": 0.87, "learning_rate": 2.1520941914830617e-07, "loss": 1.0656, "step": 46163 }, { "epoch": 0.87, "learning_rate": 2.151474154490163e-07, "loss": 1.0823, "step": 46164 }, { "epoch": 0.87, "learning_rate": 2.1508542028129632e-07, "loss": 0.9157, "step": 46165 }, { "epoch": 0.87, "learning_rate": 2.1502343364537715e-07, "loss": 0.6653, "step": 46166 }, { "epoch": 0.87, "learning_rate": 2.149614555414903e-07, "loss": 0.8585, "step": 46167 }, { "epoch": 0.87, "learning_rate": 2.1489948596986777e-07, "loss": 0.8939, "step": 46168 }, { "epoch": 0.87, "learning_rate": 2.1483752493073968e-07, "loss": 0.926, "step": 46169 }, { "epoch": 0.87, "learning_rate": 2.147755724243386e-07, "loss": 0.8845, "step": 46170 }, { "epoch": 0.87, "learning_rate": 2.1471362845089605e-07, "loss": 0.9462, "step": 46171 }, { "epoch": 0.87, "learning_rate": 2.146516930106418e-07, "loss": 0.9543, "step": 46172 }, { "epoch": 0.87, "learning_rate": 2.1458976610380904e-07, "loss": 0.9189, "step": 46173 }, { "epoch": 0.87, "learning_rate": 2.145278477306273e-07, "loss": 0.9216, "step": 46174 }, { "epoch": 0.87, "learning_rate": 2.1446593789132885e-07, "loss": 1.0046, "step": 46175 }, { "epoch": 0.87, "learning_rate": 2.1440403658614412e-07, "loss": 0.9643, "step": 46176 }, { "epoch": 0.87, "learning_rate": 2.1434214381530483e-07, "loss": 0.9492, "step": 46177 }, { "epoch": 0.87, "learning_rate": 2.142802595790419e-07, "loss": 0.8524, "step": 46178 }, { "epoch": 0.87, "learning_rate": 2.142183838775866e-07, "loss": 0.8223, "step": 46179 }, { "epoch": 0.87, "learning_rate": 2.1415651671117005e-07, "loss": 0.9961, "step": 46180 }, { "epoch": 0.87, "learning_rate": 2.140946580800221e-07, "loss": 1.0638, "step": 46181 }, { "epoch": 0.87, "learning_rate": 2.1403280798437538e-07, "loss": 0.9559, "step": 46182 }, { "epoch": 0.87, "learning_rate": 2.1397096642445963e-07, "loss": 1.0472, "step": 46183 }, { "epoch": 0.87, "learning_rate": 2.139091334005064e-07, "loss": 0.9363, "step": 46184 }, { "epoch": 0.87, "learning_rate": 2.138473089127463e-07, "loss": 0.825, "step": 46185 }, { "epoch": 0.87, "learning_rate": 2.1378549296141e-07, "loss": 1.0933, "step": 46186 }, { "epoch": 0.87, "learning_rate": 2.1372368554672894e-07, "loss": 1.086, "step": 46187 }, { "epoch": 0.87, "learning_rate": 2.136618866689333e-07, "loss": 0.7331, "step": 46188 }, { "epoch": 0.87, "learning_rate": 2.1360009632825474e-07, "loss": 0.9255, "step": 46189 }, { "epoch": 0.87, "learning_rate": 2.1353831452492203e-07, "loss": 0.5959, "step": 46190 }, { "epoch": 0.87, "learning_rate": 2.13476541259168e-07, "loss": 0.8499, "step": 46191 }, { "epoch": 0.87, "learning_rate": 2.134147765312228e-07, "loss": 0.7735, "step": 46192 }, { "epoch": 0.87, "learning_rate": 2.1335302034131562e-07, "loss": 0.9943, "step": 46193 }, { "epoch": 0.87, "learning_rate": 2.1329127268967935e-07, "loss": 1.136, "step": 46194 }, { "epoch": 0.87, "learning_rate": 2.1322953357654275e-07, "loss": 0.8964, "step": 46195 }, { "epoch": 0.87, "learning_rate": 2.1316780300213695e-07, "loss": 0.8557, "step": 46196 }, { "epoch": 0.87, "learning_rate": 2.131060809666924e-07, "loss": 0.9283, "step": 46197 }, { "epoch": 0.87, "learning_rate": 2.1304436747043966e-07, "loss": 0.8973, "step": 46198 }, { "epoch": 0.87, "learning_rate": 2.1298266251360916e-07, "loss": 0.9514, "step": 46199 }, { "epoch": 0.87, "learning_rate": 2.1292096609643125e-07, "loss": 0.925, "step": 46200 }, { "epoch": 0.87, "learning_rate": 2.128592782191369e-07, "loss": 0.9405, "step": 46201 }, { "epoch": 0.87, "learning_rate": 2.12797598881955e-07, "loss": 0.8943, "step": 46202 }, { "epoch": 0.87, "learning_rate": 2.127359280851174e-07, "loss": 0.8923, "step": 46203 }, { "epoch": 0.87, "learning_rate": 2.1267426582885358e-07, "loss": 0.8315, "step": 46204 }, { "epoch": 0.87, "learning_rate": 2.1261261211339367e-07, "loss": 0.95, "step": 46205 }, { "epoch": 0.87, "learning_rate": 2.125509669389683e-07, "loss": 0.9915, "step": 46206 }, { "epoch": 0.87, "learning_rate": 2.1248933030580732e-07, "loss": 1.0806, "step": 46207 }, { "epoch": 0.87, "learning_rate": 2.1242770221414105e-07, "loss": 0.9479, "step": 46208 }, { "epoch": 0.87, "learning_rate": 2.123660826641996e-07, "loss": 0.8532, "step": 46209 }, { "epoch": 0.87, "learning_rate": 2.1230447165621366e-07, "loss": 0.8314, "step": 46210 }, { "epoch": 0.87, "learning_rate": 2.1224286919041158e-07, "loss": 0.7259, "step": 46211 }, { "epoch": 0.87, "learning_rate": 2.121812752670252e-07, "loss": 1.2248, "step": 46212 }, { "epoch": 0.87, "learning_rate": 2.12119689886284e-07, "loss": 1.1459, "step": 46213 }, { "epoch": 0.87, "learning_rate": 2.12058113048417e-07, "loss": 1.0469, "step": 46214 }, { "epoch": 0.87, "learning_rate": 2.1199654475365567e-07, "loss": 0.8136, "step": 46215 }, { "epoch": 0.87, "learning_rate": 2.119349850022287e-07, "loss": 0.9232, "step": 46216 }, { "epoch": 0.87, "learning_rate": 2.118734337943662e-07, "loss": 1.0371, "step": 46217 }, { "epoch": 0.87, "learning_rate": 2.1181189113029828e-07, "loss": 1.2174, "step": 46218 }, { "epoch": 0.87, "learning_rate": 2.1175035701025442e-07, "loss": 1.0214, "step": 46219 }, { "epoch": 0.87, "learning_rate": 2.1168883143446478e-07, "loss": 0.7451, "step": 46220 }, { "epoch": 0.87, "learning_rate": 2.1162731440315888e-07, "loss": 0.8937, "step": 46221 }, { "epoch": 0.87, "learning_rate": 2.115658059165668e-07, "loss": 0.8475, "step": 46222 }, { "epoch": 0.87, "learning_rate": 2.1150430597491696e-07, "loss": 0.8617, "step": 46223 }, { "epoch": 0.87, "learning_rate": 2.1144281457844056e-07, "loss": 0.9848, "step": 46224 }, { "epoch": 0.87, "learning_rate": 2.1138133172736634e-07, "loss": 1.1437, "step": 46225 }, { "epoch": 0.87, "learning_rate": 2.1131985742192413e-07, "loss": 0.8755, "step": 46226 }, { "epoch": 0.87, "learning_rate": 2.1125839166234314e-07, "loss": 0.934, "step": 46227 }, { "epoch": 0.87, "learning_rate": 2.111969344488532e-07, "loss": 0.8635, "step": 46228 }, { "epoch": 0.87, "learning_rate": 2.1113548578168386e-07, "loss": 0.8186, "step": 46229 }, { "epoch": 0.87, "learning_rate": 2.1107404566106438e-07, "loss": 0.9296, "step": 46230 }, { "epoch": 0.87, "learning_rate": 2.1101261408722456e-07, "loss": 0.9237, "step": 46231 }, { "epoch": 0.87, "learning_rate": 2.1095119106039257e-07, "loss": 0.6227, "step": 46232 }, { "epoch": 0.87, "learning_rate": 2.1088977658079933e-07, "loss": 1.0458, "step": 46233 }, { "epoch": 0.87, "learning_rate": 2.1082837064867385e-07, "loss": 0.6944, "step": 46234 }, { "epoch": 0.87, "learning_rate": 2.1076697326424395e-07, "loss": 0.9496, "step": 46235 }, { "epoch": 0.87, "learning_rate": 2.1070558442774114e-07, "loss": 0.8032, "step": 46236 }, { "epoch": 0.87, "learning_rate": 2.1064420413939273e-07, "loss": 1.0665, "step": 46237 }, { "epoch": 0.87, "learning_rate": 2.1058283239942884e-07, "loss": 1.066, "step": 46238 }, { "epoch": 0.87, "learning_rate": 2.105214692080787e-07, "loss": 0.8997, "step": 46239 }, { "epoch": 0.87, "learning_rate": 2.1046011456557074e-07, "loss": 0.9904, "step": 46240 }, { "epoch": 0.87, "learning_rate": 2.103987684721348e-07, "loss": 0.9255, "step": 46241 }, { "epoch": 0.87, "learning_rate": 2.1033743092799957e-07, "loss": 0.9641, "step": 46242 }, { "epoch": 0.87, "learning_rate": 2.102761019333946e-07, "loss": 0.868, "step": 46243 }, { "epoch": 0.87, "learning_rate": 2.1021478148854773e-07, "loss": 0.8939, "step": 46244 }, { "epoch": 0.87, "learning_rate": 2.1015346959368939e-07, "loss": 1.0027, "step": 46245 }, { "epoch": 0.87, "learning_rate": 2.1009216624904737e-07, "loss": 0.8413, "step": 46246 }, { "epoch": 0.87, "learning_rate": 2.1003087145485102e-07, "loss": 0.756, "step": 46247 }, { "epoch": 0.87, "learning_rate": 2.0996958521132926e-07, "loss": 0.9179, "step": 46248 }, { "epoch": 0.87, "learning_rate": 2.0990830751871083e-07, "loss": 0.9349, "step": 46249 }, { "epoch": 0.87, "learning_rate": 2.0984703837722442e-07, "loss": 1.1068, "step": 46250 }, { "epoch": 0.87, "learning_rate": 2.0978577778709902e-07, "loss": 0.9942, "step": 46251 }, { "epoch": 0.87, "learning_rate": 2.0972452574856362e-07, "loss": 0.8489, "step": 46252 }, { "epoch": 0.87, "learning_rate": 2.0966328226184608e-07, "loss": 0.8832, "step": 46253 }, { "epoch": 0.87, "learning_rate": 2.0960204732717565e-07, "loss": 0.8156, "step": 46254 }, { "epoch": 0.87, "learning_rate": 2.0954082094478163e-07, "loss": 0.9338, "step": 46255 }, { "epoch": 0.87, "learning_rate": 2.0947960311489103e-07, "loss": 0.9578, "step": 46256 }, { "epoch": 0.87, "learning_rate": 2.0941839383773422e-07, "loss": 0.8676, "step": 46257 }, { "epoch": 0.87, "learning_rate": 2.0935719311353852e-07, "loss": 0.6984, "step": 46258 }, { "epoch": 0.87, "learning_rate": 2.0929600094253294e-07, "loss": 0.8516, "step": 46259 }, { "epoch": 0.87, "learning_rate": 2.0923481732494561e-07, "loss": 0.9052, "step": 46260 }, { "epoch": 0.87, "learning_rate": 2.0917364226100552e-07, "loss": 0.6809, "step": 46261 }, { "epoch": 0.87, "learning_rate": 2.091124757509405e-07, "loss": 0.7734, "step": 46262 }, { "epoch": 0.87, "learning_rate": 2.0905131779497933e-07, "loss": 1.0334, "step": 46263 }, { "epoch": 0.87, "learning_rate": 2.0899016839335095e-07, "loss": 1.0256, "step": 46264 }, { "epoch": 0.87, "learning_rate": 2.0892902754628185e-07, "loss": 1.0386, "step": 46265 }, { "epoch": 0.87, "learning_rate": 2.0886789525400269e-07, "loss": 0.7815, "step": 46266 }, { "epoch": 0.87, "learning_rate": 2.0880677151673996e-07, "loss": 0.5899, "step": 46267 }, { "epoch": 0.87, "learning_rate": 2.087456563347226e-07, "loss": 0.9868, "step": 46268 }, { "epoch": 0.87, "learning_rate": 2.0868454970817854e-07, "loss": 1.0477, "step": 46269 }, { "epoch": 0.87, "learning_rate": 2.0862345163733617e-07, "loss": 0.8278, "step": 46270 }, { "epoch": 0.87, "learning_rate": 2.0856236212242363e-07, "loss": 0.8553, "step": 46271 }, { "epoch": 0.87, "learning_rate": 2.0850128116366885e-07, "loss": 0.7576, "step": 46272 }, { "epoch": 0.87, "learning_rate": 2.0844020876130024e-07, "loss": 0.8928, "step": 46273 }, { "epoch": 0.87, "learning_rate": 2.083791449155456e-07, "loss": 0.9395, "step": 46274 }, { "epoch": 0.87, "learning_rate": 2.0831808962663291e-07, "loss": 0.8651, "step": 46275 }, { "epoch": 0.87, "learning_rate": 2.0825704289479055e-07, "loss": 0.9533, "step": 46276 }, { "epoch": 0.87, "learning_rate": 2.0819600472024525e-07, "loss": 0.9075, "step": 46277 }, { "epoch": 0.87, "learning_rate": 2.081349751032269e-07, "loss": 0.969, "step": 46278 }, { "epoch": 0.87, "learning_rate": 2.0807395404396162e-07, "loss": 0.834, "step": 46279 }, { "epoch": 0.87, "learning_rate": 2.0801294154267794e-07, "loss": 0.921, "step": 46280 }, { "epoch": 0.87, "learning_rate": 2.0795193759960363e-07, "loss": 1.0815, "step": 46281 }, { "epoch": 0.87, "learning_rate": 2.0789094221496663e-07, "loss": 0.9088, "step": 46282 }, { "epoch": 0.87, "learning_rate": 2.0782995538899453e-07, "loss": 0.9163, "step": 46283 }, { "epoch": 0.87, "learning_rate": 2.0776897712191518e-07, "loss": 0.7889, "step": 46284 }, { "epoch": 0.87, "learning_rate": 2.0770800741395675e-07, "loss": 0.8763, "step": 46285 }, { "epoch": 0.87, "learning_rate": 2.0764704626534516e-07, "loss": 0.8205, "step": 46286 }, { "epoch": 0.87, "learning_rate": 2.075860936763102e-07, "loss": 0.8786, "step": 46287 }, { "epoch": 0.87, "learning_rate": 2.0752514964707815e-07, "loss": 0.9568, "step": 46288 }, { "epoch": 0.87, "learning_rate": 2.0746421417787628e-07, "loss": 1.0033, "step": 46289 }, { "epoch": 0.87, "learning_rate": 2.0740328726893355e-07, "loss": 0.797, "step": 46290 }, { "epoch": 0.87, "learning_rate": 2.073423689204765e-07, "loss": 0.8312, "step": 46291 }, { "epoch": 0.87, "learning_rate": 2.0728145913273267e-07, "loss": 0.7542, "step": 46292 }, { "epoch": 0.87, "learning_rate": 2.0722055790592943e-07, "loss": 0.888, "step": 46293 }, { "epoch": 0.87, "learning_rate": 2.0715966524029434e-07, "loss": 1.0019, "step": 46294 }, { "epoch": 0.87, "learning_rate": 2.0709878113605503e-07, "loss": 0.839, "step": 46295 }, { "epoch": 0.87, "learning_rate": 2.0703790559343822e-07, "loss": 0.8768, "step": 46296 }, { "epoch": 0.87, "learning_rate": 2.069770386126721e-07, "loss": 0.8486, "step": 46297 }, { "epoch": 0.87, "learning_rate": 2.0691618019398258e-07, "loss": 0.8059, "step": 46298 }, { "epoch": 0.87, "learning_rate": 2.0685533033759863e-07, "loss": 1.1132, "step": 46299 }, { "epoch": 0.87, "learning_rate": 2.0679448904374623e-07, "loss": 1.0495, "step": 46300 }, { "epoch": 0.87, "learning_rate": 2.067336563126529e-07, "loss": 1.0361, "step": 46301 }, { "epoch": 0.87, "learning_rate": 2.0667283214454547e-07, "loss": 0.913, "step": 46302 }, { "epoch": 0.87, "learning_rate": 2.066120165396518e-07, "loss": 0.9111, "step": 46303 }, { "epoch": 0.87, "learning_rate": 2.0655120949819833e-07, "loss": 0.8602, "step": 46304 }, { "epoch": 0.87, "learning_rate": 2.0649041102041217e-07, "loss": 1.0694, "step": 46305 }, { "epoch": 0.87, "learning_rate": 2.0642962110652115e-07, "loss": 0.7921, "step": 46306 }, { "epoch": 0.87, "learning_rate": 2.0636883975675065e-07, "loss": 1.2372, "step": 46307 }, { "epoch": 0.87, "learning_rate": 2.063080669713294e-07, "loss": 0.9628, "step": 46308 }, { "epoch": 0.87, "learning_rate": 2.0624730275048328e-07, "loss": 0.748, "step": 46309 }, { "epoch": 0.87, "learning_rate": 2.0618654709443882e-07, "loss": 0.8072, "step": 46310 }, { "epoch": 0.87, "learning_rate": 2.0612580000342415e-07, "loss": 0.9442, "step": 46311 }, { "epoch": 0.87, "learning_rate": 2.060650614776652e-07, "loss": 0.9388, "step": 46312 }, { "epoch": 0.87, "learning_rate": 2.06004331517389e-07, "loss": 0.9792, "step": 46313 }, { "epoch": 0.87, "learning_rate": 2.059436101228221e-07, "loss": 1.0947, "step": 46314 }, { "epoch": 0.87, "learning_rate": 2.0588289729419147e-07, "loss": 0.9264, "step": 46315 }, { "epoch": 0.87, "learning_rate": 2.058221930317239e-07, "loss": 0.8286, "step": 46316 }, { "epoch": 0.87, "learning_rate": 2.0576149733564587e-07, "loss": 0.903, "step": 46317 }, { "epoch": 0.87, "learning_rate": 2.0570081020618444e-07, "loss": 1.0633, "step": 46318 }, { "epoch": 0.87, "learning_rate": 2.056401316435652e-07, "loss": 0.9093, "step": 46319 }, { "epoch": 0.87, "learning_rate": 2.0557946164801585e-07, "loss": 0.9174, "step": 46320 }, { "epoch": 0.87, "learning_rate": 2.0551880021976224e-07, "loss": 0.7733, "step": 46321 }, { "epoch": 0.87, "learning_rate": 2.0545814735903113e-07, "loss": 0.8659, "step": 46322 }, { "epoch": 0.87, "learning_rate": 2.0539750306604876e-07, "loss": 0.7737, "step": 46323 }, { "epoch": 0.87, "learning_rate": 2.053368673410419e-07, "loss": 0.9592, "step": 46324 }, { "epoch": 0.87, "learning_rate": 2.0527624018423675e-07, "loss": 1.3145, "step": 46325 }, { "epoch": 0.87, "learning_rate": 2.0521562159585978e-07, "loss": 0.9159, "step": 46326 }, { "epoch": 0.87, "learning_rate": 2.0515501157613776e-07, "loss": 0.7, "step": 46327 }, { "epoch": 0.87, "learning_rate": 2.050944101252958e-07, "loss": 0.7189, "step": 46328 }, { "epoch": 0.87, "learning_rate": 2.0503381724356176e-07, "loss": 0.7355, "step": 46329 }, { "epoch": 0.87, "learning_rate": 2.0497323293116046e-07, "loss": 0.9967, "step": 46330 }, { "epoch": 0.87, "learning_rate": 2.0491265718831864e-07, "loss": 1.2139, "step": 46331 }, { "epoch": 0.87, "learning_rate": 2.0485209001526313e-07, "loss": 0.9638, "step": 46332 }, { "epoch": 0.87, "learning_rate": 2.0479153141221924e-07, "loss": 0.8839, "step": 46333 }, { "epoch": 0.87, "learning_rate": 2.047309813794135e-07, "loss": 0.9818, "step": 46334 }, { "epoch": 0.87, "learning_rate": 2.046704399170718e-07, "loss": 0.8998, "step": 46335 }, { "epoch": 0.87, "learning_rate": 2.046099070254204e-07, "loss": 0.7466, "step": 46336 }, { "epoch": 0.87, "learning_rate": 2.0454938270468517e-07, "loss": 0.9209, "step": 46337 }, { "epoch": 0.87, "learning_rate": 2.0448886695509208e-07, "loss": 1.0675, "step": 46338 }, { "epoch": 0.87, "learning_rate": 2.0442835977686758e-07, "loss": 0.8442, "step": 46339 }, { "epoch": 0.87, "learning_rate": 2.0436786117023654e-07, "loss": 0.8349, "step": 46340 }, { "epoch": 0.87, "learning_rate": 2.0430737113542625e-07, "loss": 0.894, "step": 46341 }, { "epoch": 0.87, "learning_rate": 2.0424688967266127e-07, "loss": 0.7413, "step": 46342 }, { "epoch": 0.87, "learning_rate": 2.0418641678216833e-07, "loss": 1.0311, "step": 46343 }, { "epoch": 0.87, "learning_rate": 2.0412595246417283e-07, "loss": 1.079, "step": 46344 }, { "epoch": 0.87, "learning_rate": 2.0406549671890041e-07, "loss": 1.0349, "step": 46345 }, { "epoch": 0.87, "learning_rate": 2.0400504954657757e-07, "loss": 0.8862, "step": 46346 }, { "epoch": 0.87, "learning_rate": 2.0394461094742886e-07, "loss": 0.9412, "step": 46347 }, { "epoch": 0.87, "learning_rate": 2.0388418092168126e-07, "loss": 0.8163, "step": 46348 }, { "epoch": 0.87, "learning_rate": 2.0382375946955913e-07, "loss": 0.9653, "step": 46349 }, { "epoch": 0.87, "learning_rate": 2.0376334659128888e-07, "loss": 1.1146, "step": 46350 }, { "epoch": 0.87, "learning_rate": 2.0370294228709592e-07, "loss": 0.9063, "step": 46351 }, { "epoch": 0.87, "learning_rate": 2.036425465572056e-07, "loss": 0.9153, "step": 46352 }, { "epoch": 0.87, "learning_rate": 2.0358215940184362e-07, "loss": 0.7325, "step": 46353 }, { "epoch": 0.87, "learning_rate": 2.035217808212356e-07, "loss": 0.8684, "step": 46354 }, { "epoch": 0.87, "learning_rate": 2.0346141081560715e-07, "loss": 1.0085, "step": 46355 }, { "epoch": 0.87, "learning_rate": 2.0340104938518262e-07, "loss": 1.1558, "step": 46356 }, { "epoch": 0.87, "learning_rate": 2.0334069653018844e-07, "loss": 1.0183, "step": 46357 }, { "epoch": 0.87, "learning_rate": 2.032803522508503e-07, "loss": 0.8852, "step": 46358 }, { "epoch": 0.87, "learning_rate": 2.0322001654739189e-07, "loss": 0.9884, "step": 46359 }, { "epoch": 0.87, "learning_rate": 2.031596894200405e-07, "loss": 0.8262, "step": 46360 }, { "epoch": 0.87, "learning_rate": 2.0309937086901986e-07, "loss": 0.8222, "step": 46361 }, { "epoch": 0.87, "learning_rate": 2.0303906089455565e-07, "loss": 1.1696, "step": 46362 }, { "epoch": 0.87, "learning_rate": 2.029787594968735e-07, "loss": 0.9758, "step": 46363 }, { "epoch": 0.87, "learning_rate": 2.0291846667619796e-07, "loss": 0.8842, "step": 46364 }, { "epoch": 0.87, "learning_rate": 2.028581824327544e-07, "loss": 0.9536, "step": 46365 }, { "epoch": 0.87, "learning_rate": 2.027979067667682e-07, "loss": 0.8508, "step": 46366 }, { "epoch": 0.87, "learning_rate": 2.0273763967846443e-07, "loss": 0.7766, "step": 46367 }, { "epoch": 0.87, "learning_rate": 2.0267738116806713e-07, "loss": 1.0588, "step": 46368 }, { "epoch": 0.87, "learning_rate": 2.0261713123580274e-07, "loss": 1.0621, "step": 46369 }, { "epoch": 0.87, "learning_rate": 2.0255688988189526e-07, "loss": 0.9438, "step": 46370 }, { "epoch": 0.87, "learning_rate": 2.0249665710656978e-07, "loss": 0.7937, "step": 46371 }, { "epoch": 0.87, "learning_rate": 2.0243643291005144e-07, "loss": 0.6385, "step": 46372 }, { "epoch": 0.87, "learning_rate": 2.0237621729256503e-07, "loss": 1.0217, "step": 46373 }, { "epoch": 0.87, "learning_rate": 2.0231601025433533e-07, "loss": 1.0412, "step": 46374 }, { "epoch": 0.87, "learning_rate": 2.0225581179558722e-07, "loss": 1.0432, "step": 46375 }, { "epoch": 0.87, "learning_rate": 2.0219562191654608e-07, "loss": 1.0062, "step": 46376 }, { "epoch": 0.87, "learning_rate": 2.0213544061743502e-07, "loss": 0.952, "step": 46377 }, { "epoch": 0.88, "learning_rate": 2.0207526789847999e-07, "loss": 0.9153, "step": 46378 }, { "epoch": 0.88, "learning_rate": 2.0201510375990608e-07, "loss": 0.9111, "step": 46379 }, { "epoch": 0.88, "learning_rate": 2.0195494820193645e-07, "loss": 0.8901, "step": 46380 }, { "epoch": 0.88, "learning_rate": 2.018948012247976e-07, "loss": 0.9065, "step": 46381 }, { "epoch": 0.88, "learning_rate": 2.018346628287124e-07, "loss": 0.9498, "step": 46382 }, { "epoch": 0.88, "learning_rate": 2.017745330139062e-07, "loss": 0.8698, "step": 46383 }, { "epoch": 0.88, "learning_rate": 2.0171441178060331e-07, "loss": 0.9377, "step": 46384 }, { "epoch": 0.88, "learning_rate": 2.0165429912902852e-07, "loss": 0.7325, "step": 46385 }, { "epoch": 0.88, "learning_rate": 2.015941950594061e-07, "loss": 0.868, "step": 46386 }, { "epoch": 0.88, "learning_rate": 2.0153409957196058e-07, "loss": 1.1155, "step": 46387 }, { "epoch": 0.88, "learning_rate": 2.014740126669165e-07, "loss": 0.9383, "step": 46388 }, { "epoch": 0.88, "learning_rate": 2.0141393434449707e-07, "loss": 0.9805, "step": 46389 }, { "epoch": 0.88, "learning_rate": 2.0135386460492846e-07, "loss": 1.0274, "step": 46390 }, { "epoch": 0.88, "learning_rate": 2.012938034484338e-07, "loss": 0.8859, "step": 46391 }, { "epoch": 0.88, "learning_rate": 2.0123375087523738e-07, "loss": 0.8414, "step": 46392 }, { "epoch": 0.88, "learning_rate": 2.0117370688556375e-07, "loss": 1.1798, "step": 46393 }, { "epoch": 0.88, "learning_rate": 2.011136714796369e-07, "loss": 1.0382, "step": 46394 }, { "epoch": 0.88, "learning_rate": 2.0105364465768106e-07, "loss": 1.0483, "step": 46395 }, { "epoch": 0.88, "learning_rate": 2.0099362641992082e-07, "loss": 1.0649, "step": 46396 }, { "epoch": 0.88, "learning_rate": 2.0093361676657985e-07, "loss": 0.8022, "step": 46397 }, { "epoch": 0.88, "learning_rate": 2.008736156978816e-07, "loss": 0.7781, "step": 46398 }, { "epoch": 0.88, "learning_rate": 2.0081362321405118e-07, "loss": 0.8478, "step": 46399 }, { "epoch": 0.88, "learning_rate": 2.0075363931531282e-07, "loss": 1.0162, "step": 46400 }, { "epoch": 0.88, "learning_rate": 2.006936640018889e-07, "loss": 1.0461, "step": 46401 }, { "epoch": 0.88, "learning_rate": 2.00633697274005e-07, "loss": 0.881, "step": 46402 }, { "epoch": 0.88, "learning_rate": 2.005737391318843e-07, "loss": 0.9294, "step": 46403 }, { "epoch": 0.88, "learning_rate": 2.0051378957575058e-07, "loss": 0.7358, "step": 46404 }, { "epoch": 0.88, "learning_rate": 2.0045384860582772e-07, "loss": 1.138, "step": 46405 }, { "epoch": 0.88, "learning_rate": 2.0039391622233977e-07, "loss": 0.8835, "step": 46406 }, { "epoch": 0.88, "learning_rate": 2.0033399242551044e-07, "loss": 0.9543, "step": 46407 }, { "epoch": 0.88, "learning_rate": 2.002740772155637e-07, "loss": 0.8855, "step": 46408 }, { "epoch": 0.88, "learning_rate": 2.0021417059272325e-07, "loss": 0.8076, "step": 46409 }, { "epoch": 0.88, "learning_rate": 2.001542725572117e-07, "loss": 0.9149, "step": 46410 }, { "epoch": 0.88, "learning_rate": 2.0009438310925444e-07, "loss": 0.8802, "step": 46411 }, { "epoch": 0.88, "learning_rate": 2.0003450224907377e-07, "loss": 0.8756, "step": 46412 }, { "epoch": 0.88, "learning_rate": 1.99974629976894e-07, "loss": 0.8187, "step": 46413 }, { "epoch": 0.88, "learning_rate": 1.9991476629293822e-07, "loss": 0.9129, "step": 46414 }, { "epoch": 0.88, "learning_rate": 1.9985491119743018e-07, "loss": 0.9496, "step": 46415 }, { "epoch": 0.88, "learning_rate": 1.9979506469059328e-07, "loss": 0.8624, "step": 46416 }, { "epoch": 0.88, "learning_rate": 1.9973522677265129e-07, "loss": 0.69, "step": 46417 }, { "epoch": 0.88, "learning_rate": 1.9967539744382785e-07, "loss": 1.0646, "step": 46418 }, { "epoch": 0.88, "learning_rate": 1.9961557670434506e-07, "loss": 1.131, "step": 46419 }, { "epoch": 0.88, "learning_rate": 1.995557645544277e-07, "loss": 0.7887, "step": 46420 }, { "epoch": 0.88, "learning_rate": 1.994959609942987e-07, "loss": 1.0382, "step": 46421 }, { "epoch": 0.88, "learning_rate": 1.994361660241806e-07, "loss": 1.0228, "step": 46422 }, { "epoch": 0.88, "learning_rate": 1.9937637964429823e-07, "loss": 0.9312, "step": 46423 }, { "epoch": 0.88, "learning_rate": 1.993166018548734e-07, "loss": 0.9944, "step": 46424 }, { "epoch": 0.88, "learning_rate": 1.9925683265613006e-07, "loss": 1.2512, "step": 46425 }, { "epoch": 0.88, "learning_rate": 1.991970720482908e-07, "loss": 0.727, "step": 46426 }, { "epoch": 0.88, "learning_rate": 1.9913732003157936e-07, "loss": 0.8149, "step": 46427 }, { "epoch": 0.88, "learning_rate": 1.9907757660621862e-07, "loss": 0.7833, "step": 46428 }, { "epoch": 0.88, "learning_rate": 1.9901784177243144e-07, "loss": 1.0037, "step": 46429 }, { "epoch": 0.88, "learning_rate": 1.989581155304418e-07, "loss": 0.7454, "step": 46430 }, { "epoch": 0.88, "learning_rate": 1.9889839788047095e-07, "loss": 1.0425, "step": 46431 }, { "epoch": 0.88, "learning_rate": 1.9883868882274394e-07, "loss": 0.9232, "step": 46432 }, { "epoch": 0.88, "learning_rate": 1.9877898835748228e-07, "loss": 0.8203, "step": 46433 }, { "epoch": 0.88, "learning_rate": 1.987192964849091e-07, "loss": 0.8631, "step": 46434 }, { "epoch": 0.88, "learning_rate": 1.9865961320524763e-07, "loss": 0.8858, "step": 46435 }, { "epoch": 0.88, "learning_rate": 1.9859993851872068e-07, "loss": 0.6392, "step": 46436 }, { "epoch": 0.88, "learning_rate": 1.9854027242555085e-07, "loss": 0.9483, "step": 46437 }, { "epoch": 0.88, "learning_rate": 1.9848061492596132e-07, "loss": 0.8857, "step": 46438 }, { "epoch": 0.88, "learning_rate": 1.984209660201747e-07, "loss": 0.8143, "step": 46439 }, { "epoch": 0.88, "learning_rate": 1.98361325708413e-07, "loss": 0.9292, "step": 46440 }, { "epoch": 0.88, "learning_rate": 1.9830169399089993e-07, "loss": 0.8859, "step": 46441 }, { "epoch": 0.88, "learning_rate": 1.9824207086785812e-07, "loss": 0.7097, "step": 46442 }, { "epoch": 0.88, "learning_rate": 1.9818245633950905e-07, "loss": 1.1891, "step": 46443 }, { "epoch": 0.88, "learning_rate": 1.9812285040607698e-07, "loss": 0.9723, "step": 46444 }, { "epoch": 0.88, "learning_rate": 1.980632530677834e-07, "loss": 0.9356, "step": 46445 }, { "epoch": 0.88, "learning_rate": 1.9800366432485064e-07, "loss": 0.7366, "step": 46446 }, { "epoch": 0.88, "learning_rate": 1.9794408417750182e-07, "loss": 0.8468, "step": 46447 }, { "epoch": 0.88, "learning_rate": 1.978845126259593e-07, "loss": 0.8518, "step": 46448 }, { "epoch": 0.88, "learning_rate": 1.978249496704454e-07, "loss": 0.9718, "step": 46449 }, { "epoch": 0.88, "learning_rate": 1.9776539531118244e-07, "loss": 1.0251, "step": 46450 }, { "epoch": 0.88, "learning_rate": 1.977058495483933e-07, "loss": 0.7867, "step": 46451 }, { "epoch": 0.88, "learning_rate": 1.9764631238229915e-07, "loss": 0.878, "step": 46452 }, { "epoch": 0.88, "learning_rate": 1.97586783813124e-07, "loss": 0.9521, "step": 46453 }, { "epoch": 0.88, "learning_rate": 1.9752726384108857e-07, "loss": 0.8765, "step": 46454 }, { "epoch": 0.88, "learning_rate": 1.9746775246641592e-07, "loss": 0.9623, "step": 46455 }, { "epoch": 0.88, "learning_rate": 1.9740824968932787e-07, "loss": 1.0578, "step": 46456 }, { "epoch": 0.88, "learning_rate": 1.9734875551004702e-07, "loss": 0.8942, "step": 46457 }, { "epoch": 0.88, "learning_rate": 1.9728926992879538e-07, "loss": 0.7807, "step": 46458 }, { "epoch": 0.88, "learning_rate": 1.9722979294579475e-07, "loss": 0.723, "step": 46459 }, { "epoch": 0.88, "learning_rate": 1.9717032456126827e-07, "loss": 0.78, "step": 46460 }, { "epoch": 0.88, "learning_rate": 1.9711086477543606e-07, "loss": 0.7024, "step": 46461 }, { "epoch": 0.88, "learning_rate": 1.970514135885218e-07, "loss": 1.1124, "step": 46462 }, { "epoch": 0.88, "learning_rate": 1.969919710007473e-07, "loss": 1.1296, "step": 46463 }, { "epoch": 0.88, "learning_rate": 1.9693253701233317e-07, "loss": 0.9681, "step": 46464 }, { "epoch": 0.88, "learning_rate": 1.968731116235034e-07, "loss": 0.9361, "step": 46465 }, { "epoch": 0.88, "learning_rate": 1.9681369483447844e-07, "loss": 0.9368, "step": 46466 }, { "epoch": 0.88, "learning_rate": 1.9675428664548053e-07, "loss": 0.8427, "step": 46467 }, { "epoch": 0.88, "learning_rate": 1.9669488705673119e-07, "loss": 1.175, "step": 46468 }, { "epoch": 0.88, "learning_rate": 1.9663549606845272e-07, "loss": 1.0505, "step": 46469 }, { "epoch": 0.88, "learning_rate": 1.9657611368086693e-07, "loss": 0.8112, "step": 46470 }, { "epoch": 0.88, "learning_rate": 1.9651673989419502e-07, "loss": 0.8208, "step": 46471 }, { "epoch": 0.88, "learning_rate": 1.9645737470865956e-07, "loss": 0.8357, "step": 46472 }, { "epoch": 0.88, "learning_rate": 1.9639801812448067e-07, "loss": 0.7949, "step": 46473 }, { "epoch": 0.88, "learning_rate": 1.963386701418818e-07, "loss": 1.0438, "step": 46474 }, { "epoch": 0.88, "learning_rate": 1.962793307610833e-07, "loss": 0.9733, "step": 46475 }, { "epoch": 0.88, "learning_rate": 1.9621999998230696e-07, "loss": 1.0833, "step": 46476 }, { "epoch": 0.88, "learning_rate": 1.961606778057748e-07, "loss": 0.9315, "step": 46477 }, { "epoch": 0.88, "learning_rate": 1.9610136423170778e-07, "loss": 0.9273, "step": 46478 }, { "epoch": 0.88, "learning_rate": 1.9604205926032793e-07, "loss": 0.8425, "step": 46479 }, { "epoch": 0.88, "learning_rate": 1.9598276289185618e-07, "loss": 0.955, "step": 46480 }, { "epoch": 0.88, "learning_rate": 1.9592347512651462e-07, "loss": 1.0046, "step": 46481 }, { "epoch": 0.88, "learning_rate": 1.9586419596452328e-07, "loss": 0.9651, "step": 46482 }, { "epoch": 0.88, "learning_rate": 1.958049254061048e-07, "loss": 0.7758, "step": 46483 }, { "epoch": 0.88, "learning_rate": 1.9574566345148066e-07, "loss": 0.8036, "step": 46484 }, { "epoch": 0.88, "learning_rate": 1.9568641010087043e-07, "loss": 1.0013, "step": 46485 }, { "epoch": 0.88, "learning_rate": 1.956271653544975e-07, "loss": 0.8021, "step": 46486 }, { "epoch": 0.88, "learning_rate": 1.9556792921258171e-07, "loss": 1.137, "step": 46487 }, { "epoch": 0.88, "learning_rate": 1.955087016753446e-07, "loss": 0.8174, "step": 46488 }, { "epoch": 0.88, "learning_rate": 1.954494827430073e-07, "loss": 0.9891, "step": 46489 }, { "epoch": 0.88, "learning_rate": 1.9539027241579107e-07, "loss": 0.8322, "step": 46490 }, { "epoch": 0.88, "learning_rate": 1.9533107069391682e-07, "loss": 1.058, "step": 46491 }, { "epoch": 0.88, "learning_rate": 1.952718775776055e-07, "loss": 0.876, "step": 46492 }, { "epoch": 0.88, "learning_rate": 1.952126930670789e-07, "loss": 1.0588, "step": 46493 }, { "epoch": 0.88, "learning_rate": 1.9515351716255682e-07, "loss": 0.9406, "step": 46494 }, { "epoch": 0.88, "learning_rate": 1.950943498642613e-07, "loss": 1.0159, "step": 46495 }, { "epoch": 0.88, "learning_rate": 1.950351911724127e-07, "loss": 0.7084, "step": 46496 }, { "epoch": 0.88, "learning_rate": 1.94976041087232e-07, "loss": 0.7763, "step": 46497 }, { "epoch": 0.88, "learning_rate": 1.9491689960893982e-07, "loss": 0.749, "step": 46498 }, { "epoch": 0.88, "learning_rate": 1.9485776673775742e-07, "loss": 0.8484, "step": 46499 }, { "epoch": 0.88, "learning_rate": 1.947986424739054e-07, "loss": 1.1836, "step": 46500 }, { "epoch": 0.88, "learning_rate": 1.9473952681760473e-07, "loss": 0.9116, "step": 46501 }, { "epoch": 0.88, "learning_rate": 1.946804197690763e-07, "loss": 0.6809, "step": 46502 }, { "epoch": 0.88, "learning_rate": 1.9462132132853973e-07, "loss": 1.0601, "step": 46503 }, { "epoch": 0.88, "learning_rate": 1.945622314962167e-07, "loss": 0.7818, "step": 46504 }, { "epoch": 0.88, "learning_rate": 1.9450315027232823e-07, "loss": 0.7858, "step": 46505 }, { "epoch": 0.88, "learning_rate": 1.9444407765709328e-07, "loss": 1.0477, "step": 46506 }, { "epoch": 0.88, "learning_rate": 1.943850136507344e-07, "loss": 1.0419, "step": 46507 }, { "epoch": 0.88, "learning_rate": 1.9432595825347066e-07, "loss": 1.0333, "step": 46508 }, { "epoch": 0.88, "learning_rate": 1.9426691146552324e-07, "loss": 0.9449, "step": 46509 }, { "epoch": 0.88, "learning_rate": 1.942078732871125e-07, "loss": 0.8369, "step": 46510 }, { "epoch": 0.88, "learning_rate": 1.941488437184588e-07, "loss": 0.7759, "step": 46511 }, { "epoch": 0.88, "learning_rate": 1.940898227597826e-07, "loss": 1.0856, "step": 46512 }, { "epoch": 0.88, "learning_rate": 1.9403081041130422e-07, "loss": 1.0891, "step": 46513 }, { "epoch": 0.88, "learning_rate": 1.939718066732449e-07, "loss": 0.9959, "step": 46514 }, { "epoch": 0.88, "learning_rate": 1.9391281154582276e-07, "loss": 0.7382, "step": 46515 }, { "epoch": 0.88, "learning_rate": 1.938538250292607e-07, "loss": 0.8641, "step": 46516 }, { "epoch": 0.88, "learning_rate": 1.9379484712377716e-07, "loss": 0.9534, "step": 46517 }, { "epoch": 0.88, "learning_rate": 1.9373587782959308e-07, "loss": 0.9584, "step": 46518 }, { "epoch": 0.88, "learning_rate": 1.9367691714692828e-07, "loss": 0.9986, "step": 46519 }, { "epoch": 0.88, "learning_rate": 1.9361796507600338e-07, "loss": 0.7363, "step": 46520 }, { "epoch": 0.88, "learning_rate": 1.9355902161703827e-07, "loss": 0.7731, "step": 46521 }, { "epoch": 0.88, "learning_rate": 1.93500086770253e-07, "loss": 1.0113, "step": 46522 }, { "epoch": 0.88, "learning_rate": 1.9344116053586797e-07, "loss": 0.8232, "step": 46523 }, { "epoch": 0.88, "learning_rate": 1.9338224291410245e-07, "loss": 0.8726, "step": 46524 }, { "epoch": 0.88, "learning_rate": 1.933233339051771e-07, "loss": 1.1859, "step": 46525 }, { "epoch": 0.88, "learning_rate": 1.93264433509312e-07, "loss": 0.8185, "step": 46526 }, { "epoch": 0.88, "learning_rate": 1.9320554172672618e-07, "loss": 0.879, "step": 46527 }, { "epoch": 0.88, "learning_rate": 1.931466585576408e-07, "loss": 0.9405, "step": 46528 }, { "epoch": 0.88, "learning_rate": 1.9308778400227463e-07, "loss": 0.8026, "step": 46529 }, { "epoch": 0.88, "learning_rate": 1.93028918060848e-07, "loss": 1.0723, "step": 46530 }, { "epoch": 0.88, "learning_rate": 1.9297006073358076e-07, "loss": 0.9327, "step": 46531 }, { "epoch": 0.88, "learning_rate": 1.9291121202069246e-07, "loss": 0.9808, "step": 46532 }, { "epoch": 0.88, "learning_rate": 1.928523719224032e-07, "loss": 0.9843, "step": 46533 }, { "epoch": 0.88, "learning_rate": 1.9279354043893223e-07, "loss": 0.883, "step": 46534 }, { "epoch": 0.88, "learning_rate": 1.9273471757049966e-07, "loss": 0.9713, "step": 46535 }, { "epoch": 0.88, "learning_rate": 1.926759033173245e-07, "loss": 0.7639, "step": 46536 }, { "epoch": 0.88, "learning_rate": 1.9261709767962739e-07, "loss": 1.0158, "step": 46537 }, { "epoch": 0.88, "learning_rate": 1.9255830065762677e-07, "loss": 1.0329, "step": 46538 }, { "epoch": 0.88, "learning_rate": 1.9249951225154273e-07, "loss": 1.0776, "step": 46539 }, { "epoch": 0.88, "learning_rate": 1.9244073246159484e-07, "loss": 0.9742, "step": 46540 }, { "epoch": 0.88, "learning_rate": 1.9238196128800264e-07, "loss": 0.8597, "step": 46541 }, { "epoch": 0.88, "learning_rate": 1.9232319873098538e-07, "loss": 0.7183, "step": 46542 }, { "epoch": 0.88, "learning_rate": 1.9226444479076233e-07, "loss": 1.1368, "step": 46543 }, { "epoch": 0.88, "learning_rate": 1.9220569946755362e-07, "loss": 1.0531, "step": 46544 }, { "epoch": 0.88, "learning_rate": 1.921469627615774e-07, "loss": 1.0, "step": 46545 }, { "epoch": 0.88, "learning_rate": 1.9208823467305375e-07, "loss": 0.9789, "step": 46546 }, { "epoch": 0.88, "learning_rate": 1.9202951520220253e-07, "loss": 0.9909, "step": 46547 }, { "epoch": 0.88, "learning_rate": 1.9197080434924158e-07, "loss": 0.8236, "step": 46548 }, { "epoch": 0.88, "learning_rate": 1.919121021143916e-07, "loss": 0.9737, "step": 46549 }, { "epoch": 0.88, "learning_rate": 1.918534084978707e-07, "loss": 0.9824, "step": 46550 }, { "epoch": 0.88, "learning_rate": 1.917947234998982e-07, "loss": 0.9316, "step": 46551 }, { "epoch": 0.88, "learning_rate": 1.917360471206936e-07, "loss": 0.9438, "step": 46552 }, { "epoch": 0.88, "learning_rate": 1.9167737936047565e-07, "loss": 0.9441, "step": 46553 }, { "epoch": 0.88, "learning_rate": 1.9161872021946386e-07, "loss": 0.6978, "step": 46554 }, { "epoch": 0.88, "learning_rate": 1.91560069697877e-07, "loss": 1.0208, "step": 46555 }, { "epoch": 0.88, "learning_rate": 1.9150142779593428e-07, "loss": 0.9314, "step": 46556 }, { "epoch": 0.88, "learning_rate": 1.9144279451385362e-07, "loss": 1.0508, "step": 46557 }, { "epoch": 0.88, "learning_rate": 1.9138416985185565e-07, "loss": 0.8944, "step": 46558 }, { "epoch": 0.88, "learning_rate": 1.91325553810158e-07, "loss": 0.8675, "step": 46559 }, { "epoch": 0.88, "learning_rate": 1.912669463889799e-07, "loss": 0.7799, "step": 46560 }, { "epoch": 0.88, "learning_rate": 1.912083475885404e-07, "loss": 1.0346, "step": 46561 }, { "epoch": 0.88, "learning_rate": 1.9114975740905816e-07, "loss": 1.0049, "step": 46562 }, { "epoch": 0.88, "learning_rate": 1.9109117585075166e-07, "loss": 0.9507, "step": 46563 }, { "epoch": 0.88, "learning_rate": 1.9103260291384013e-07, "loss": 1.0245, "step": 46564 }, { "epoch": 0.88, "learning_rate": 1.909740385985423e-07, "loss": 0.9562, "step": 46565 }, { "epoch": 0.88, "learning_rate": 1.9091548290507605e-07, "loss": 0.7542, "step": 46566 }, { "epoch": 0.88, "learning_rate": 1.9085693583366095e-07, "loss": 0.8066, "step": 46567 }, { "epoch": 0.88, "learning_rate": 1.907983973845154e-07, "loss": 1.0016, "step": 46568 }, { "epoch": 0.88, "learning_rate": 1.907398675578573e-07, "loss": 0.9485, "step": 46569 }, { "epoch": 0.88, "learning_rate": 1.9068134635390646e-07, "loss": 0.9237, "step": 46570 }, { "epoch": 0.88, "learning_rate": 1.9062283377288022e-07, "loss": 0.7694, "step": 46571 }, { "epoch": 0.88, "learning_rate": 1.9056432981499757e-07, "loss": 0.8192, "step": 46572 }, { "epoch": 0.88, "learning_rate": 1.9050583448047667e-07, "loss": 0.8647, "step": 46573 }, { "epoch": 0.88, "learning_rate": 1.904473477695365e-07, "loss": 0.8131, "step": 46574 }, { "epoch": 0.88, "learning_rate": 1.9038886968239494e-07, "loss": 0.9748, "step": 46575 }, { "epoch": 0.88, "learning_rate": 1.9033040021927047e-07, "loss": 0.9833, "step": 46576 }, { "epoch": 0.88, "learning_rate": 1.9027193938038202e-07, "loss": 0.7546, "step": 46577 }, { "epoch": 0.88, "learning_rate": 1.9021348716594694e-07, "loss": 0.899, "step": 46578 }, { "epoch": 0.88, "learning_rate": 1.901550435761837e-07, "loss": 0.7647, "step": 46579 }, { "epoch": 0.88, "learning_rate": 1.9009660861131095e-07, "loss": 0.9498, "step": 46580 }, { "epoch": 0.88, "learning_rate": 1.9003818227154634e-07, "loss": 0.9338, "step": 46581 }, { "epoch": 0.88, "learning_rate": 1.8997976455710858e-07, "loss": 0.9187, "step": 46582 }, { "epoch": 0.88, "learning_rate": 1.8992135546821555e-07, "loss": 1.0399, "step": 46583 }, { "epoch": 0.88, "learning_rate": 1.8986295500508567e-07, "loss": 1.0609, "step": 46584 }, { "epoch": 0.88, "learning_rate": 1.89804563167936e-07, "loss": 0.7219, "step": 46585 }, { "epoch": 0.88, "learning_rate": 1.897461799569858e-07, "loss": 0.8459, "step": 46586 }, { "epoch": 0.88, "learning_rate": 1.896878053724524e-07, "loss": 1.1276, "step": 46587 }, { "epoch": 0.88, "learning_rate": 1.8962943941455342e-07, "loss": 0.9451, "step": 46588 }, { "epoch": 0.88, "learning_rate": 1.895710820835081e-07, "loss": 0.9235, "step": 46589 }, { "epoch": 0.88, "learning_rate": 1.8951273337953296e-07, "loss": 0.8137, "step": 46590 }, { "epoch": 0.88, "learning_rate": 1.8945439330284643e-07, "loss": 0.8396, "step": 46591 }, { "epoch": 0.88, "learning_rate": 1.8939606185366666e-07, "loss": 0.8839, "step": 46592 }, { "epoch": 0.88, "learning_rate": 1.893377390322107e-07, "loss": 1.0289, "step": 46593 }, { "epoch": 0.88, "learning_rate": 1.8927942483869726e-07, "loss": 0.8368, "step": 46594 }, { "epoch": 0.88, "learning_rate": 1.8922111927334312e-07, "loss": 0.9649, "step": 46595 }, { "epoch": 0.88, "learning_rate": 1.891628223363673e-07, "loss": 0.8149, "step": 46596 }, { "epoch": 0.88, "learning_rate": 1.8910453402798568e-07, "loss": 1.016, "step": 46597 }, { "epoch": 0.88, "learning_rate": 1.8904625434841756e-07, "loss": 0.6074, "step": 46598 }, { "epoch": 0.88, "learning_rate": 1.8898798329787972e-07, "loss": 0.9159, "step": 46599 }, { "epoch": 0.88, "learning_rate": 1.8892972087658974e-07, "loss": 0.8984, "step": 46600 }, { "epoch": 0.88, "learning_rate": 1.8887146708476523e-07, "loss": 0.9562, "step": 46601 }, { "epoch": 0.88, "learning_rate": 1.888132219226238e-07, "loss": 1.0115, "step": 46602 }, { "epoch": 0.88, "learning_rate": 1.8875498539038306e-07, "loss": 0.9507, "step": 46603 }, { "epoch": 0.88, "learning_rate": 1.8869675748826034e-07, "loss": 0.6843, "step": 46604 }, { "epoch": 0.88, "learning_rate": 1.8863853821647347e-07, "loss": 0.9612, "step": 46605 }, { "epoch": 0.88, "learning_rate": 1.8858032757523848e-07, "loss": 1.4587, "step": 46606 }, { "epoch": 0.88, "learning_rate": 1.8852212556477484e-07, "loss": 0.9211, "step": 46607 }, { "epoch": 0.88, "learning_rate": 1.8846393218529796e-07, "loss": 0.7988, "step": 46608 }, { "epoch": 0.88, "learning_rate": 1.8840574743702544e-07, "loss": 0.9531, "step": 46609 }, { "epoch": 0.88, "learning_rate": 1.88347571320176e-07, "loss": 0.8423, "step": 46610 }, { "epoch": 0.88, "learning_rate": 1.882894038349653e-07, "loss": 0.8297, "step": 46611 }, { "epoch": 0.88, "learning_rate": 1.882312449816112e-07, "loss": 1.1291, "step": 46612 }, { "epoch": 0.88, "learning_rate": 1.881730947603308e-07, "loss": 0.7876, "step": 46613 }, { "epoch": 0.88, "learning_rate": 1.881149531713411e-07, "loss": 0.957, "step": 46614 }, { "epoch": 0.88, "learning_rate": 1.8805682021485945e-07, "loss": 0.886, "step": 46615 }, { "epoch": 0.88, "learning_rate": 1.8799869589110232e-07, "loss": 0.7567, "step": 46616 }, { "epoch": 0.88, "learning_rate": 1.879405802002879e-07, "loss": 0.9886, "step": 46617 }, { "epoch": 0.88, "learning_rate": 1.8788247314263152e-07, "loss": 1.1661, "step": 46618 }, { "epoch": 0.88, "learning_rate": 1.8782437471835224e-07, "loss": 0.9745, "step": 46619 }, { "epoch": 0.88, "learning_rate": 1.8776628492766512e-07, "loss": 1.0688, "step": 46620 }, { "epoch": 0.88, "learning_rate": 1.877082037707878e-07, "loss": 0.8679, "step": 46621 }, { "epoch": 0.88, "learning_rate": 1.876501312479373e-07, "loss": 0.7446, "step": 46622 }, { "epoch": 0.88, "learning_rate": 1.875920673593301e-07, "loss": 0.8954, "step": 46623 }, { "epoch": 0.88, "learning_rate": 1.875340121051833e-07, "loss": 1.1023, "step": 46624 }, { "epoch": 0.88, "learning_rate": 1.874759654857136e-07, "loss": 1.0513, "step": 46625 }, { "epoch": 0.88, "learning_rate": 1.874179275011384e-07, "loss": 0.9161, "step": 46626 }, { "epoch": 0.88, "learning_rate": 1.8735989815167277e-07, "loss": 1.0165, "step": 46627 }, { "epoch": 0.88, "learning_rate": 1.8730187743753513e-07, "loss": 0.8683, "step": 46628 }, { "epoch": 0.88, "learning_rate": 1.872438653589409e-07, "loss": 0.8052, "step": 46629 }, { "epoch": 0.88, "learning_rate": 1.8718586191610683e-07, "loss": 1.1059, "step": 46630 }, { "epoch": 0.88, "learning_rate": 1.8712786710925079e-07, "loss": 1.0855, "step": 46631 }, { "epoch": 0.88, "learning_rate": 1.8706988093858764e-07, "loss": 0.8981, "step": 46632 }, { "epoch": 0.88, "learning_rate": 1.8701190340433496e-07, "loss": 0.9013, "step": 46633 }, { "epoch": 0.88, "learning_rate": 1.8695393450670868e-07, "loss": 0.7771, "step": 46634 }, { "epoch": 0.88, "learning_rate": 1.8689597424592558e-07, "loss": 0.8658, "step": 46635 }, { "epoch": 0.88, "learning_rate": 1.8683802262220218e-07, "loss": 0.8643, "step": 46636 }, { "epoch": 0.88, "learning_rate": 1.867800796357544e-07, "loss": 0.9241, "step": 46637 }, { "epoch": 0.88, "learning_rate": 1.8672214528679955e-07, "loss": 1.0126, "step": 46638 }, { "epoch": 0.88, "learning_rate": 1.866642195755522e-07, "loss": 0.9688, "step": 46639 }, { "epoch": 0.88, "learning_rate": 1.8660630250223078e-07, "loss": 0.9098, "step": 46640 }, { "epoch": 0.88, "learning_rate": 1.8654839406704984e-07, "loss": 0.8843, "step": 46641 }, { "epoch": 0.88, "learning_rate": 1.8649049427022642e-07, "loss": 0.7712, "step": 46642 }, { "epoch": 0.88, "learning_rate": 1.8643260311197646e-07, "loss": 1.0718, "step": 46643 }, { "epoch": 0.88, "learning_rate": 1.8637472059251648e-07, "loss": 0.9742, "step": 46644 }, { "epoch": 0.88, "learning_rate": 1.8631684671206212e-07, "loss": 1.0389, "step": 46645 }, { "epoch": 0.88, "learning_rate": 1.862589814708299e-07, "loss": 0.8367, "step": 46646 }, { "epoch": 0.88, "learning_rate": 1.8620112486903597e-07, "loss": 0.8742, "step": 46647 }, { "epoch": 0.88, "learning_rate": 1.861432769068952e-07, "loss": 0.9612, "step": 46648 }, { "epoch": 0.88, "learning_rate": 1.860854375846255e-07, "loss": 1.1131, "step": 46649 }, { "epoch": 0.88, "learning_rate": 1.8602760690244137e-07, "loss": 0.7783, "step": 46650 }, { "epoch": 0.88, "learning_rate": 1.859697848605585e-07, "loss": 0.9734, "step": 46651 }, { "epoch": 0.88, "learning_rate": 1.8591197145919475e-07, "loss": 0.8253, "step": 46652 }, { "epoch": 0.88, "learning_rate": 1.8585416669856415e-07, "loss": 0.7997, "step": 46653 }, { "epoch": 0.88, "learning_rate": 1.8579637057888317e-07, "loss": 0.8967, "step": 46654 }, { "epoch": 0.88, "learning_rate": 1.8573858310036746e-07, "loss": 1.0825, "step": 46655 }, { "epoch": 0.88, "learning_rate": 1.85680804263233e-07, "loss": 0.8741, "step": 46656 }, { "epoch": 0.88, "learning_rate": 1.8562303406769565e-07, "loss": 0.8574, "step": 46657 }, { "epoch": 0.88, "learning_rate": 1.855652725139706e-07, "loss": 0.9226, "step": 46658 }, { "epoch": 0.88, "learning_rate": 1.855075196022746e-07, "loss": 0.7973, "step": 46659 }, { "epoch": 0.88, "learning_rate": 1.854497753328216e-07, "loss": 0.9009, "step": 46660 }, { "epoch": 0.88, "learning_rate": 1.85392039705829e-07, "loss": 0.9673, "step": 46661 }, { "epoch": 0.88, "learning_rate": 1.8533431272151098e-07, "loss": 0.9841, "step": 46662 }, { "epoch": 0.88, "learning_rate": 1.8527659438008384e-07, "loss": 0.8439, "step": 46663 }, { "epoch": 0.88, "learning_rate": 1.852188846817629e-07, "loss": 0.7134, "step": 46664 }, { "epoch": 0.88, "learning_rate": 1.8516118362676362e-07, "loss": 0.7779, "step": 46665 }, { "epoch": 0.88, "learning_rate": 1.8510349121530158e-07, "loss": 0.8547, "step": 46666 }, { "epoch": 0.88, "learning_rate": 1.850458074475922e-07, "loss": 0.7149, "step": 46667 }, { "epoch": 0.88, "learning_rate": 1.849881323238509e-07, "loss": 1.0787, "step": 46668 }, { "epoch": 0.88, "learning_rate": 1.8493046584429242e-07, "loss": 0.8912, "step": 46669 }, { "epoch": 0.88, "learning_rate": 1.8487280800913333e-07, "loss": 0.9365, "step": 46670 }, { "epoch": 0.88, "learning_rate": 1.8481515881858786e-07, "loss": 0.8757, "step": 46671 }, { "epoch": 0.88, "learning_rate": 1.8475751827287086e-07, "loss": 0.7445, "step": 46672 }, { "epoch": 0.88, "learning_rate": 1.8469988637219937e-07, "loss": 0.8925, "step": 46673 }, { "epoch": 0.88, "learning_rate": 1.8464226311678712e-07, "loss": 0.801, "step": 46674 }, { "epoch": 0.88, "learning_rate": 1.8458464850684977e-07, "loss": 0.7273, "step": 46675 }, { "epoch": 0.88, "learning_rate": 1.8452704254260212e-07, "loss": 1.0212, "step": 46676 }, { "epoch": 0.88, "learning_rate": 1.8446944522425958e-07, "loss": 0.8219, "step": 46677 }, { "epoch": 0.88, "learning_rate": 1.8441185655203724e-07, "loss": 0.7287, "step": 46678 }, { "epoch": 0.88, "learning_rate": 1.8435427652614995e-07, "loss": 0.9483, "step": 46679 }, { "epoch": 0.88, "learning_rate": 1.8429670514681309e-07, "loss": 0.9454, "step": 46680 }, { "epoch": 0.88, "learning_rate": 1.8423914241424061e-07, "loss": 1.0605, "step": 46681 }, { "epoch": 0.88, "learning_rate": 1.8418158832864906e-07, "loss": 1.0165, "step": 46682 }, { "epoch": 0.88, "learning_rate": 1.8412404289025215e-07, "loss": 0.9656, "step": 46683 }, { "epoch": 0.88, "learning_rate": 1.8406650609926468e-07, "loss": 1.0437, "step": 46684 }, { "epoch": 0.88, "learning_rate": 1.8400897795590234e-07, "loss": 0.8843, "step": 46685 }, { "epoch": 0.88, "learning_rate": 1.839514584603791e-07, "loss": 0.7915, "step": 46686 }, { "epoch": 0.88, "learning_rate": 1.8389394761291006e-07, "loss": 1.1503, "step": 46687 }, { "epoch": 0.88, "learning_rate": 1.8383644541371038e-07, "loss": 1.0154, "step": 46688 }, { "epoch": 0.88, "learning_rate": 1.8377895186299454e-07, "loss": 0.7556, "step": 46689 }, { "epoch": 0.88, "learning_rate": 1.8372146696097633e-07, "loss": 1.0158, "step": 46690 }, { "epoch": 0.88, "learning_rate": 1.8366399070787188e-07, "loss": 0.8683, "step": 46691 }, { "epoch": 0.88, "learning_rate": 1.836065231038947e-07, "loss": 0.7907, "step": 46692 }, { "epoch": 0.88, "learning_rate": 1.8354906414925932e-07, "loss": 0.9334, "step": 46693 }, { "epoch": 0.88, "learning_rate": 1.834916138441817e-07, "loss": 0.9106, "step": 46694 }, { "epoch": 0.88, "learning_rate": 1.8343417218887465e-07, "loss": 0.942, "step": 46695 }, { "epoch": 0.88, "learning_rate": 1.8337673918355365e-07, "loss": 1.0719, "step": 46696 }, { "epoch": 0.88, "learning_rate": 1.8331931482843264e-07, "loss": 0.7988, "step": 46697 }, { "epoch": 0.88, "learning_rate": 1.8326189912372644e-07, "loss": 0.8955, "step": 46698 }, { "epoch": 0.88, "learning_rate": 1.8320449206964936e-07, "loss": 0.8759, "step": 46699 }, { "epoch": 0.88, "learning_rate": 1.8314709366641536e-07, "loss": 1.0619, "step": 46700 }, { "epoch": 0.88, "learning_rate": 1.8308970391423986e-07, "loss": 0.8982, "step": 46701 }, { "epoch": 0.88, "learning_rate": 1.8303232281333517e-07, "loss": 0.8057, "step": 46702 }, { "epoch": 0.88, "learning_rate": 1.8297495036391777e-07, "loss": 1.0153, "step": 46703 }, { "epoch": 0.88, "learning_rate": 1.8291758656620055e-07, "loss": 0.7689, "step": 46704 }, { "epoch": 0.88, "learning_rate": 1.8286023142039783e-07, "loss": 0.714, "step": 46705 }, { "epoch": 0.88, "learning_rate": 1.828028849267241e-07, "loss": 0.8866, "step": 46706 }, { "epoch": 0.88, "learning_rate": 1.8274554708539337e-07, "loss": 0.8858, "step": 46707 }, { "epoch": 0.88, "learning_rate": 1.8268821789661968e-07, "loss": 0.9561, "step": 46708 }, { "epoch": 0.88, "learning_rate": 1.8263089736061696e-07, "loss": 0.9114, "step": 46709 }, { "epoch": 0.88, "learning_rate": 1.8257358547760006e-07, "loss": 0.9708, "step": 46710 }, { "epoch": 0.88, "learning_rate": 1.8251628224778134e-07, "loss": 0.8452, "step": 46711 }, { "epoch": 0.88, "learning_rate": 1.824589876713767e-07, "loss": 0.8996, "step": 46712 }, { "epoch": 0.88, "learning_rate": 1.824017017485988e-07, "loss": 1.0162, "step": 46713 }, { "epoch": 0.88, "learning_rate": 1.8234442447966127e-07, "loss": 1.1209, "step": 46714 }, { "epoch": 0.88, "learning_rate": 1.822871558647796e-07, "loss": 0.9128, "step": 46715 }, { "epoch": 0.88, "learning_rate": 1.82229895904166e-07, "loss": 0.8062, "step": 46716 }, { "epoch": 0.88, "learning_rate": 1.8217264459803512e-07, "loss": 0.8807, "step": 46717 }, { "epoch": 0.88, "learning_rate": 1.8211540194660039e-07, "loss": 1.0276, "step": 46718 }, { "epoch": 0.88, "learning_rate": 1.8205816795007575e-07, "loss": 1.026, "step": 46719 }, { "epoch": 0.88, "learning_rate": 1.8200094260867496e-07, "loss": 0.7381, "step": 46720 }, { "epoch": 0.88, "learning_rate": 1.8194372592261146e-07, "loss": 0.7944, "step": 46721 }, { "epoch": 0.88, "learning_rate": 1.8188651789209922e-07, "loss": 0.6909, "step": 46722 }, { "epoch": 0.88, "learning_rate": 1.8182931851735115e-07, "loss": 0.8496, "step": 46723 }, { "epoch": 0.88, "learning_rate": 1.8177212779858206e-07, "loss": 0.9361, "step": 46724 }, { "epoch": 0.88, "learning_rate": 1.817149457360043e-07, "loss": 1.1144, "step": 46725 }, { "epoch": 0.88, "learning_rate": 1.8165777232983184e-07, "loss": 0.7318, "step": 46726 }, { "epoch": 0.88, "learning_rate": 1.8160060758027815e-07, "loss": 0.8766, "step": 46727 }, { "epoch": 0.88, "learning_rate": 1.8154345148755692e-07, "loss": 0.8918, "step": 46728 }, { "epoch": 0.88, "learning_rate": 1.8148630405188106e-07, "loss": 0.7445, "step": 46729 }, { "epoch": 0.88, "learning_rate": 1.8142916527346426e-07, "loss": 0.7987, "step": 46730 }, { "epoch": 0.88, "learning_rate": 1.8137203515252055e-07, "loss": 1.0022, "step": 46731 }, { "epoch": 0.88, "learning_rate": 1.813149136892617e-07, "loss": 0.8102, "step": 46732 }, { "epoch": 0.88, "learning_rate": 1.812578008839025e-07, "loss": 0.8276, "step": 46733 }, { "epoch": 0.88, "learning_rate": 1.812006967366553e-07, "loss": 0.7639, "step": 46734 }, { "epoch": 0.88, "learning_rate": 1.81143601247733e-07, "loss": 1.0666, "step": 46735 }, { "epoch": 0.88, "learning_rate": 1.8108651441735041e-07, "loss": 0.914, "step": 46736 }, { "epoch": 0.88, "learning_rate": 1.8102943624571933e-07, "loss": 1.1913, "step": 46737 }, { "epoch": 0.88, "learning_rate": 1.809723667330532e-07, "loss": 0.9248, "step": 46738 }, { "epoch": 0.88, "learning_rate": 1.8091530587956512e-07, "loss": 0.8143, "step": 46739 }, { "epoch": 0.88, "learning_rate": 1.8085825368546806e-07, "loss": 0.7596, "step": 46740 }, { "epoch": 0.88, "learning_rate": 1.8080121015097513e-07, "loss": 0.9311, "step": 46741 }, { "epoch": 0.88, "learning_rate": 1.807441752762995e-07, "loss": 0.9268, "step": 46742 }, { "epoch": 0.88, "learning_rate": 1.8068714906165462e-07, "loss": 1.1238, "step": 46743 }, { "epoch": 0.88, "learning_rate": 1.8063013150725174e-07, "loss": 0.9071, "step": 46744 }, { "epoch": 0.88, "learning_rate": 1.8057312261330562e-07, "loss": 0.8196, "step": 46745 }, { "epoch": 0.88, "learning_rate": 1.8051612238002807e-07, "loss": 0.9743, "step": 46746 }, { "epoch": 0.88, "learning_rate": 1.8045913080763227e-07, "loss": 0.8029, "step": 46747 }, { "epoch": 0.88, "learning_rate": 1.8040214789633083e-07, "loss": 0.8063, "step": 46748 }, { "epoch": 0.88, "learning_rate": 1.8034517364633657e-07, "loss": 0.9409, "step": 46749 }, { "epoch": 0.88, "learning_rate": 1.8028820805786245e-07, "loss": 0.8506, "step": 46750 }, { "epoch": 0.88, "learning_rate": 1.8023125113112105e-07, "loss": 0.7997, "step": 46751 }, { "epoch": 0.88, "learning_rate": 1.8017430286632525e-07, "loss": 0.7524, "step": 46752 }, { "epoch": 0.88, "learning_rate": 1.8011736326368683e-07, "loss": 0.7692, "step": 46753 }, { "epoch": 0.88, "learning_rate": 1.800604323234198e-07, "loss": 0.8291, "step": 46754 }, { "epoch": 0.88, "learning_rate": 1.8000351004573562e-07, "loss": 0.9828, "step": 46755 }, { "epoch": 0.88, "learning_rate": 1.7994659643084694e-07, "loss": 0.9587, "step": 46756 }, { "epoch": 0.88, "learning_rate": 1.7988969147896716e-07, "loss": 1.0912, "step": 46757 }, { "epoch": 0.88, "learning_rate": 1.7983279519030754e-07, "loss": 1.0013, "step": 46758 }, { "epoch": 0.88, "learning_rate": 1.797759075650815e-07, "loss": 0.8629, "step": 46759 }, { "epoch": 0.88, "learning_rate": 1.7971902860350083e-07, "loss": 0.7382, "step": 46760 }, { "epoch": 0.88, "learning_rate": 1.7966215830577837e-07, "loss": 0.6259, "step": 46761 }, { "epoch": 0.88, "learning_rate": 1.7960529667212622e-07, "loss": 0.9294, "step": 46762 }, { "epoch": 0.88, "learning_rate": 1.7954844370275643e-07, "loss": 1.1797, "step": 46763 }, { "epoch": 0.88, "learning_rate": 1.794915993978824e-07, "loss": 0.8909, "step": 46764 }, { "epoch": 0.88, "learning_rate": 1.7943476375771457e-07, "loss": 1.0771, "step": 46765 }, { "epoch": 0.88, "learning_rate": 1.7937793678246719e-07, "loss": 0.9444, "step": 46766 }, { "epoch": 0.88, "learning_rate": 1.793211184723509e-07, "loss": 0.7996, "step": 46767 }, { "epoch": 0.88, "learning_rate": 1.7926430882757834e-07, "loss": 1.2268, "step": 46768 }, { "epoch": 0.88, "learning_rate": 1.7920750784836182e-07, "loss": 1.1077, "step": 46769 }, { "epoch": 0.88, "learning_rate": 1.7915071553491315e-07, "loss": 0.8853, "step": 46770 }, { "epoch": 0.88, "learning_rate": 1.7909393188744461e-07, "loss": 0.8388, "step": 46771 }, { "epoch": 0.88, "learning_rate": 1.790371569061683e-07, "loss": 0.6859, "step": 46772 }, { "epoch": 0.88, "learning_rate": 1.789803905912965e-07, "loss": 0.7482, "step": 46773 }, { "epoch": 0.88, "learning_rate": 1.7892363294303967e-07, "loss": 0.8878, "step": 46774 }, { "epoch": 0.88, "learning_rate": 1.78866883961612e-07, "loss": 1.021, "step": 46775 }, { "epoch": 0.88, "learning_rate": 1.7881014364722366e-07, "loss": 0.8378, "step": 46776 }, { "epoch": 0.88, "learning_rate": 1.787534120000864e-07, "loss": 0.8338, "step": 46777 }, { "epoch": 0.88, "learning_rate": 1.7869668902041393e-07, "loss": 1.1731, "step": 46778 }, { "epoch": 0.88, "learning_rate": 1.7863997470841638e-07, "loss": 0.8824, "step": 46779 }, { "epoch": 0.88, "learning_rate": 1.785832690643058e-07, "loss": 0.9158, "step": 46780 }, { "epoch": 0.88, "learning_rate": 1.7852657208829422e-07, "loss": 1.0692, "step": 46781 }, { "epoch": 0.88, "learning_rate": 1.7846988378059315e-07, "loss": 1.0365, "step": 46782 }, { "epoch": 0.88, "learning_rate": 1.784132041414144e-07, "loss": 1.0806, "step": 46783 }, { "epoch": 0.88, "learning_rate": 1.7835653317096967e-07, "loss": 0.9264, "step": 46784 }, { "epoch": 0.88, "learning_rate": 1.782998708694708e-07, "loss": 0.6694, "step": 46785 }, { "epoch": 0.88, "learning_rate": 1.7824321723712818e-07, "loss": 0.7086, "step": 46786 }, { "epoch": 0.88, "learning_rate": 1.781865722741552e-07, "loss": 0.9758, "step": 46787 }, { "epoch": 0.88, "learning_rate": 1.7812993598076174e-07, "loss": 0.8454, "step": 46788 }, { "epoch": 0.88, "learning_rate": 1.7807330835716009e-07, "loss": 0.7861, "step": 46789 }, { "epoch": 0.88, "learning_rate": 1.7801668940356147e-07, "loss": 0.8793, "step": 46790 }, { "epoch": 0.88, "learning_rate": 1.7796007912017715e-07, "loss": 0.7318, "step": 46791 }, { "epoch": 0.88, "learning_rate": 1.7790347750721888e-07, "loss": 0.8973, "step": 46792 }, { "epoch": 0.88, "learning_rate": 1.7784688456489786e-07, "loss": 1.1639, "step": 46793 }, { "epoch": 0.88, "learning_rate": 1.777903002934256e-07, "loss": 0.8488, "step": 46794 }, { "epoch": 0.88, "learning_rate": 1.7773372469301247e-07, "loss": 0.6766, "step": 46795 }, { "epoch": 0.88, "learning_rate": 1.7767715776387112e-07, "loss": 0.9599, "step": 46796 }, { "epoch": 0.88, "learning_rate": 1.776205995062119e-07, "loss": 0.9509, "step": 46797 }, { "epoch": 0.88, "learning_rate": 1.775640499202455e-07, "loss": 0.8629, "step": 46798 }, { "epoch": 0.88, "learning_rate": 1.7750750900618453e-07, "loss": 0.9725, "step": 46799 }, { "epoch": 0.88, "learning_rate": 1.7745097676423906e-07, "loss": 1.0683, "step": 46800 }, { "epoch": 0.88, "learning_rate": 1.7739445319462033e-07, "loss": 0.9022, "step": 46801 }, { "epoch": 0.88, "learning_rate": 1.773379382975396e-07, "loss": 0.8634, "step": 46802 }, { "epoch": 0.88, "learning_rate": 1.7728143207320775e-07, "loss": 0.8217, "step": 46803 }, { "epoch": 0.88, "learning_rate": 1.7722493452183577e-07, "loss": 0.8331, "step": 46804 }, { "epoch": 0.88, "learning_rate": 1.7716844564363483e-07, "loss": 1.0255, "step": 46805 }, { "epoch": 0.88, "learning_rate": 1.7711196543881594e-07, "loss": 1.0108, "step": 46806 }, { "epoch": 0.88, "learning_rate": 1.7705549390758885e-07, "loss": 0.8444, "step": 46807 }, { "epoch": 0.88, "learning_rate": 1.7699903105016626e-07, "loss": 0.9609, "step": 46808 }, { "epoch": 0.88, "learning_rate": 1.7694257686675764e-07, "loss": 0.8727, "step": 46809 }, { "epoch": 0.88, "learning_rate": 1.7688613135757426e-07, "loss": 0.8245, "step": 46810 }, { "epoch": 0.88, "learning_rate": 1.7682969452282678e-07, "loss": 0.9554, "step": 46811 }, { "epoch": 0.88, "learning_rate": 1.767732663627261e-07, "loss": 0.9722, "step": 46812 }, { "epoch": 0.88, "learning_rate": 1.7671684687748297e-07, "loss": 0.9653, "step": 46813 }, { "epoch": 0.88, "learning_rate": 1.7666043606730742e-07, "loss": 0.9632, "step": 46814 }, { "epoch": 0.88, "learning_rate": 1.7660403393241098e-07, "loss": 0.7896, "step": 46815 }, { "epoch": 0.88, "learning_rate": 1.7654764047300376e-07, "loss": 1.1278, "step": 46816 }, { "epoch": 0.88, "learning_rate": 1.7649125568929642e-07, "loss": 0.8452, "step": 46817 }, { "epoch": 0.88, "learning_rate": 1.7643487958149936e-07, "loss": 0.918, "step": 46818 }, { "epoch": 0.88, "learning_rate": 1.763785121498232e-07, "loss": 0.9485, "step": 46819 }, { "epoch": 0.88, "learning_rate": 1.763221533944784e-07, "loss": 0.8443, "step": 46820 }, { "epoch": 0.88, "learning_rate": 1.7626580331567555e-07, "loss": 1.0392, "step": 46821 }, { "epoch": 0.88, "learning_rate": 1.7620946191362537e-07, "loss": 1.0145, "step": 46822 }, { "epoch": 0.88, "learning_rate": 1.7615312918853682e-07, "loss": 0.7798, "step": 46823 }, { "epoch": 0.88, "learning_rate": 1.760968051406217e-07, "loss": 0.9623, "step": 46824 }, { "epoch": 0.88, "learning_rate": 1.7604048977009041e-07, "loss": 0.9929, "step": 46825 }, { "epoch": 0.88, "learning_rate": 1.7598418307715165e-07, "loss": 0.9619, "step": 46826 }, { "epoch": 0.88, "learning_rate": 1.7592788506201773e-07, "loss": 0.8823, "step": 46827 }, { "epoch": 0.88, "learning_rate": 1.7587159572489743e-07, "loss": 0.7877, "step": 46828 }, { "epoch": 0.88, "learning_rate": 1.758153150660011e-07, "loss": 0.7883, "step": 46829 }, { "epoch": 0.88, "learning_rate": 1.7575904308553937e-07, "loss": 0.8074, "step": 46830 }, { "epoch": 0.88, "learning_rate": 1.7570277978372185e-07, "loss": 1.211, "step": 46831 }, { "epoch": 0.88, "learning_rate": 1.7564652516075892e-07, "loss": 0.984, "step": 46832 }, { "epoch": 0.88, "learning_rate": 1.7559027921686066e-07, "loss": 0.6607, "step": 46833 }, { "epoch": 0.88, "learning_rate": 1.755340419522375e-07, "loss": 0.9159, "step": 46834 }, { "epoch": 0.88, "learning_rate": 1.7547781336709814e-07, "loss": 0.8423, "step": 46835 }, { "epoch": 0.88, "learning_rate": 1.7542159346165432e-07, "loss": 0.9278, "step": 46836 }, { "epoch": 0.88, "learning_rate": 1.7536538223611426e-07, "loss": 1.0366, "step": 46837 }, { "epoch": 0.88, "learning_rate": 1.753091796906889e-07, "loss": 0.828, "step": 46838 }, { "epoch": 0.88, "learning_rate": 1.7525298582558746e-07, "loss": 0.8378, "step": 46839 }, { "epoch": 0.88, "learning_rate": 1.751968006410204e-07, "loss": 0.8423, "step": 46840 }, { "epoch": 0.88, "learning_rate": 1.7514062413719695e-07, "loss": 0.7827, "step": 46841 }, { "epoch": 0.88, "learning_rate": 1.7508445631432725e-07, "loss": 0.8084, "step": 46842 }, { "epoch": 0.88, "learning_rate": 1.7502829717262139e-07, "loss": 1.0305, "step": 46843 }, { "epoch": 0.88, "learning_rate": 1.749721467122878e-07, "loss": 0.9634, "step": 46844 }, { "epoch": 0.88, "learning_rate": 1.7491600493353716e-07, "loss": 0.9719, "step": 46845 }, { "epoch": 0.88, "learning_rate": 1.7485987183657932e-07, "loss": 0.9034, "step": 46846 }, { "epoch": 0.88, "learning_rate": 1.748037474216227e-07, "loss": 0.7856, "step": 46847 }, { "epoch": 0.88, "learning_rate": 1.7474763168887827e-07, "loss": 0.8556, "step": 46848 }, { "epoch": 0.88, "learning_rate": 1.7469152463855443e-07, "loss": 0.9487, "step": 46849 }, { "epoch": 0.88, "learning_rate": 1.7463542627086132e-07, "loss": 0.9156, "step": 46850 }, { "epoch": 0.88, "learning_rate": 1.7457933658600822e-07, "loss": 0.8207, "step": 46851 }, { "epoch": 0.88, "learning_rate": 1.745232555842047e-07, "loss": 0.918, "step": 46852 }, { "epoch": 0.88, "learning_rate": 1.744671832656597e-07, "loss": 0.8646, "step": 46853 }, { "epoch": 0.88, "learning_rate": 1.744111196305831e-07, "loss": 0.8789, "step": 46854 }, { "epoch": 0.88, "learning_rate": 1.7435506467918444e-07, "loss": 1.0301, "step": 46855 }, { "epoch": 0.88, "learning_rate": 1.742990184116719e-07, "loss": 0.8976, "step": 46856 }, { "epoch": 0.88, "learning_rate": 1.742429808282564e-07, "loss": 0.9308, "step": 46857 }, { "epoch": 0.88, "learning_rate": 1.7418695192914586e-07, "loss": 0.8305, "step": 46858 }, { "epoch": 0.88, "learning_rate": 1.7413093171454982e-07, "loss": 0.8293, "step": 46859 }, { "epoch": 0.88, "learning_rate": 1.740749201846778e-07, "loss": 0.8049, "step": 46860 }, { "epoch": 0.88, "learning_rate": 1.7401891733973857e-07, "loss": 0.9356, "step": 46861 }, { "epoch": 0.88, "learning_rate": 1.739629231799414e-07, "loss": 1.0391, "step": 46862 }, { "epoch": 0.88, "learning_rate": 1.7390693770549528e-07, "loss": 0.879, "step": 46863 }, { "epoch": 0.88, "learning_rate": 1.7385096091660974e-07, "loss": 0.887, "step": 46864 }, { "epoch": 0.88, "learning_rate": 1.7379499281349272e-07, "loss": 0.9101, "step": 46865 }, { "epoch": 0.88, "learning_rate": 1.7373903339635428e-07, "loss": 0.773, "step": 46866 }, { "epoch": 0.88, "learning_rate": 1.7368308266540318e-07, "loss": 0.8699, "step": 46867 }, { "epoch": 0.88, "learning_rate": 1.7362714062084728e-07, "loss": 0.9709, "step": 46868 }, { "epoch": 0.88, "learning_rate": 1.735712072628973e-07, "loss": 0.9285, "step": 46869 }, { "epoch": 0.88, "learning_rate": 1.7351528259176077e-07, "loss": 0.9911, "step": 46870 }, { "epoch": 0.88, "learning_rate": 1.7345936660764674e-07, "loss": 1.0388, "step": 46871 }, { "epoch": 0.88, "learning_rate": 1.734034593107642e-07, "loss": 0.8746, "step": 46872 }, { "epoch": 0.88, "learning_rate": 1.733475607013216e-07, "loss": 0.8844, "step": 46873 }, { "epoch": 0.88, "learning_rate": 1.732916707795279e-07, "loss": 1.1001, "step": 46874 }, { "epoch": 0.88, "learning_rate": 1.732357895455919e-07, "loss": 0.8928, "step": 46875 }, { "epoch": 0.88, "learning_rate": 1.7317991699972253e-07, "loss": 1.0096, "step": 46876 }, { "epoch": 0.88, "learning_rate": 1.7312405314212717e-07, "loss": 0.9992, "step": 46877 }, { "epoch": 0.88, "learning_rate": 1.730681979730159e-07, "loss": 0.9097, "step": 46878 }, { "epoch": 0.88, "learning_rate": 1.7301235149259632e-07, "loss": 1.0272, "step": 46879 }, { "epoch": 0.88, "learning_rate": 1.729565137010772e-07, "loss": 0.916, "step": 46880 }, { "epoch": 0.88, "learning_rate": 1.729006845986672e-07, "loss": 1.1282, "step": 46881 }, { "epoch": 0.88, "learning_rate": 1.7284486418557483e-07, "loss": 1.0404, "step": 46882 }, { "epoch": 0.88, "learning_rate": 1.7278905246200822e-07, "loss": 0.891, "step": 46883 }, { "epoch": 0.88, "learning_rate": 1.727332494281761e-07, "loss": 0.8753, "step": 46884 }, { "epoch": 0.88, "learning_rate": 1.7267745508428636e-07, "loss": 0.8752, "step": 46885 }, { "epoch": 0.88, "learning_rate": 1.7262166943054797e-07, "loss": 0.8274, "step": 46886 }, { "epoch": 0.88, "learning_rate": 1.725658924671686e-07, "loss": 1.0917, "step": 46887 }, { "epoch": 0.88, "learning_rate": 1.7251012419435748e-07, "loss": 1.0907, "step": 46888 }, { "epoch": 0.88, "learning_rate": 1.724543646123214e-07, "loss": 0.7264, "step": 46889 }, { "epoch": 0.88, "learning_rate": 1.7239861372126992e-07, "loss": 0.7407, "step": 46890 }, { "epoch": 0.88, "learning_rate": 1.7234287152141038e-07, "loss": 0.776, "step": 46891 }, { "epoch": 0.88, "learning_rate": 1.7228713801295122e-07, "loss": 0.8779, "step": 46892 }, { "epoch": 0.88, "learning_rate": 1.7223141319610059e-07, "loss": 0.9826, "step": 46893 }, { "epoch": 0.88, "learning_rate": 1.7217569707106641e-07, "loss": 0.8744, "step": 46894 }, { "epoch": 0.88, "learning_rate": 1.721199896380568e-07, "loss": 0.7981, "step": 46895 }, { "epoch": 0.88, "learning_rate": 1.7206429089727973e-07, "loss": 0.903, "step": 46896 }, { "epoch": 0.88, "learning_rate": 1.7200860084894382e-07, "loss": 0.9422, "step": 46897 }, { "epoch": 0.88, "learning_rate": 1.7195291949325537e-07, "loss": 0.8761, "step": 46898 }, { "epoch": 0.88, "learning_rate": 1.7189724683042418e-07, "loss": 1.2319, "step": 46899 }, { "epoch": 0.88, "learning_rate": 1.7184158286065705e-07, "loss": 1.0233, "step": 46900 }, { "epoch": 0.88, "learning_rate": 1.7178592758416157e-07, "loss": 0.9304, "step": 46901 }, { "epoch": 0.88, "learning_rate": 1.7173028100114675e-07, "loss": 0.9475, "step": 46902 }, { "epoch": 0.88, "learning_rate": 1.7167464311181937e-07, "loss": 0.7538, "step": 46903 }, { "epoch": 0.88, "learning_rate": 1.7161901391638757e-07, "loss": 0.6559, "step": 46904 }, { "epoch": 0.88, "learning_rate": 1.7156339341505873e-07, "loss": 0.9769, "step": 46905 }, { "epoch": 0.88, "learning_rate": 1.71507781608041e-07, "loss": 0.8967, "step": 46906 }, { "epoch": 0.88, "learning_rate": 1.714521784955417e-07, "loss": 0.8123, "step": 46907 }, { "epoch": 0.89, "learning_rate": 1.7139658407776872e-07, "loss": 0.7947, "step": 46908 }, { "epoch": 0.89, "learning_rate": 1.7134099835492996e-07, "loss": 0.721, "step": 46909 }, { "epoch": 0.89, "learning_rate": 1.7128542132723136e-07, "loss": 0.8915, "step": 46910 }, { "epoch": 0.89, "learning_rate": 1.7122985299488276e-07, "loss": 0.96, "step": 46911 }, { "epoch": 0.89, "learning_rate": 1.7117429335808982e-07, "loss": 1.0313, "step": 46912 }, { "epoch": 0.89, "learning_rate": 1.7111874241706073e-07, "loss": 0.7274, "step": 46913 }, { "epoch": 0.89, "learning_rate": 1.7106320017200308e-07, "loss": 0.9005, "step": 46914 }, { "epoch": 0.89, "learning_rate": 1.7100766662312391e-07, "loss": 0.8049, "step": 46915 }, { "epoch": 0.89, "learning_rate": 1.7095214177063057e-07, "loss": 0.875, "step": 46916 }, { "epoch": 0.89, "learning_rate": 1.7089662561473068e-07, "loss": 0.8766, "step": 46917 }, { "epoch": 0.89, "learning_rate": 1.708411181556316e-07, "loss": 1.066, "step": 46918 }, { "epoch": 0.89, "learning_rate": 1.7078561939353976e-07, "loss": 0.9614, "step": 46919 }, { "epoch": 0.89, "learning_rate": 1.7073012932866367e-07, "loss": 0.9151, "step": 46920 }, { "epoch": 0.89, "learning_rate": 1.7067464796120952e-07, "loss": 0.8826, "step": 46921 }, { "epoch": 0.89, "learning_rate": 1.706191752913844e-07, "loss": 0.8411, "step": 46922 }, { "epoch": 0.89, "learning_rate": 1.705637113193967e-07, "loss": 0.7094, "step": 46923 }, { "epoch": 0.89, "learning_rate": 1.7050825604545211e-07, "loss": 0.8954, "step": 46924 }, { "epoch": 0.89, "learning_rate": 1.7045280946975827e-07, "loss": 0.9899, "step": 46925 }, { "epoch": 0.89, "learning_rate": 1.703973715925225e-07, "loss": 0.9834, "step": 46926 }, { "epoch": 0.89, "learning_rate": 1.703419424139513e-07, "loss": 0.7583, "step": 46927 }, { "epoch": 0.89, "learning_rate": 1.70286521934252e-07, "loss": 0.8747, "step": 46928 }, { "epoch": 0.89, "learning_rate": 1.7023111015363135e-07, "loss": 0.6768, "step": 46929 }, { "epoch": 0.89, "learning_rate": 1.7017570707229648e-07, "loss": 1.0316, "step": 46930 }, { "epoch": 0.89, "learning_rate": 1.7012031269045354e-07, "loss": 1.0955, "step": 46931 }, { "epoch": 0.89, "learning_rate": 1.7006492700831072e-07, "loss": 1.0357, "step": 46932 }, { "epoch": 0.89, "learning_rate": 1.7000955002607345e-07, "loss": 0.9307, "step": 46933 }, { "epoch": 0.89, "learning_rate": 1.6995418174394928e-07, "loss": 0.8467, "step": 46934 }, { "epoch": 0.89, "learning_rate": 1.6989882216214476e-07, "loss": 0.9595, "step": 46935 }, { "epoch": 0.89, "learning_rate": 1.6984347128086637e-07, "loss": 0.9887, "step": 46936 }, { "epoch": 0.89, "learning_rate": 1.6978812910032116e-07, "loss": 0.9143, "step": 46937 }, { "epoch": 0.89, "learning_rate": 1.6973279562071564e-07, "loss": 1.0079, "step": 46938 }, { "epoch": 0.89, "learning_rate": 1.6967747084225687e-07, "loss": 0.8905, "step": 46939 }, { "epoch": 0.89, "learning_rate": 1.6962215476515e-07, "loss": 0.9254, "step": 46940 }, { "epoch": 0.89, "learning_rate": 1.695668473896034e-07, "loss": 0.7596, "step": 46941 }, { "epoch": 0.89, "learning_rate": 1.6951154871582248e-07, "loss": 0.8012, "step": 46942 }, { "epoch": 0.89, "learning_rate": 1.694562587440135e-07, "loss": 1.0463, "step": 46943 }, { "epoch": 0.89, "learning_rate": 1.6940097747438405e-07, "loss": 1.1699, "step": 46944 }, { "epoch": 0.89, "learning_rate": 1.6934570490713954e-07, "loss": 0.9095, "step": 46945 }, { "epoch": 0.89, "learning_rate": 1.6929044104248697e-07, "loss": 0.8255, "step": 46946 }, { "epoch": 0.89, "learning_rate": 1.692351858806321e-07, "loss": 1.0244, "step": 46947 }, { "epoch": 0.89, "learning_rate": 1.691799394217819e-07, "loss": 0.9213, "step": 46948 }, { "epoch": 0.89, "learning_rate": 1.691247016661421e-07, "loss": 0.9531, "step": 46949 }, { "epoch": 0.89, "learning_rate": 1.6906947261391914e-07, "loss": 1.1577, "step": 46950 }, { "epoch": 0.89, "learning_rate": 1.6901425226531986e-07, "loss": 0.6944, "step": 46951 }, { "epoch": 0.89, "learning_rate": 1.6895904062054908e-07, "loss": 0.7716, "step": 46952 }, { "epoch": 0.89, "learning_rate": 1.6890383767981467e-07, "loss": 0.6832, "step": 46953 }, { "epoch": 0.89, "learning_rate": 1.688486434433212e-07, "loss": 0.797, "step": 46954 }, { "epoch": 0.89, "learning_rate": 1.6879345791127572e-07, "loss": 0.7466, "step": 46955 }, { "epoch": 0.89, "learning_rate": 1.687382810838839e-07, "loss": 0.8609, "step": 46956 }, { "epoch": 0.89, "learning_rate": 1.686831129613517e-07, "loss": 0.7127, "step": 46957 }, { "epoch": 0.89, "learning_rate": 1.6862795354388534e-07, "loss": 0.8249, "step": 46958 }, { "epoch": 0.89, "learning_rate": 1.6857280283169075e-07, "loss": 0.7367, "step": 46959 }, { "epoch": 0.89, "learning_rate": 1.6851766082497418e-07, "loss": 0.8596, "step": 46960 }, { "epoch": 0.89, "learning_rate": 1.6846252752394043e-07, "loss": 0.6866, "step": 46961 }, { "epoch": 0.89, "learning_rate": 1.6840740292879715e-07, "loss": 1.008, "step": 46962 }, { "epoch": 0.89, "learning_rate": 1.6835228703974832e-07, "loss": 0.8558, "step": 46963 }, { "epoch": 0.89, "learning_rate": 1.6829717985700044e-07, "loss": 0.6901, "step": 46964 }, { "epoch": 0.89, "learning_rate": 1.6824208138076003e-07, "loss": 0.6859, "step": 46965 }, { "epoch": 0.89, "learning_rate": 1.681869916112319e-07, "loss": 0.8951, "step": 46966 }, { "epoch": 0.89, "learning_rate": 1.6813191054862205e-07, "loss": 0.7412, "step": 46967 }, { "epoch": 0.89, "learning_rate": 1.6807683819313608e-07, "loss": 1.0267, "step": 46968 }, { "epoch": 0.89, "learning_rate": 1.680217745449797e-07, "loss": 0.8712, "step": 46969 }, { "epoch": 0.89, "learning_rate": 1.6796671960435856e-07, "loss": 1.1432, "step": 46970 }, { "epoch": 0.89, "learning_rate": 1.6791167337147835e-07, "loss": 0.8105, "step": 46971 }, { "epoch": 0.89, "learning_rate": 1.6785663584654444e-07, "loss": 0.8732, "step": 46972 }, { "epoch": 0.89, "learning_rate": 1.6780160702976195e-07, "loss": 0.9251, "step": 46973 }, { "epoch": 0.89, "learning_rate": 1.6774658692133738e-07, "loss": 1.0341, "step": 46974 }, { "epoch": 0.89, "learning_rate": 1.6769157552147502e-07, "loss": 1.1089, "step": 46975 }, { "epoch": 0.89, "learning_rate": 1.676365728303811e-07, "loss": 1.0991, "step": 46976 }, { "epoch": 0.89, "learning_rate": 1.6758157884826043e-07, "loss": 0.7576, "step": 46977 }, { "epoch": 0.89, "learning_rate": 1.675265935753187e-07, "loss": 0.7766, "step": 46978 }, { "epoch": 0.89, "learning_rate": 1.6747161701176128e-07, "loss": 0.7552, "step": 46979 }, { "epoch": 0.89, "learning_rate": 1.674166491577933e-07, "loss": 0.9954, "step": 46980 }, { "epoch": 0.89, "learning_rate": 1.6736169001362045e-07, "loss": 0.9738, "step": 46981 }, { "epoch": 0.89, "learning_rate": 1.673067395794467e-07, "loss": 0.7915, "step": 46982 }, { "epoch": 0.89, "learning_rate": 1.6725179785547858e-07, "loss": 0.9127, "step": 46983 }, { "epoch": 0.89, "learning_rate": 1.671968648419206e-07, "loss": 0.9658, "step": 46984 }, { "epoch": 0.89, "learning_rate": 1.6714194053897765e-07, "loss": 0.9057, "step": 46985 }, { "epoch": 0.89, "learning_rate": 1.670870249468559e-07, "loss": 0.9115, "step": 46986 }, { "epoch": 0.89, "learning_rate": 1.6703211806575915e-07, "loss": 0.9993, "step": 46987 }, { "epoch": 0.89, "learning_rate": 1.6697721989589328e-07, "loss": 0.9741, "step": 46988 }, { "epoch": 0.89, "learning_rate": 1.6692233043746258e-07, "loss": 1.015, "step": 46989 }, { "epoch": 0.89, "learning_rate": 1.668674496906725e-07, "loss": 0.8886, "step": 46990 }, { "epoch": 0.89, "learning_rate": 1.6681257765572778e-07, "loss": 0.7841, "step": 46991 }, { "epoch": 0.89, "learning_rate": 1.6675771433283332e-07, "loss": 0.7557, "step": 46992 }, { "epoch": 0.89, "learning_rate": 1.6670285972219453e-07, "loss": 1.0983, "step": 46993 }, { "epoch": 0.89, "learning_rate": 1.666480138240148e-07, "loss": 0.8735, "step": 46994 }, { "epoch": 0.89, "learning_rate": 1.6659317663850094e-07, "loss": 0.9244, "step": 46995 }, { "epoch": 0.89, "learning_rate": 1.6653834816585585e-07, "loss": 0.9838, "step": 46996 }, { "epoch": 0.89, "learning_rate": 1.6648352840628518e-07, "loss": 0.9676, "step": 46997 }, { "epoch": 0.89, "learning_rate": 1.664287173599935e-07, "loss": 0.6802, "step": 46998 }, { "epoch": 0.89, "learning_rate": 1.6637391502718535e-07, "loss": 0.9761, "step": 46999 }, { "epoch": 0.89, "learning_rate": 1.663191214080656e-07, "loss": 0.9724, "step": 47000 }, { "epoch": 0.89, "learning_rate": 1.6626433650283853e-07, "loss": 0.9914, "step": 47001 }, { "epoch": 0.89, "learning_rate": 1.6620956031170947e-07, "loss": 0.9385, "step": 47002 }, { "epoch": 0.89, "learning_rate": 1.661547928348814e-07, "loss": 1.0082, "step": 47003 }, { "epoch": 0.89, "learning_rate": 1.6610003407256047e-07, "loss": 0.8705, "step": 47004 }, { "epoch": 0.89, "learning_rate": 1.6604528402495018e-07, "loss": 0.7818, "step": 47005 }, { "epoch": 0.89, "learning_rate": 1.6599054269225507e-07, "loss": 1.0727, "step": 47006 }, { "epoch": 0.89, "learning_rate": 1.6593581007468023e-07, "loss": 0.8624, "step": 47007 }, { "epoch": 0.89, "learning_rate": 1.6588108617242914e-07, "loss": 0.916, "step": 47008 }, { "epoch": 0.89, "learning_rate": 1.6582637098570636e-07, "loss": 1.0143, "step": 47009 }, { "epoch": 0.89, "learning_rate": 1.657716645147167e-07, "loss": 0.854, "step": 47010 }, { "epoch": 0.89, "learning_rate": 1.6571696675966392e-07, "loss": 0.8188, "step": 47011 }, { "epoch": 0.89, "learning_rate": 1.6566227772075226e-07, "loss": 1.0157, "step": 47012 }, { "epoch": 0.89, "learning_rate": 1.6560759739818633e-07, "loss": 0.9628, "step": 47013 }, { "epoch": 0.89, "learning_rate": 1.6555292579217035e-07, "loss": 1.066, "step": 47014 }, { "epoch": 0.89, "learning_rate": 1.6549826290290728e-07, "loss": 0.8879, "step": 47015 }, { "epoch": 0.89, "learning_rate": 1.65443608730603e-07, "loss": 0.6457, "step": 47016 }, { "epoch": 0.89, "learning_rate": 1.6538896327546043e-07, "loss": 0.757, "step": 47017 }, { "epoch": 0.89, "learning_rate": 1.653343265376836e-07, "loss": 1.1427, "step": 47018 }, { "epoch": 0.89, "learning_rate": 1.6527969851747704e-07, "loss": 0.8209, "step": 47019 }, { "epoch": 0.89, "learning_rate": 1.6522507921504448e-07, "loss": 0.9227, "step": 47020 }, { "epoch": 0.89, "learning_rate": 1.6517046863058995e-07, "loss": 0.8837, "step": 47021 }, { "epoch": 0.89, "learning_rate": 1.6511586676431713e-07, "loss": 0.9453, "step": 47022 }, { "epoch": 0.89, "learning_rate": 1.650612736164306e-07, "loss": 0.9355, "step": 47023 }, { "epoch": 0.89, "learning_rate": 1.6500668918713269e-07, "loss": 0.829, "step": 47024 }, { "epoch": 0.89, "learning_rate": 1.6495211347662909e-07, "loss": 1.0642, "step": 47025 }, { "epoch": 0.89, "learning_rate": 1.6489754648512242e-07, "loss": 1.0413, "step": 47026 }, { "epoch": 0.89, "learning_rate": 1.6484298821281636e-07, "loss": 0.9213, "step": 47027 }, { "epoch": 0.89, "learning_rate": 1.6478843865991578e-07, "loss": 0.7318, "step": 47028 }, { "epoch": 0.89, "learning_rate": 1.6473389782662302e-07, "loss": 0.9069, "step": 47029 }, { "epoch": 0.89, "learning_rate": 1.6467936571314236e-07, "loss": 0.7959, "step": 47030 }, { "epoch": 0.89, "learning_rate": 1.6462484231967724e-07, "loss": 0.8897, "step": 47031 }, { "epoch": 0.89, "learning_rate": 1.6457032764643137e-07, "loss": 0.8691, "step": 47032 }, { "epoch": 0.89, "learning_rate": 1.6451582169360852e-07, "loss": 0.7817, "step": 47033 }, { "epoch": 0.89, "learning_rate": 1.6446132446141182e-07, "loss": 0.882, "step": 47034 }, { "epoch": 0.89, "learning_rate": 1.6440683595004532e-07, "loss": 0.9652, "step": 47035 }, { "epoch": 0.89, "learning_rate": 1.643523561597113e-07, "loss": 0.9257, "step": 47036 }, { "epoch": 0.89, "learning_rate": 1.6429788509061462e-07, "loss": 1.0811, "step": 47037 }, { "epoch": 0.89, "learning_rate": 1.642434227429579e-07, "loss": 1.0094, "step": 47038 }, { "epoch": 0.89, "learning_rate": 1.6418896911694432e-07, "loss": 1.0399, "step": 47039 }, { "epoch": 0.89, "learning_rate": 1.6413452421277788e-07, "loss": 0.8797, "step": 47040 }, { "epoch": 0.89, "learning_rate": 1.6408008803066116e-07, "loss": 0.8817, "step": 47041 }, { "epoch": 0.89, "learning_rate": 1.6402566057079793e-07, "loss": 0.8699, "step": 47042 }, { "epoch": 0.89, "learning_rate": 1.6397124183339136e-07, "loss": 1.2689, "step": 47043 }, { "epoch": 0.89, "learning_rate": 1.6391683181864487e-07, "loss": 1.1337, "step": 47044 }, { "epoch": 0.89, "learning_rate": 1.6386243052676083e-07, "loss": 0.8698, "step": 47045 }, { "epoch": 0.89, "learning_rate": 1.6380803795794292e-07, "loss": 0.8003, "step": 47046 }, { "epoch": 0.89, "learning_rate": 1.6375365411239409e-07, "loss": 0.9615, "step": 47047 }, { "epoch": 0.89, "learning_rate": 1.6369927899031746e-07, "loss": 0.6891, "step": 47048 }, { "epoch": 0.89, "learning_rate": 1.6364491259191624e-07, "loss": 0.8972, "step": 47049 }, { "epoch": 0.89, "learning_rate": 1.635905549173933e-07, "loss": 0.9127, "step": 47050 }, { "epoch": 0.89, "learning_rate": 1.635362059669518e-07, "loss": 0.8717, "step": 47051 }, { "epoch": 0.89, "learning_rate": 1.6348186574079383e-07, "loss": 1.0421, "step": 47052 }, { "epoch": 0.89, "learning_rate": 1.6342753423912312e-07, "loss": 0.9688, "step": 47053 }, { "epoch": 0.89, "learning_rate": 1.6337321146214307e-07, "loss": 0.912, "step": 47054 }, { "epoch": 0.89, "learning_rate": 1.633188974100547e-07, "loss": 0.9789, "step": 47055 }, { "epoch": 0.89, "learning_rate": 1.6326459208306304e-07, "loss": 0.9578, "step": 47056 }, { "epoch": 0.89, "learning_rate": 1.6321029548136912e-07, "loss": 0.7607, "step": 47057 }, { "epoch": 0.89, "learning_rate": 1.6315600760517636e-07, "loss": 0.881, "step": 47058 }, { "epoch": 0.89, "learning_rate": 1.6310172845468736e-07, "loss": 0.7291, "step": 47059 }, { "epoch": 0.89, "learning_rate": 1.6304745803010502e-07, "loss": 1.0126, "step": 47060 }, { "epoch": 0.89, "learning_rate": 1.629931963316317e-07, "loss": 0.675, "step": 47061 }, { "epoch": 0.89, "learning_rate": 1.6293894335947025e-07, "loss": 0.861, "step": 47062 }, { "epoch": 0.89, "learning_rate": 1.6288469911382332e-07, "loss": 0.9936, "step": 47063 }, { "epoch": 0.89, "learning_rate": 1.6283046359489267e-07, "loss": 0.989, "step": 47064 }, { "epoch": 0.89, "learning_rate": 1.6277623680288208e-07, "loss": 0.9495, "step": 47065 }, { "epoch": 0.89, "learning_rate": 1.6272201873799297e-07, "loss": 0.8481, "step": 47066 }, { "epoch": 0.89, "learning_rate": 1.6266780940042803e-07, "loss": 0.7641, "step": 47067 }, { "epoch": 0.89, "learning_rate": 1.6261360879039012e-07, "loss": 0.8674, "step": 47068 }, { "epoch": 0.89, "learning_rate": 1.625594169080813e-07, "loss": 0.9853, "step": 47069 }, { "epoch": 0.89, "learning_rate": 1.6250523375370364e-07, "loss": 0.9453, "step": 47070 }, { "epoch": 0.89, "learning_rate": 1.6245105932746003e-07, "loss": 0.8529, "step": 47071 }, { "epoch": 0.89, "learning_rate": 1.623968936295528e-07, "loss": 0.7488, "step": 47072 }, { "epoch": 0.89, "learning_rate": 1.6234273666018318e-07, "loss": 0.8347, "step": 47073 }, { "epoch": 0.89, "learning_rate": 1.6228858841955463e-07, "loss": 0.8613, "step": 47074 }, { "epoch": 0.89, "learning_rate": 1.6223444890786892e-07, "loss": 1.1136, "step": 47075 }, { "epoch": 0.89, "learning_rate": 1.6218031812532758e-07, "loss": 0.9998, "step": 47076 }, { "epoch": 0.89, "learning_rate": 1.6212619607213375e-07, "loss": 0.861, "step": 47077 }, { "epoch": 0.89, "learning_rate": 1.6207208274848895e-07, "loss": 0.9418, "step": 47078 }, { "epoch": 0.89, "learning_rate": 1.6201797815459496e-07, "loss": 0.7918, "step": 47079 }, { "epoch": 0.89, "learning_rate": 1.619638822906544e-07, "loss": 0.8006, "step": 47080 }, { "epoch": 0.89, "learning_rate": 1.6190979515686904e-07, "loss": 1.182, "step": 47081 }, { "epoch": 0.89, "learning_rate": 1.618557167534407e-07, "loss": 0.7097, "step": 47082 }, { "epoch": 0.89, "learning_rate": 1.618016470805714e-07, "loss": 0.8464, "step": 47083 }, { "epoch": 0.89, "learning_rate": 1.6174758613846348e-07, "loss": 0.8686, "step": 47084 }, { "epoch": 0.89, "learning_rate": 1.6169353392731763e-07, "loss": 0.6786, "step": 47085 }, { "epoch": 0.89, "learning_rate": 1.6163949044733728e-07, "loss": 1.1074, "step": 47086 }, { "epoch": 0.89, "learning_rate": 1.6158545569872286e-07, "loss": 1.0134, "step": 47087 }, { "epoch": 0.89, "learning_rate": 1.6153142968167667e-07, "loss": 0.8776, "step": 47088 }, { "epoch": 0.89, "learning_rate": 1.6147741239640054e-07, "loss": 0.9886, "step": 47089 }, { "epoch": 0.89, "learning_rate": 1.614234038430959e-07, "loss": 0.9406, "step": 47090 }, { "epoch": 0.89, "learning_rate": 1.613694040219649e-07, "loss": 1.0375, "step": 47091 }, { "epoch": 0.89, "learning_rate": 1.613154129332084e-07, "loss": 0.8871, "step": 47092 }, { "epoch": 0.89, "learning_rate": 1.612614305770291e-07, "loss": 1.0482, "step": 47093 }, { "epoch": 0.89, "learning_rate": 1.6120745695362705e-07, "loss": 0.954, "step": 47094 }, { "epoch": 0.89, "learning_rate": 1.611534920632049e-07, "loss": 0.7273, "step": 47095 }, { "epoch": 0.89, "learning_rate": 1.6109953590596443e-07, "loss": 0.7336, "step": 47096 }, { "epoch": 0.89, "learning_rate": 1.6104558848210578e-07, "loss": 0.8091, "step": 47097 }, { "epoch": 0.89, "learning_rate": 1.6099164979183206e-07, "loss": 0.7967, "step": 47098 }, { "epoch": 0.89, "learning_rate": 1.6093771983534346e-07, "loss": 0.8968, "step": 47099 }, { "epoch": 0.89, "learning_rate": 1.6088379861284142e-07, "loss": 1.11, "step": 47100 }, { "epoch": 0.89, "learning_rate": 1.6082988612452777e-07, "loss": 0.9732, "step": 47101 }, { "epoch": 0.89, "learning_rate": 1.6077598237060343e-07, "loss": 0.9621, "step": 47102 }, { "epoch": 0.89, "learning_rate": 1.607220873512702e-07, "loss": 0.902, "step": 47103 }, { "epoch": 0.89, "learning_rate": 1.6066820106672876e-07, "loss": 0.7922, "step": 47104 }, { "epoch": 0.89, "learning_rate": 1.6061432351718087e-07, "loss": 0.8911, "step": 47105 }, { "epoch": 0.89, "learning_rate": 1.605604547028264e-07, "loss": 0.9606, "step": 47106 }, { "epoch": 0.89, "learning_rate": 1.6050659462386846e-07, "loss": 1.1442, "step": 47107 }, { "epoch": 0.89, "learning_rate": 1.6045274328050699e-07, "loss": 0.8549, "step": 47108 }, { "epoch": 0.89, "learning_rate": 1.6039890067294284e-07, "loss": 0.8423, "step": 47109 }, { "epoch": 0.89, "learning_rate": 1.6034506680137784e-07, "loss": 0.8828, "step": 47110 }, { "epoch": 0.89, "learning_rate": 1.602912416660124e-07, "loss": 0.7792, "step": 47111 }, { "epoch": 0.89, "learning_rate": 1.6023742526704772e-07, "loss": 0.993, "step": 47112 }, { "epoch": 0.89, "learning_rate": 1.6018361760468476e-07, "loss": 0.96, "step": 47113 }, { "epoch": 0.89, "learning_rate": 1.6012981867912475e-07, "loss": 0.786, "step": 47114 }, { "epoch": 0.89, "learning_rate": 1.600760284905678e-07, "loss": 1.0353, "step": 47115 }, { "epoch": 0.89, "learning_rate": 1.6002224703921543e-07, "loss": 0.8273, "step": 47116 }, { "epoch": 0.89, "learning_rate": 1.5996847432526859e-07, "loss": 0.8127, "step": 47117 }, { "epoch": 0.89, "learning_rate": 1.599147103489268e-07, "loss": 0.7501, "step": 47118 }, { "epoch": 0.89, "learning_rate": 1.5986095511039275e-07, "loss": 0.9195, "step": 47119 }, { "epoch": 0.89, "learning_rate": 1.5980720860986564e-07, "loss": 0.9165, "step": 47120 }, { "epoch": 0.89, "learning_rate": 1.5975347084754678e-07, "loss": 0.8431, "step": 47121 }, { "epoch": 0.89, "learning_rate": 1.5969974182363652e-07, "loss": 0.8921, "step": 47122 }, { "epoch": 0.89, "learning_rate": 1.596460215383358e-07, "loss": 0.6862, "step": 47123 }, { "epoch": 0.89, "learning_rate": 1.5959230999184506e-07, "loss": 1.0376, "step": 47124 }, { "epoch": 0.89, "learning_rate": 1.5953860718436465e-07, "loss": 0.8775, "step": 47125 }, { "epoch": 0.89, "learning_rate": 1.5948491311609609e-07, "loss": 0.8671, "step": 47126 }, { "epoch": 0.89, "learning_rate": 1.5943122778723813e-07, "loss": 0.8528, "step": 47127 }, { "epoch": 0.89, "learning_rate": 1.593775511979928e-07, "loss": 1.0705, "step": 47128 }, { "epoch": 0.89, "learning_rate": 1.5932388334855996e-07, "loss": 1.0503, "step": 47129 }, { "epoch": 0.89, "learning_rate": 1.5927022423913973e-07, "loss": 0.9262, "step": 47130 }, { "epoch": 0.89, "learning_rate": 1.5921657386993278e-07, "loss": 1.0079, "step": 47131 }, { "epoch": 0.89, "learning_rate": 1.5916293224113921e-07, "loss": 1.0187, "step": 47132 }, { "epoch": 0.89, "learning_rate": 1.591092993529597e-07, "loss": 1.0905, "step": 47133 }, { "epoch": 0.89, "learning_rate": 1.5905567520559412e-07, "loss": 0.9005, "step": 47134 }, { "epoch": 0.89, "learning_rate": 1.590020597992434e-07, "loss": 0.8121, "step": 47135 }, { "epoch": 0.89, "learning_rate": 1.5894845313410623e-07, "loss": 0.8984, "step": 47136 }, { "epoch": 0.89, "learning_rate": 1.5889485521038445e-07, "loss": 1.1104, "step": 47137 }, { "epoch": 0.89, "learning_rate": 1.5884126602827758e-07, "loss": 1.1357, "step": 47138 }, { "epoch": 0.89, "learning_rate": 1.5878768558798497e-07, "loss": 0.9348, "step": 47139 }, { "epoch": 0.89, "learning_rate": 1.5873411388970833e-07, "loss": 0.8882, "step": 47140 }, { "epoch": 0.89, "learning_rate": 1.5868055093364614e-07, "loss": 0.8406, "step": 47141 }, { "epoch": 0.89, "learning_rate": 1.586269967199991e-07, "loss": 0.8657, "step": 47142 }, { "epoch": 0.89, "learning_rate": 1.58573451248967e-07, "loss": 0.8793, "step": 47143 }, { "epoch": 0.89, "learning_rate": 1.5851991452074971e-07, "loss": 0.8606, "step": 47144 }, { "epoch": 0.89, "learning_rate": 1.5846638653554736e-07, "loss": 0.6171, "step": 47145 }, { "epoch": 0.89, "learning_rate": 1.5841286729355975e-07, "loss": 0.8035, "step": 47146 }, { "epoch": 0.89, "learning_rate": 1.5835935679498705e-07, "loss": 0.7912, "step": 47147 }, { "epoch": 0.89, "learning_rate": 1.583058550400282e-07, "loss": 0.9701, "step": 47148 }, { "epoch": 0.89, "learning_rate": 1.5825236202888395e-07, "loss": 1.0209, "step": 47149 }, { "epoch": 0.89, "learning_rate": 1.5819887776175325e-07, "loss": 0.9424, "step": 47150 }, { "epoch": 0.89, "learning_rate": 1.5814540223883623e-07, "loss": 0.7928, "step": 47151 }, { "epoch": 0.89, "learning_rate": 1.5809193546033246e-07, "loss": 0.6355, "step": 47152 }, { "epoch": 0.89, "learning_rate": 1.5803847742644153e-07, "loss": 0.9618, "step": 47153 }, { "epoch": 0.89, "learning_rate": 1.5798502813736322e-07, "loss": 0.9915, "step": 47154 }, { "epoch": 0.89, "learning_rate": 1.5793158759329684e-07, "loss": 0.9465, "step": 47155 }, { "epoch": 0.89, "learning_rate": 1.5787815579444254e-07, "loss": 1.0392, "step": 47156 }, { "epoch": 0.89, "learning_rate": 1.5782473274099875e-07, "loss": 0.8495, "step": 47157 }, { "epoch": 0.89, "learning_rate": 1.5777131843316585e-07, "loss": 0.9821, "step": 47158 }, { "epoch": 0.89, "learning_rate": 1.577179128711437e-07, "loss": 0.8814, "step": 47159 }, { "epoch": 0.89, "learning_rate": 1.576645160551299e-07, "loss": 0.8263, "step": 47160 }, { "epoch": 0.89, "learning_rate": 1.5761112798532596e-07, "loss": 0.8983, "step": 47161 }, { "epoch": 0.89, "learning_rate": 1.575577486619298e-07, "loss": 0.9271, "step": 47162 }, { "epoch": 0.89, "learning_rate": 1.5750437808514124e-07, "loss": 1.119, "step": 47163 }, { "epoch": 0.89, "learning_rate": 1.5745101625515928e-07, "loss": 0.8959, "step": 47164 }, { "epoch": 0.89, "learning_rate": 1.573976631721838e-07, "loss": 0.92, "step": 47165 }, { "epoch": 0.89, "learning_rate": 1.5734431883641322e-07, "loss": 0.6631, "step": 47166 }, { "epoch": 0.89, "learning_rate": 1.5729098324804737e-07, "loss": 1.076, "step": 47167 }, { "epoch": 0.89, "learning_rate": 1.5723765640728557e-07, "loss": 1.0234, "step": 47168 }, { "epoch": 0.89, "learning_rate": 1.5718433831432566e-07, "loss": 1.0389, "step": 47169 }, { "epoch": 0.89, "learning_rate": 1.5713102896936838e-07, "loss": 0.6552, "step": 47170 }, { "epoch": 0.89, "learning_rate": 1.5707772837261158e-07, "loss": 1.0897, "step": 47171 }, { "epoch": 0.89, "learning_rate": 1.5702443652425485e-07, "loss": 0.7761, "step": 47172 }, { "epoch": 0.89, "learning_rate": 1.5697115342449692e-07, "loss": 0.7738, "step": 47173 }, { "epoch": 0.89, "learning_rate": 1.569178790735368e-07, "loss": 1.0305, "step": 47174 }, { "epoch": 0.89, "learning_rate": 1.5686461347157373e-07, "loss": 1.0347, "step": 47175 }, { "epoch": 0.89, "learning_rate": 1.568113566188059e-07, "loss": 0.8508, "step": 47176 }, { "epoch": 0.89, "learning_rate": 1.567581085154335e-07, "loss": 0.9322, "step": 47177 }, { "epoch": 0.89, "learning_rate": 1.567048691616535e-07, "loss": 0.7763, "step": 47178 }, { "epoch": 0.89, "learning_rate": 1.566516385576661e-07, "loss": 0.831, "step": 47179 }, { "epoch": 0.89, "learning_rate": 1.5659841670366993e-07, "loss": 0.8926, "step": 47180 }, { "epoch": 0.89, "learning_rate": 1.565452035998627e-07, "loss": 1.1234, "step": 47181 }, { "epoch": 0.89, "learning_rate": 1.564919992464445e-07, "loss": 0.9278, "step": 47182 }, { "epoch": 0.89, "learning_rate": 1.5643880364361292e-07, "loss": 0.9305, "step": 47183 }, { "epoch": 0.89, "learning_rate": 1.5638561679156726e-07, "loss": 0.8798, "step": 47184 }, { "epoch": 0.89, "learning_rate": 1.5633243869050573e-07, "loss": 0.9279, "step": 47185 }, { "epoch": 0.89, "learning_rate": 1.5627926934062677e-07, "loss": 0.8175, "step": 47186 }, { "epoch": 0.89, "learning_rate": 1.5622610874212935e-07, "loss": 1.0509, "step": 47187 }, { "epoch": 0.89, "learning_rate": 1.5617295689521195e-07, "loss": 0.9002, "step": 47188 }, { "epoch": 0.89, "learning_rate": 1.5611981380007302e-07, "loss": 0.7388, "step": 47189 }, { "epoch": 0.89, "learning_rate": 1.5606667945691018e-07, "loss": 0.7473, "step": 47190 }, { "epoch": 0.89, "learning_rate": 1.5601355386592327e-07, "loss": 0.8594, "step": 47191 }, { "epoch": 0.89, "learning_rate": 1.5596043702730935e-07, "loss": 0.9908, "step": 47192 }, { "epoch": 0.89, "learning_rate": 1.5590732894126742e-07, "loss": 1.0178, "step": 47193 }, { "epoch": 0.89, "learning_rate": 1.5585422960799567e-07, "loss": 0.8668, "step": 47194 }, { "epoch": 0.89, "learning_rate": 1.558011390276923e-07, "loss": 0.8357, "step": 47195 }, { "epoch": 0.89, "learning_rate": 1.557480572005557e-07, "loss": 1.0464, "step": 47196 }, { "epoch": 0.89, "learning_rate": 1.556949841267838e-07, "loss": 0.9113, "step": 47197 }, { "epoch": 0.89, "learning_rate": 1.5564191980657533e-07, "loss": 0.6594, "step": 47198 }, { "epoch": 0.89, "learning_rate": 1.5558886424012737e-07, "loss": 0.985, "step": 47199 }, { "epoch": 0.89, "learning_rate": 1.555358174276392e-07, "loss": 1.0195, "step": 47200 }, { "epoch": 0.89, "learning_rate": 1.5548277936930868e-07, "loss": 0.9361, "step": 47201 }, { "epoch": 0.89, "learning_rate": 1.554297500653329e-07, "loss": 0.6924, "step": 47202 }, { "epoch": 0.89, "learning_rate": 1.5537672951591114e-07, "loss": 0.6772, "step": 47203 }, { "epoch": 0.89, "learning_rate": 1.553237177212405e-07, "loss": 0.7907, "step": 47204 }, { "epoch": 0.89, "learning_rate": 1.5527071468151912e-07, "loss": 1.1902, "step": 47205 }, { "epoch": 0.89, "learning_rate": 1.5521772039694515e-07, "loss": 0.9815, "step": 47206 }, { "epoch": 0.89, "learning_rate": 1.5516473486771626e-07, "loss": 0.9977, "step": 47207 }, { "epoch": 0.89, "learning_rate": 1.5511175809403033e-07, "loss": 0.8083, "step": 47208 }, { "epoch": 0.89, "learning_rate": 1.5505879007608526e-07, "loss": 0.8169, "step": 47209 }, { "epoch": 0.89, "learning_rate": 1.5500583081407894e-07, "loss": 0.7715, "step": 47210 }, { "epoch": 0.89, "learning_rate": 1.5495288030820844e-07, "loss": 0.9736, "step": 47211 }, { "epoch": 0.89, "learning_rate": 1.5489993855867273e-07, "loss": 1.1264, "step": 47212 }, { "epoch": 0.89, "learning_rate": 1.548470055656681e-07, "loss": 0.816, "step": 47213 }, { "epoch": 0.89, "learning_rate": 1.5479408132939328e-07, "loss": 0.8, "step": 47214 }, { "epoch": 0.89, "learning_rate": 1.54741165850045e-07, "loss": 0.962, "step": 47215 }, { "epoch": 0.89, "learning_rate": 1.5468825912782177e-07, "loss": 0.8876, "step": 47216 }, { "epoch": 0.89, "learning_rate": 1.5463536116292032e-07, "loss": 0.8354, "step": 47217 }, { "epoch": 0.89, "learning_rate": 1.545824719555386e-07, "loss": 0.9551, "step": 47218 }, { "epoch": 0.89, "learning_rate": 1.5452959150587449e-07, "loss": 0.9263, "step": 47219 }, { "epoch": 0.89, "learning_rate": 1.5447671981412394e-07, "loss": 1.0446, "step": 47220 }, { "epoch": 0.89, "learning_rate": 1.5442385688048595e-07, "loss": 0.844, "step": 47221 }, { "epoch": 0.89, "learning_rate": 1.5437100270515787e-07, "loss": 0.8412, "step": 47222 }, { "epoch": 0.89, "learning_rate": 1.5431815728833566e-07, "loss": 0.721, "step": 47223 }, { "epoch": 0.89, "learning_rate": 1.5426532063021833e-07, "loss": 1.0806, "step": 47224 }, { "epoch": 0.89, "learning_rate": 1.5421249273100208e-07, "loss": 0.9419, "step": 47225 }, { "epoch": 0.89, "learning_rate": 1.5415967359088428e-07, "loss": 0.8067, "step": 47226 }, { "epoch": 0.89, "learning_rate": 1.5410686321006258e-07, "loss": 0.7954, "step": 47227 }, { "epoch": 0.89, "learning_rate": 1.540540615887337e-07, "loss": 0.965, "step": 47228 }, { "epoch": 0.89, "learning_rate": 1.5400126872709504e-07, "loss": 0.6987, "step": 47229 }, { "epoch": 0.89, "learning_rate": 1.5394848462534362e-07, "loss": 1.0891, "step": 47230 }, { "epoch": 0.89, "learning_rate": 1.5389570928367736e-07, "loss": 1.0485, "step": 47231 }, { "epoch": 0.89, "learning_rate": 1.5384294270229139e-07, "loss": 1.0502, "step": 47232 }, { "epoch": 0.89, "learning_rate": 1.5379018488138499e-07, "loss": 0.988, "step": 47233 }, { "epoch": 0.89, "learning_rate": 1.537374358211538e-07, "loss": 0.9908, "step": 47234 }, { "epoch": 0.89, "learning_rate": 1.5368469552179495e-07, "loss": 0.8246, "step": 47235 }, { "epoch": 0.89, "learning_rate": 1.5363196398350545e-07, "loss": 1.0001, "step": 47236 }, { "epoch": 0.89, "learning_rate": 1.535792412064824e-07, "loss": 1.2214, "step": 47237 }, { "epoch": 0.89, "learning_rate": 1.5352652719092226e-07, "loss": 0.9092, "step": 47238 }, { "epoch": 0.89, "learning_rate": 1.5347382193702242e-07, "loss": 0.9023, "step": 47239 }, { "epoch": 0.89, "learning_rate": 1.5342112544497966e-07, "loss": 0.882, "step": 47240 }, { "epoch": 0.89, "learning_rate": 1.5336843771498967e-07, "loss": 0.8807, "step": 47241 }, { "epoch": 0.89, "learning_rate": 1.5331575874725029e-07, "loss": 0.8766, "step": 47242 }, { "epoch": 0.89, "learning_rate": 1.5326308854195838e-07, "loss": 1.0181, "step": 47243 }, { "epoch": 0.89, "learning_rate": 1.5321042709930929e-07, "loss": 0.9243, "step": 47244 }, { "epoch": 0.89, "learning_rate": 1.5315777441950146e-07, "loss": 0.8995, "step": 47245 }, { "epoch": 0.89, "learning_rate": 1.5310513050273008e-07, "loss": 0.7402, "step": 47246 }, { "epoch": 0.89, "learning_rate": 1.5305249534919215e-07, "loss": 0.7732, "step": 47247 }, { "epoch": 0.89, "learning_rate": 1.529998689590842e-07, "loss": 0.9265, "step": 47248 }, { "epoch": 0.89, "learning_rate": 1.52947251332603e-07, "loss": 0.901, "step": 47249 }, { "epoch": 0.89, "learning_rate": 1.5289464246994456e-07, "loss": 1.0107, "step": 47250 }, { "epoch": 0.89, "learning_rate": 1.5284204237130563e-07, "loss": 0.7729, "step": 47251 }, { "epoch": 0.89, "learning_rate": 1.5278945103688297e-07, "loss": 0.8768, "step": 47252 }, { "epoch": 0.89, "learning_rate": 1.5273686846687175e-07, "loss": 1.0717, "step": 47253 }, { "epoch": 0.89, "learning_rate": 1.5268429466146984e-07, "loss": 0.8046, "step": 47254 }, { "epoch": 0.89, "learning_rate": 1.5263172962087235e-07, "loss": 0.9989, "step": 47255 }, { "epoch": 0.89, "learning_rate": 1.5257917334527612e-07, "loss": 0.8154, "step": 47256 }, { "epoch": 0.89, "learning_rate": 1.5252662583487733e-07, "loss": 0.8759, "step": 47257 }, { "epoch": 0.89, "learning_rate": 1.5247408708987222e-07, "loss": 0.8033, "step": 47258 }, { "epoch": 0.89, "learning_rate": 1.5242155711045674e-07, "loss": 0.9644, "step": 47259 }, { "epoch": 0.89, "learning_rate": 1.5236903589682716e-07, "loss": 0.793, "step": 47260 }, { "epoch": 0.89, "learning_rate": 1.5231652344917997e-07, "loss": 0.8566, "step": 47261 }, { "epoch": 0.89, "learning_rate": 1.5226401976771028e-07, "loss": 1.0438, "step": 47262 }, { "epoch": 0.89, "learning_rate": 1.5221152485261488e-07, "loss": 0.9826, "step": 47263 }, { "epoch": 0.89, "learning_rate": 1.5215903870409027e-07, "loss": 1.0132, "step": 47264 }, { "epoch": 0.89, "learning_rate": 1.5210656132233103e-07, "loss": 0.7962, "step": 47265 }, { "epoch": 0.89, "learning_rate": 1.5205409270753478e-07, "loss": 0.8687, "step": 47266 }, { "epoch": 0.89, "learning_rate": 1.520016328598961e-07, "loss": 0.7878, "step": 47267 }, { "epoch": 0.89, "learning_rate": 1.5194918177961122e-07, "loss": 1.1941, "step": 47268 }, { "epoch": 0.89, "learning_rate": 1.5189673946687604e-07, "loss": 0.8488, "step": 47269 }, { "epoch": 0.89, "learning_rate": 1.5184430592188659e-07, "loss": 1.0742, "step": 47270 }, { "epoch": 0.89, "learning_rate": 1.517918811448385e-07, "loss": 0.9178, "step": 47271 }, { "epoch": 0.89, "learning_rate": 1.5173946513592748e-07, "loss": 0.8478, "step": 47272 }, { "epoch": 0.89, "learning_rate": 1.5168705789534971e-07, "loss": 0.8401, "step": 47273 }, { "epoch": 0.89, "learning_rate": 1.516346594232998e-07, "loss": 0.9991, "step": 47274 }, { "epoch": 0.89, "learning_rate": 1.515822697199748e-07, "loss": 1.1226, "step": 47275 }, { "epoch": 0.89, "learning_rate": 1.51529888785569e-07, "loss": 0.8476, "step": 47276 }, { "epoch": 0.89, "learning_rate": 1.5147751662027865e-07, "loss": 0.9464, "step": 47277 }, { "epoch": 0.89, "learning_rate": 1.514251532242994e-07, "loss": 1.0831, "step": 47278 }, { "epoch": 0.89, "learning_rate": 1.5137279859782667e-07, "loss": 0.7729, "step": 47279 }, { "epoch": 0.89, "learning_rate": 1.513204527410561e-07, "loss": 0.9925, "step": 47280 }, { "epoch": 0.89, "learning_rate": 1.512681156541823e-07, "loss": 0.9693, "step": 47281 }, { "epoch": 0.89, "learning_rate": 1.5121578733740207e-07, "loss": 0.8259, "step": 47282 }, { "epoch": 0.89, "learning_rate": 1.5116346779090962e-07, "loss": 0.8152, "step": 47283 }, { "epoch": 0.89, "learning_rate": 1.5111115701490042e-07, "loss": 0.7678, "step": 47284 }, { "epoch": 0.89, "learning_rate": 1.5105885500957095e-07, "loss": 0.8055, "step": 47285 }, { "epoch": 0.89, "learning_rate": 1.5100656177511524e-07, "loss": 0.7746, "step": 47286 }, { "epoch": 0.89, "learning_rate": 1.5095427731172897e-07, "loss": 1.0091, "step": 47287 }, { "epoch": 0.89, "learning_rate": 1.509020016196075e-07, "loss": 0.8476, "step": 47288 }, { "epoch": 0.89, "learning_rate": 1.5084973469894598e-07, "loss": 0.9261, "step": 47289 }, { "epoch": 0.89, "learning_rate": 1.5079747654993953e-07, "loss": 1.0192, "step": 47290 }, { "epoch": 0.89, "learning_rate": 1.5074522717278328e-07, "loss": 0.9555, "step": 47291 }, { "epoch": 0.89, "learning_rate": 1.5069298656767263e-07, "loss": 1.0058, "step": 47292 }, { "epoch": 0.89, "learning_rate": 1.5064075473480154e-07, "loss": 1.0222, "step": 47293 }, { "epoch": 0.89, "learning_rate": 1.505885316743666e-07, "loss": 0.7871, "step": 47294 }, { "epoch": 0.89, "learning_rate": 1.5053631738656178e-07, "loss": 0.884, "step": 47295 }, { "epoch": 0.89, "learning_rate": 1.5048411187158218e-07, "loss": 0.7274, "step": 47296 }, { "epoch": 0.89, "learning_rate": 1.5043191512962295e-07, "loss": 0.8517, "step": 47297 }, { "epoch": 0.89, "learning_rate": 1.5037972716087894e-07, "loss": 0.7312, "step": 47298 }, { "epoch": 0.89, "learning_rate": 1.50327547965545e-07, "loss": 0.7924, "step": 47299 }, { "epoch": 0.89, "learning_rate": 1.5027537754381567e-07, "loss": 1.2583, "step": 47300 }, { "epoch": 0.89, "learning_rate": 1.5022321589588662e-07, "loss": 0.8575, "step": 47301 }, { "epoch": 0.89, "learning_rate": 1.5017106302195133e-07, "loss": 0.9254, "step": 47302 }, { "epoch": 0.89, "learning_rate": 1.5011891892220603e-07, "loss": 1.0429, "step": 47303 }, { "epoch": 0.89, "learning_rate": 1.500667835968442e-07, "loss": 0.893, "step": 47304 }, { "epoch": 0.89, "learning_rate": 1.500146570460606e-07, "loss": 1.0153, "step": 47305 }, { "epoch": 0.89, "learning_rate": 1.49962539270051e-07, "loss": 0.9614, "step": 47306 }, { "epoch": 0.89, "learning_rate": 1.4991043026900882e-07, "loss": 1.0122, "step": 47307 }, { "epoch": 0.89, "learning_rate": 1.4985833004312888e-07, "loss": 0.9071, "step": 47308 }, { "epoch": 0.89, "learning_rate": 1.4980623859260606e-07, "loss": 0.81, "step": 47309 }, { "epoch": 0.89, "learning_rate": 1.4975415591763464e-07, "loss": 0.9465, "step": 47310 }, { "epoch": 0.89, "learning_rate": 1.4970208201840918e-07, "loss": 0.8868, "step": 47311 }, { "epoch": 0.89, "learning_rate": 1.4965001689512398e-07, "loss": 1.031, "step": 47312 }, { "epoch": 0.89, "learning_rate": 1.4959796054797388e-07, "loss": 0.9169, "step": 47313 }, { "epoch": 0.89, "learning_rate": 1.4954591297715233e-07, "loss": 0.7939, "step": 47314 }, { "epoch": 0.89, "learning_rate": 1.4949387418285498e-07, "loss": 0.8866, "step": 47315 }, { "epoch": 0.89, "learning_rate": 1.4944184416527507e-07, "loss": 0.76, "step": 47316 }, { "epoch": 0.89, "learning_rate": 1.4938982292460714e-07, "loss": 0.7705, "step": 47317 }, { "epoch": 0.89, "learning_rate": 1.4933781046104573e-07, "loss": 0.8969, "step": 47318 }, { "epoch": 0.89, "learning_rate": 1.492858067747849e-07, "loss": 1.2332, "step": 47319 }, { "epoch": 0.89, "learning_rate": 1.492338118660186e-07, "loss": 0.8066, "step": 47320 }, { "epoch": 0.89, "learning_rate": 1.4918182573494118e-07, "loss": 0.8726, "step": 47321 }, { "epoch": 0.89, "learning_rate": 1.4912984838174715e-07, "loss": 0.7118, "step": 47322 }, { "epoch": 0.89, "learning_rate": 1.4907787980662947e-07, "loss": 0.9721, "step": 47323 }, { "epoch": 0.89, "learning_rate": 1.490259200097838e-07, "loss": 0.8851, "step": 47324 }, { "epoch": 0.89, "learning_rate": 1.489739689914027e-07, "loss": 1.213, "step": 47325 }, { "epoch": 0.89, "learning_rate": 1.4892202675168028e-07, "loss": 0.8013, "step": 47326 }, { "epoch": 0.89, "learning_rate": 1.4887009329081188e-07, "loss": 0.8085, "step": 47327 }, { "epoch": 0.89, "learning_rate": 1.4881816860898985e-07, "loss": 0.8579, "step": 47328 }, { "epoch": 0.89, "learning_rate": 1.4876625270640876e-07, "loss": 0.8071, "step": 47329 }, { "epoch": 0.89, "learning_rate": 1.4871434558326236e-07, "loss": 0.921, "step": 47330 }, { "epoch": 0.89, "learning_rate": 1.4866244723974465e-07, "loss": 1.1503, "step": 47331 }, { "epoch": 0.89, "learning_rate": 1.4861055767604938e-07, "loss": 1.1472, "step": 47332 }, { "epoch": 0.89, "learning_rate": 1.4855867689236998e-07, "loss": 0.9417, "step": 47333 }, { "epoch": 0.89, "learning_rate": 1.4850680488890073e-07, "loss": 0.9043, "step": 47334 }, { "epoch": 0.89, "learning_rate": 1.484549416658343e-07, "loss": 0.7415, "step": 47335 }, { "epoch": 0.89, "learning_rate": 1.4840308722336577e-07, "loss": 0.705, "step": 47336 }, { "epoch": 0.89, "learning_rate": 1.483512415616875e-07, "loss": 1.0869, "step": 47337 }, { "epoch": 0.89, "learning_rate": 1.482994046809938e-07, "loss": 1.2131, "step": 47338 }, { "epoch": 0.89, "learning_rate": 1.482475765814781e-07, "loss": 0.925, "step": 47339 }, { "epoch": 0.89, "learning_rate": 1.4819575726333357e-07, "loss": 0.9579, "step": 47340 }, { "epoch": 0.89, "learning_rate": 1.4814394672675397e-07, "loss": 0.9973, "step": 47341 }, { "epoch": 0.89, "learning_rate": 1.4809214497193303e-07, "loss": 0.7362, "step": 47342 }, { "epoch": 0.89, "learning_rate": 1.480403519990642e-07, "loss": 0.8296, "step": 47343 }, { "epoch": 0.89, "learning_rate": 1.4798856780833954e-07, "loss": 1.0722, "step": 47344 }, { "epoch": 0.89, "learning_rate": 1.4793679239995445e-07, "loss": 0.725, "step": 47345 }, { "epoch": 0.89, "learning_rate": 1.4788502577410102e-07, "loss": 0.7803, "step": 47346 }, { "epoch": 0.89, "learning_rate": 1.4783326793097213e-07, "loss": 1.0239, "step": 47347 }, { "epoch": 0.89, "learning_rate": 1.4778151887076265e-07, "loss": 0.7697, "step": 47348 }, { "epoch": 0.89, "learning_rate": 1.4772977859366432e-07, "loss": 0.8209, "step": 47349 }, { "epoch": 0.89, "learning_rate": 1.4767804709987095e-07, "loss": 1.0083, "step": 47350 }, { "epoch": 0.89, "learning_rate": 1.4762632438957564e-07, "loss": 0.9286, "step": 47351 }, { "epoch": 0.89, "learning_rate": 1.4757461046297162e-07, "loss": 0.9716, "step": 47352 }, { "epoch": 0.89, "learning_rate": 1.4752290532025177e-07, "loss": 1.0281, "step": 47353 }, { "epoch": 0.89, "learning_rate": 1.4747120896160927e-07, "loss": 0.8611, "step": 47354 }, { "epoch": 0.89, "learning_rate": 1.474195213872376e-07, "loss": 0.9404, "step": 47355 }, { "epoch": 0.89, "learning_rate": 1.4736784259732823e-07, "loss": 1.0184, "step": 47356 }, { "epoch": 0.89, "learning_rate": 1.473161725920763e-07, "loss": 0.706, "step": 47357 }, { "epoch": 0.89, "learning_rate": 1.4726451137167307e-07, "loss": 1.0451, "step": 47358 }, { "epoch": 0.89, "learning_rate": 1.4721285893631226e-07, "loss": 0.8381, "step": 47359 }, { "epoch": 0.89, "learning_rate": 1.4716121528618622e-07, "loss": 0.8391, "step": 47360 }, { "epoch": 0.89, "learning_rate": 1.4710958042148837e-07, "loss": 0.679, "step": 47361 }, { "epoch": 0.89, "learning_rate": 1.4705795434241083e-07, "loss": 1.0046, "step": 47362 }, { "epoch": 0.89, "learning_rate": 1.4700633704914701e-07, "loss": 0.8455, "step": 47363 }, { "epoch": 0.89, "learning_rate": 1.4695472854188957e-07, "loss": 0.9293, "step": 47364 }, { "epoch": 0.89, "learning_rate": 1.4690312882083058e-07, "loss": 0.7506, "step": 47365 }, { "epoch": 0.89, "learning_rate": 1.4685153788616374e-07, "loss": 0.9272, "step": 47366 }, { "epoch": 0.89, "learning_rate": 1.467999557380806e-07, "loss": 1.1526, "step": 47367 }, { "epoch": 0.89, "learning_rate": 1.4674838237677401e-07, "loss": 1.0266, "step": 47368 }, { "epoch": 0.89, "learning_rate": 1.4669681780243778e-07, "loss": 0.9579, "step": 47369 }, { "epoch": 0.89, "learning_rate": 1.466452620152628e-07, "loss": 0.966, "step": 47370 }, { "epoch": 0.89, "learning_rate": 1.4659371501544228e-07, "loss": 0.723, "step": 47371 }, { "epoch": 0.89, "learning_rate": 1.4654217680316884e-07, "loss": 0.8134, "step": 47372 }, { "epoch": 0.89, "learning_rate": 1.4649064737863455e-07, "loss": 1.1525, "step": 47373 }, { "epoch": 0.89, "learning_rate": 1.4643912674203203e-07, "loss": 1.1578, "step": 47374 }, { "epoch": 0.89, "learning_rate": 1.463876148935539e-07, "loss": 1.078, "step": 47375 }, { "epoch": 0.89, "learning_rate": 1.4633611183339251e-07, "loss": 0.7685, "step": 47376 }, { "epoch": 0.89, "learning_rate": 1.4628461756173912e-07, "loss": 0.9569, "step": 47377 }, { "epoch": 0.89, "learning_rate": 1.4623313207878742e-07, "loss": 0.887, "step": 47378 }, { "epoch": 0.89, "learning_rate": 1.4618165538472895e-07, "loss": 0.6956, "step": 47379 }, { "epoch": 0.89, "learning_rate": 1.4613018747975577e-07, "loss": 0.808, "step": 47380 }, { "epoch": 0.89, "learning_rate": 1.4607872836406023e-07, "loss": 0.9919, "step": 47381 }, { "epoch": 0.89, "learning_rate": 1.4602727803783494e-07, "loss": 0.9946, "step": 47382 }, { "epoch": 0.89, "learning_rate": 1.4597583650127118e-07, "loss": 1.0448, "step": 47383 }, { "epoch": 0.89, "learning_rate": 1.459244037545618e-07, "loss": 0.7104, "step": 47384 }, { "epoch": 0.89, "learning_rate": 1.458729797978986e-07, "loss": 0.8911, "step": 47385 }, { "epoch": 0.89, "learning_rate": 1.4582156463147312e-07, "loss": 0.7512, "step": 47386 }, { "epoch": 0.89, "learning_rate": 1.4577015825547824e-07, "loss": 0.9546, "step": 47387 }, { "epoch": 0.89, "learning_rate": 1.4571876067010493e-07, "loss": 0.8242, "step": 47388 }, { "epoch": 0.89, "learning_rate": 1.4566737187554553e-07, "loss": 0.9078, "step": 47389 }, { "epoch": 0.89, "learning_rate": 1.4561599187199264e-07, "loss": 1.166, "step": 47390 }, { "epoch": 0.89, "learning_rate": 1.45564620659637e-07, "loss": 0.6931, "step": 47391 }, { "epoch": 0.89, "learning_rate": 1.4551325823867064e-07, "loss": 0.9871, "step": 47392 }, { "epoch": 0.89, "learning_rate": 1.454619046092859e-07, "loss": 1.0283, "step": 47393 }, { "epoch": 0.89, "learning_rate": 1.454105597716743e-07, "loss": 1.01, "step": 47394 }, { "epoch": 0.89, "learning_rate": 1.4535922372602708e-07, "loss": 0.9227, "step": 47395 }, { "epoch": 0.89, "learning_rate": 1.4530789647253656e-07, "loss": 0.9254, "step": 47396 }, { "epoch": 0.89, "learning_rate": 1.452565780113946e-07, "loss": 0.9174, "step": 47397 }, { "epoch": 0.89, "learning_rate": 1.4520526834279154e-07, "loss": 0.863, "step": 47398 }, { "epoch": 0.89, "learning_rate": 1.4515396746692058e-07, "loss": 0.9713, "step": 47399 }, { "epoch": 0.89, "learning_rate": 1.451026753839721e-07, "loss": 1.1823, "step": 47400 }, { "epoch": 0.89, "learning_rate": 1.4505139209413822e-07, "loss": 0.8365, "step": 47401 }, { "epoch": 0.89, "learning_rate": 1.4500011759761014e-07, "loss": 0.8099, "step": 47402 }, { "epoch": 0.89, "learning_rate": 1.4494885189457908e-07, "loss": 1.0256, "step": 47403 }, { "epoch": 0.89, "learning_rate": 1.4489759498523713e-07, "loss": 1.0127, "step": 47404 }, { "epoch": 0.89, "learning_rate": 1.448463468697753e-07, "loss": 0.9684, "step": 47405 }, { "epoch": 0.89, "learning_rate": 1.4479510754838526e-07, "loss": 0.9313, "step": 47406 }, { "epoch": 0.89, "learning_rate": 1.4474387702125753e-07, "loss": 1.0258, "step": 47407 }, { "epoch": 0.89, "learning_rate": 1.4469265528858468e-07, "loss": 0.8427, "step": 47408 }, { "epoch": 0.89, "learning_rate": 1.4464144235055683e-07, "loss": 0.8529, "step": 47409 }, { "epoch": 0.89, "learning_rate": 1.4459023820736522e-07, "loss": 1.0714, "step": 47410 }, { "epoch": 0.89, "learning_rate": 1.4453904285920194e-07, "loss": 1.0925, "step": 47411 }, { "epoch": 0.89, "learning_rate": 1.4448785630625768e-07, "loss": 1.2046, "step": 47412 }, { "epoch": 0.89, "learning_rate": 1.4443667854872333e-07, "loss": 0.7826, "step": 47413 }, { "epoch": 0.89, "learning_rate": 1.443855095867902e-07, "loss": 0.9992, "step": 47414 }, { "epoch": 0.89, "learning_rate": 1.443343494206495e-07, "loss": 0.7668, "step": 47415 }, { "epoch": 0.89, "learning_rate": 1.442831980504919e-07, "loss": 0.8112, "step": 47416 }, { "epoch": 0.89, "learning_rate": 1.4423205547650866e-07, "loss": 0.9573, "step": 47417 }, { "epoch": 0.89, "learning_rate": 1.4418092169889124e-07, "loss": 0.9416, "step": 47418 }, { "epoch": 0.89, "learning_rate": 1.44129796717829e-07, "loss": 0.8418, "step": 47419 }, { "epoch": 0.89, "learning_rate": 1.4407868053351483e-07, "loss": 0.8297, "step": 47420 }, { "epoch": 0.89, "learning_rate": 1.4402757314613823e-07, "loss": 0.9285, "step": 47421 }, { "epoch": 0.89, "learning_rate": 1.4397647455589053e-07, "loss": 0.7656, "step": 47422 }, { "epoch": 0.89, "learning_rate": 1.4392538476296236e-07, "loss": 0.8621, "step": 47423 }, { "epoch": 0.89, "learning_rate": 1.438743037675444e-07, "loss": 0.9208, "step": 47424 }, { "epoch": 0.89, "learning_rate": 1.4382323156982765e-07, "loss": 0.8374, "step": 47425 }, { "epoch": 0.89, "learning_rate": 1.4377216817000271e-07, "loss": 0.928, "step": 47426 }, { "epoch": 0.89, "learning_rate": 1.4372111356826062e-07, "loss": 0.9, "step": 47427 }, { "epoch": 0.89, "learning_rate": 1.436700677647909e-07, "loss": 0.7658, "step": 47428 }, { "epoch": 0.89, "learning_rate": 1.4361903075978568e-07, "loss": 0.9272, "step": 47429 }, { "epoch": 0.89, "learning_rate": 1.4356800255343445e-07, "loss": 0.9539, "step": 47430 }, { "epoch": 0.89, "learning_rate": 1.4351698314592765e-07, "loss": 1.247, "step": 47431 }, { "epoch": 0.89, "learning_rate": 1.434659725374568e-07, "loss": 0.8257, "step": 47432 }, { "epoch": 0.89, "learning_rate": 1.4341497072821147e-07, "loss": 0.8578, "step": 47433 }, { "epoch": 0.89, "learning_rate": 1.4336397771838234e-07, "loss": 0.7708, "step": 47434 }, { "epoch": 0.89, "learning_rate": 1.433129935081601e-07, "loss": 0.7198, "step": 47435 }, { "epoch": 0.89, "learning_rate": 1.4326201809773454e-07, "loss": 0.8477, "step": 47436 }, { "epoch": 0.89, "learning_rate": 1.432110514872964e-07, "loss": 1.1872, "step": 47437 }, { "epoch": 0.9, "learning_rate": 1.431600936770361e-07, "loss": 0.9465, "step": 47438 }, { "epoch": 0.9, "learning_rate": 1.43109144667144e-07, "loss": 1.0518, "step": 47439 }, { "epoch": 0.9, "learning_rate": 1.4305820445780938e-07, "loss": 0.7844, "step": 47440 }, { "epoch": 0.9, "learning_rate": 1.4300727304922406e-07, "loss": 0.86, "step": 47441 }, { "epoch": 0.9, "learning_rate": 1.429563504415768e-07, "loss": 1.0107, "step": 47442 }, { "epoch": 0.9, "learning_rate": 1.4290543663505823e-07, "loss": 1.0173, "step": 47443 }, { "epoch": 0.9, "learning_rate": 1.4285453162985853e-07, "loss": 0.9062, "step": 47444 }, { "epoch": 0.9, "learning_rate": 1.4280363542616775e-07, "loss": 1.0877, "step": 47445 }, { "epoch": 0.9, "learning_rate": 1.4275274802417582e-07, "loss": 0.9368, "step": 47446 }, { "epoch": 0.9, "learning_rate": 1.4270186942407282e-07, "loss": 0.9531, "step": 47447 }, { "epoch": 0.9, "learning_rate": 1.4265099962604946e-07, "loss": 0.7681, "step": 47448 }, { "epoch": 0.9, "learning_rate": 1.4260013863029388e-07, "loss": 1.0047, "step": 47449 }, { "epoch": 0.9, "learning_rate": 1.425492864369979e-07, "loss": 1.0574, "step": 47450 }, { "epoch": 0.9, "learning_rate": 1.4249844304635052e-07, "loss": 1.0814, "step": 47451 }, { "epoch": 0.9, "learning_rate": 1.4244760845854106e-07, "loss": 0.8713, "step": 47452 }, { "epoch": 0.9, "learning_rate": 1.4239678267376072e-07, "loss": 0.8283, "step": 47453 }, { "epoch": 0.9, "learning_rate": 1.42345965692198e-07, "loss": 0.8293, "step": 47454 }, { "epoch": 0.9, "learning_rate": 1.4229515751404355e-07, "loss": 0.9393, "step": 47455 }, { "epoch": 0.9, "learning_rate": 1.4224435813948638e-07, "loss": 1.1478, "step": 47456 }, { "epoch": 0.9, "learning_rate": 1.421935675687164e-07, "loss": 0.9142, "step": 47457 }, { "epoch": 0.9, "learning_rate": 1.4214278580192364e-07, "loss": 0.7964, "step": 47458 }, { "epoch": 0.9, "learning_rate": 1.420920128392972e-07, "loss": 0.9608, "step": 47459 }, { "epoch": 0.9, "learning_rate": 1.4204124868102743e-07, "loss": 0.912, "step": 47460 }, { "epoch": 0.9, "learning_rate": 1.4199049332730254e-07, "loss": 0.8654, "step": 47461 }, { "epoch": 0.9, "learning_rate": 1.4193974677831345e-07, "loss": 1.2994, "step": 47462 }, { "epoch": 0.9, "learning_rate": 1.4188900903424897e-07, "loss": 0.9804, "step": 47463 }, { "epoch": 0.9, "learning_rate": 1.418382800952983e-07, "loss": 1.0197, "step": 47464 }, { "epoch": 0.9, "learning_rate": 1.417875599616514e-07, "loss": 0.8323, "step": 47465 }, { "epoch": 0.9, "learning_rate": 1.4173684863349745e-07, "loss": 0.9312, "step": 47466 }, { "epoch": 0.9, "learning_rate": 1.4168614611102555e-07, "loss": 0.8889, "step": 47467 }, { "epoch": 0.9, "learning_rate": 1.416354523944255e-07, "loss": 0.8594, "step": 47468 }, { "epoch": 0.9, "learning_rate": 1.4158476748388688e-07, "loss": 0.8735, "step": 47469 }, { "epoch": 0.9, "learning_rate": 1.4153409137959733e-07, "loss": 0.93, "step": 47470 }, { "epoch": 0.9, "learning_rate": 1.4148342408174808e-07, "loss": 0.951, "step": 47471 }, { "epoch": 0.9, "learning_rate": 1.4143276559052703e-07, "loss": 0.9597, "step": 47472 }, { "epoch": 0.9, "learning_rate": 1.4138211590612348e-07, "loss": 0.8172, "step": 47473 }, { "epoch": 0.9, "learning_rate": 1.413314750287273e-07, "loss": 0.9023, "step": 47474 }, { "epoch": 0.9, "learning_rate": 1.412808429585269e-07, "loss": 1.1611, "step": 47475 }, { "epoch": 0.9, "learning_rate": 1.4123021969571133e-07, "loss": 0.7421, "step": 47476 }, { "epoch": 0.9, "learning_rate": 1.4117960524046987e-07, "loss": 0.8458, "step": 47477 }, { "epoch": 0.9, "learning_rate": 1.4112899959299153e-07, "loss": 0.8593, "step": 47478 }, { "epoch": 0.9, "learning_rate": 1.4107840275346507e-07, "loss": 0.8718, "step": 47479 }, { "epoch": 0.9, "learning_rate": 1.4102781472207978e-07, "loss": 0.9673, "step": 47480 }, { "epoch": 0.9, "learning_rate": 1.4097723549902436e-07, "loss": 0.9871, "step": 47481 }, { "epoch": 0.9, "learning_rate": 1.4092666508448704e-07, "loss": 1.0421, "step": 47482 }, { "epoch": 0.9, "learning_rate": 1.4087610347865792e-07, "loss": 1.054, "step": 47483 }, { "epoch": 0.9, "learning_rate": 1.4082555068172465e-07, "loss": 1.1429, "step": 47484 }, { "epoch": 0.9, "learning_rate": 1.407750066938765e-07, "loss": 0.9026, "step": 47485 }, { "epoch": 0.9, "learning_rate": 1.407244715153022e-07, "loss": 1.0423, "step": 47486 }, { "epoch": 0.9, "learning_rate": 1.4067394514619026e-07, "loss": 1.0842, "step": 47487 }, { "epoch": 0.9, "learning_rate": 1.4062342758672965e-07, "loss": 0.9025, "step": 47488 }, { "epoch": 0.9, "learning_rate": 1.4057291883710854e-07, "loss": 0.6796, "step": 47489 }, { "epoch": 0.9, "learning_rate": 1.4052241889751627e-07, "loss": 0.8732, "step": 47490 }, { "epoch": 0.9, "learning_rate": 1.4047192776814045e-07, "loss": 0.7798, "step": 47491 }, { "epoch": 0.9, "learning_rate": 1.4042144544917062e-07, "loss": 0.857, "step": 47492 }, { "epoch": 0.9, "learning_rate": 1.4037097194079447e-07, "loss": 0.8607, "step": 47493 }, { "epoch": 0.9, "learning_rate": 1.403205072432004e-07, "loss": 1.137, "step": 47494 }, { "epoch": 0.9, "learning_rate": 1.40270051356578e-07, "loss": 0.8863, "step": 47495 }, { "epoch": 0.9, "learning_rate": 1.4021960428111437e-07, "loss": 0.93, "step": 47496 }, { "epoch": 0.9, "learning_rate": 1.4016916601699848e-07, "loss": 0.7395, "step": 47497 }, { "epoch": 0.9, "learning_rate": 1.4011873656441853e-07, "loss": 0.7907, "step": 47498 }, { "epoch": 0.9, "learning_rate": 1.4006831592356273e-07, "loss": 1.079, "step": 47499 }, { "epoch": 0.9, "learning_rate": 1.400179040946198e-07, "loss": 1.1629, "step": 47500 }, { "epoch": 0.9, "learning_rate": 1.3996750107777733e-07, "loss": 1.0729, "step": 47501 }, { "epoch": 0.9, "learning_rate": 1.399171068732244e-07, "loss": 0.7365, "step": 47502 }, { "epoch": 0.9, "learning_rate": 1.3986672148114805e-07, "loss": 0.9711, "step": 47503 }, { "epoch": 0.9, "learning_rate": 1.3981634490173755e-07, "loss": 0.9382, "step": 47504 }, { "epoch": 0.9, "learning_rate": 1.3976597713518003e-07, "loss": 0.9949, "step": 47505 }, { "epoch": 0.9, "learning_rate": 1.397156181816639e-07, "loss": 1.2396, "step": 47506 }, { "epoch": 0.9, "learning_rate": 1.3966526804137737e-07, "loss": 1.0905, "step": 47507 }, { "epoch": 0.9, "learning_rate": 1.396149267145086e-07, "loss": 0.9378, "step": 47508 }, { "epoch": 0.9, "learning_rate": 1.3956459420124497e-07, "loss": 0.6891, "step": 47509 }, { "epoch": 0.9, "learning_rate": 1.3951427050177519e-07, "loss": 0.7249, "step": 47510 }, { "epoch": 0.9, "learning_rate": 1.3946395561628662e-07, "loss": 0.7833, "step": 47511 }, { "epoch": 0.9, "learning_rate": 1.3941364954496716e-07, "loss": 1.1567, "step": 47512 }, { "epoch": 0.9, "learning_rate": 1.3936335228800447e-07, "loss": 0.9499, "step": 47513 }, { "epoch": 0.9, "learning_rate": 1.3931306384558724e-07, "loss": 0.8839, "step": 47514 }, { "epoch": 0.9, "learning_rate": 1.392627842179023e-07, "loss": 0.9167, "step": 47515 }, { "epoch": 0.9, "learning_rate": 1.3921251340513781e-07, "loss": 0.8326, "step": 47516 }, { "epoch": 0.9, "learning_rate": 1.391622514074814e-07, "loss": 0.8471, "step": 47517 }, { "epoch": 0.9, "learning_rate": 1.3911199822512074e-07, "loss": 1.2786, "step": 47518 }, { "epoch": 0.9, "learning_rate": 1.3906175385824338e-07, "loss": 1.0513, "step": 47519 }, { "epoch": 0.9, "learning_rate": 1.390115183070373e-07, "loss": 0.762, "step": 47520 }, { "epoch": 0.9, "learning_rate": 1.389612915716898e-07, "loss": 0.9789, "step": 47521 }, { "epoch": 0.9, "learning_rate": 1.3891107365238797e-07, "loss": 0.826, "step": 47522 }, { "epoch": 0.9, "learning_rate": 1.3886086454932058e-07, "loss": 0.8441, "step": 47523 }, { "epoch": 0.9, "learning_rate": 1.3881066426267382e-07, "loss": 1.0183, "step": 47524 }, { "epoch": 0.9, "learning_rate": 1.3876047279263588e-07, "loss": 1.1498, "step": 47525 }, { "epoch": 0.9, "learning_rate": 1.387102901393936e-07, "loss": 0.7721, "step": 47526 }, { "epoch": 0.9, "learning_rate": 1.386601163031348e-07, "loss": 1.0516, "step": 47527 }, { "epoch": 0.9, "learning_rate": 1.3860995128404692e-07, "loss": 0.863, "step": 47528 }, { "epoch": 0.9, "learning_rate": 1.3855979508231698e-07, "loss": 0.8135, "step": 47529 }, { "epoch": 0.9, "learning_rate": 1.3850964769813263e-07, "loss": 0.9311, "step": 47530 }, { "epoch": 0.9, "learning_rate": 1.3845950913168012e-07, "loss": 0.9959, "step": 47531 }, { "epoch": 0.9, "learning_rate": 1.3840937938314842e-07, "loss": 0.9656, "step": 47532 }, { "epoch": 0.9, "learning_rate": 1.3835925845272297e-07, "loss": 0.8635, "step": 47533 }, { "epoch": 0.9, "learning_rate": 1.383091463405914e-07, "loss": 0.7973, "step": 47534 }, { "epoch": 0.9, "learning_rate": 1.3825904304694187e-07, "loss": 0.6922, "step": 47535 }, { "epoch": 0.9, "learning_rate": 1.382089485719601e-07, "loss": 0.6945, "step": 47536 }, { "epoch": 0.9, "learning_rate": 1.3815886291583398e-07, "loss": 1.0293, "step": 47537 }, { "epoch": 0.9, "learning_rate": 1.3810878607875e-07, "loss": 0.8746, "step": 47538 }, { "epoch": 0.9, "learning_rate": 1.3805871806089554e-07, "loss": 0.9704, "step": 47539 }, { "epoch": 0.9, "learning_rate": 1.380086588624574e-07, "loss": 0.8153, "step": 47540 }, { "epoch": 0.9, "learning_rate": 1.3795860848362236e-07, "loss": 0.762, "step": 47541 }, { "epoch": 0.9, "learning_rate": 1.3790856692457805e-07, "loss": 0.9194, "step": 47542 }, { "epoch": 0.9, "learning_rate": 1.3785853418550987e-07, "loss": 1.1366, "step": 47543 }, { "epoch": 0.9, "learning_rate": 1.37808510266606e-07, "loss": 1.0237, "step": 47544 }, { "epoch": 0.9, "learning_rate": 1.3775849516805274e-07, "loss": 0.9809, "step": 47545 }, { "epoch": 0.9, "learning_rate": 1.3770848889003652e-07, "loss": 1.0045, "step": 47546 }, { "epoch": 0.9, "learning_rate": 1.3765849143274475e-07, "loss": 1.144, "step": 47547 }, { "epoch": 0.9, "learning_rate": 1.3760850279636335e-07, "loss": 0.65, "step": 47548 }, { "epoch": 0.9, "learning_rate": 1.3755852298107968e-07, "loss": 0.9008, "step": 47549 }, { "epoch": 0.9, "learning_rate": 1.3750855198707974e-07, "loss": 1.105, "step": 47550 }, { "epoch": 0.9, "learning_rate": 1.3745858981455112e-07, "loss": 1.0453, "step": 47551 }, { "epoch": 0.9, "learning_rate": 1.3740863646367869e-07, "loss": 0.7208, "step": 47552 }, { "epoch": 0.9, "learning_rate": 1.373586919346509e-07, "loss": 0.7121, "step": 47553 }, { "epoch": 0.9, "learning_rate": 1.3730875622765288e-07, "loss": 0.8138, "step": 47554 }, { "epoch": 0.9, "learning_rate": 1.3725882934287117e-07, "loss": 0.797, "step": 47555 }, { "epoch": 0.9, "learning_rate": 1.3720891128049336e-07, "loss": 1.028, "step": 47556 }, { "epoch": 0.9, "learning_rate": 1.371590020407046e-07, "loss": 0.9212, "step": 47557 }, { "epoch": 0.9, "learning_rate": 1.3710910162369139e-07, "loss": 0.9227, "step": 47558 }, { "epoch": 0.9, "learning_rate": 1.3705921002964084e-07, "loss": 0.8103, "step": 47559 }, { "epoch": 0.9, "learning_rate": 1.3700932725873834e-07, "loss": 1.0101, "step": 47560 }, { "epoch": 0.9, "learning_rate": 1.3695945331117095e-07, "loss": 0.9646, "step": 47561 }, { "epoch": 0.9, "learning_rate": 1.3690958818712407e-07, "loss": 1.1685, "step": 47562 }, { "epoch": 0.9, "learning_rate": 1.3685973188678508e-07, "loss": 0.8893, "step": 47563 }, { "epoch": 0.9, "learning_rate": 1.3680988441033854e-07, "loss": 0.8601, "step": 47564 }, { "epoch": 0.9, "learning_rate": 1.3676004575797208e-07, "loss": 1.0018, "step": 47565 }, { "epoch": 0.9, "learning_rate": 1.3671021592987083e-07, "loss": 0.9317, "step": 47566 }, { "epoch": 0.9, "learning_rate": 1.36660394926221e-07, "loss": 1.0193, "step": 47567 }, { "epoch": 0.9, "learning_rate": 1.3661058274720919e-07, "loss": 1.0018, "step": 47568 }, { "epoch": 0.9, "learning_rate": 1.3656077939302071e-07, "loss": 1.0088, "step": 47569 }, { "epoch": 0.9, "learning_rate": 1.3651098486384183e-07, "loss": 0.87, "step": 47570 }, { "epoch": 0.9, "learning_rate": 1.3646119915985857e-07, "loss": 1.0, "step": 47571 }, { "epoch": 0.9, "learning_rate": 1.364114222812571e-07, "loss": 0.8725, "step": 47572 }, { "epoch": 0.9, "learning_rate": 1.3636165422822202e-07, "loss": 0.7476, "step": 47573 }, { "epoch": 0.9, "learning_rate": 1.3631189500094095e-07, "loss": 0.6967, "step": 47574 }, { "epoch": 0.9, "learning_rate": 1.3626214459959848e-07, "loss": 1.0635, "step": 47575 }, { "epoch": 0.9, "learning_rate": 1.3621240302438e-07, "loss": 0.8752, "step": 47576 }, { "epoch": 0.9, "learning_rate": 1.3616267027547287e-07, "loss": 0.8218, "step": 47577 }, { "epoch": 0.9, "learning_rate": 1.3611294635306166e-07, "loss": 0.886, "step": 47578 }, { "epoch": 0.9, "learning_rate": 1.3606323125733206e-07, "loss": 0.9361, "step": 47579 }, { "epoch": 0.9, "learning_rate": 1.3601352498846975e-07, "loss": 1.0149, "step": 47580 }, { "epoch": 0.9, "learning_rate": 1.359638275466607e-07, "loss": 0.9919, "step": 47581 }, { "epoch": 0.9, "learning_rate": 1.3591413893209004e-07, "loss": 1.0598, "step": 47582 }, { "epoch": 0.9, "learning_rate": 1.3586445914494372e-07, "loss": 0.894, "step": 47583 }, { "epoch": 0.9, "learning_rate": 1.3581478818540717e-07, "loss": 0.7435, "step": 47584 }, { "epoch": 0.9, "learning_rate": 1.3576512605366494e-07, "loss": 1.0279, "step": 47585 }, { "epoch": 0.9, "learning_rate": 1.357154727499041e-07, "loss": 0.9128, "step": 47586 }, { "epoch": 0.9, "learning_rate": 1.3566582827430898e-07, "loss": 0.9563, "step": 47587 }, { "epoch": 0.9, "learning_rate": 1.3561619262706495e-07, "loss": 0.8607, "step": 47588 }, { "epoch": 0.9, "learning_rate": 1.355665658083577e-07, "loss": 0.8891, "step": 47589 }, { "epoch": 0.9, "learning_rate": 1.355169478183721e-07, "loss": 0.9797, "step": 47590 }, { "epoch": 0.9, "learning_rate": 1.354673386572941e-07, "loss": 0.6678, "step": 47591 }, { "epoch": 0.9, "learning_rate": 1.354177383253083e-07, "loss": 0.9532, "step": 47592 }, { "epoch": 0.9, "learning_rate": 1.3536814682260062e-07, "loss": 1.055, "step": 47593 }, { "epoch": 0.9, "learning_rate": 1.3531856414935512e-07, "loss": 1.1567, "step": 47594 }, { "epoch": 0.9, "learning_rate": 1.352689903057583e-07, "loss": 0.9306, "step": 47595 }, { "epoch": 0.9, "learning_rate": 1.3521942529199417e-07, "loss": 0.8441, "step": 47596 }, { "epoch": 0.9, "learning_rate": 1.3516986910824786e-07, "loss": 1.0402, "step": 47597 }, { "epoch": 0.9, "learning_rate": 1.3512032175470536e-07, "loss": 0.8588, "step": 47598 }, { "epoch": 0.9, "learning_rate": 1.3507078323155066e-07, "loss": 1.0153, "step": 47599 }, { "epoch": 0.9, "learning_rate": 1.3502125353896944e-07, "loss": 0.7048, "step": 47600 }, { "epoch": 0.9, "learning_rate": 1.3497173267714602e-07, "loss": 1.0484, "step": 47601 }, { "epoch": 0.9, "learning_rate": 1.349222206462658e-07, "loss": 0.9164, "step": 47602 }, { "epoch": 0.9, "learning_rate": 1.3487271744651365e-07, "loss": 1.0637, "step": 47603 }, { "epoch": 0.9, "learning_rate": 1.348232230780741e-07, "loss": 0.6682, "step": 47604 }, { "epoch": 0.9, "learning_rate": 1.3477373754113233e-07, "loss": 0.7769, "step": 47605 }, { "epoch": 0.9, "learning_rate": 1.347242608358726e-07, "loss": 1.1812, "step": 47606 }, { "epoch": 0.9, "learning_rate": 1.3467479296248033e-07, "loss": 0.9867, "step": 47607 }, { "epoch": 0.9, "learning_rate": 1.3462533392113954e-07, "loss": 0.937, "step": 47608 }, { "epoch": 0.9, "learning_rate": 1.3457588371203535e-07, "loss": 0.9468, "step": 47609 }, { "epoch": 0.9, "learning_rate": 1.3452644233535206e-07, "loss": 0.6648, "step": 47610 }, { "epoch": 0.9, "learning_rate": 1.344770097912748e-07, "loss": 0.8668, "step": 47611 }, { "epoch": 0.9, "learning_rate": 1.3442758607998762e-07, "loss": 1.0289, "step": 47612 }, { "epoch": 0.9, "learning_rate": 1.3437817120167534e-07, "loss": 0.874, "step": 47613 }, { "epoch": 0.9, "learning_rate": 1.3432876515652283e-07, "loss": 0.8071, "step": 47614 }, { "epoch": 0.9, "learning_rate": 1.3427936794471352e-07, "loss": 0.9514, "step": 47615 }, { "epoch": 0.9, "learning_rate": 1.3422997956643312e-07, "loss": 0.9762, "step": 47616 }, { "epoch": 0.9, "learning_rate": 1.341806000218654e-07, "loss": 0.8772, "step": 47617 }, { "epoch": 0.9, "learning_rate": 1.3413122931119404e-07, "loss": 1.1407, "step": 47618 }, { "epoch": 0.9, "learning_rate": 1.3408186743460505e-07, "loss": 1.1821, "step": 47619 }, { "epoch": 0.9, "learning_rate": 1.3403251439228132e-07, "loss": 0.8307, "step": 47620 }, { "epoch": 0.9, "learning_rate": 1.339831701844077e-07, "loss": 0.9684, "step": 47621 }, { "epoch": 0.9, "learning_rate": 1.339338348111685e-07, "loss": 0.7849, "step": 47622 }, { "epoch": 0.9, "learning_rate": 1.3388450827274773e-07, "loss": 0.7536, "step": 47623 }, { "epoch": 0.9, "learning_rate": 1.338351905693297e-07, "loss": 0.9847, "step": 47624 }, { "epoch": 0.9, "learning_rate": 1.337858817010984e-07, "loss": 1.0648, "step": 47625 }, { "epoch": 0.9, "learning_rate": 1.3373658166823844e-07, "loss": 0.8845, "step": 47626 }, { "epoch": 0.9, "learning_rate": 1.3368729047093297e-07, "loss": 1.0684, "step": 47627 }, { "epoch": 0.9, "learning_rate": 1.3363800810936717e-07, "loss": 0.9562, "step": 47628 }, { "epoch": 0.9, "learning_rate": 1.3358873458372419e-07, "loss": 0.804, "step": 47629 }, { "epoch": 0.9, "learning_rate": 1.335394698941883e-07, "loss": 0.7536, "step": 47630 }, { "epoch": 0.9, "learning_rate": 1.3349021404094358e-07, "loss": 1.0035, "step": 47631 }, { "epoch": 0.9, "learning_rate": 1.3344096702417376e-07, "loss": 1.075, "step": 47632 }, { "epoch": 0.9, "learning_rate": 1.3339172884406283e-07, "loss": 0.9218, "step": 47633 }, { "epoch": 0.9, "learning_rate": 1.3334249950079453e-07, "loss": 0.8269, "step": 47634 }, { "epoch": 0.9, "learning_rate": 1.332932789945532e-07, "loss": 0.6674, "step": 47635 }, { "epoch": 0.9, "learning_rate": 1.332440673255214e-07, "loss": 0.7993, "step": 47636 }, { "epoch": 0.9, "learning_rate": 1.3319486449388464e-07, "loss": 1.1628, "step": 47637 }, { "epoch": 0.9, "learning_rate": 1.3314567049982518e-07, "loss": 0.9593, "step": 47638 }, { "epoch": 0.9, "learning_rate": 1.3309648534352681e-07, "loss": 0.837, "step": 47639 }, { "epoch": 0.9, "learning_rate": 1.3304730902517437e-07, "loss": 0.9606, "step": 47640 }, { "epoch": 0.9, "learning_rate": 1.3299814154495023e-07, "loss": 0.9144, "step": 47641 }, { "epoch": 0.9, "learning_rate": 1.3294898290303866e-07, "loss": 0.9138, "step": 47642 }, { "epoch": 0.9, "learning_rate": 1.3289983309962284e-07, "loss": 1.1283, "step": 47643 }, { "epoch": 0.9, "learning_rate": 1.3285069213488655e-07, "loss": 1.1804, "step": 47644 }, { "epoch": 0.9, "learning_rate": 1.3280156000901324e-07, "loss": 0.8768, "step": 47645 }, { "epoch": 0.9, "learning_rate": 1.3275243672218608e-07, "loss": 0.9566, "step": 47646 }, { "epoch": 0.9, "learning_rate": 1.3270332227458936e-07, "loss": 0.8579, "step": 47647 }, { "epoch": 0.9, "learning_rate": 1.3265421666640522e-07, "loss": 0.8606, "step": 47648 }, { "epoch": 0.9, "learning_rate": 1.3260511989781815e-07, "loss": 0.7923, "step": 47649 }, { "epoch": 0.9, "learning_rate": 1.3255603196901055e-07, "loss": 1.0546, "step": 47650 }, { "epoch": 0.9, "learning_rate": 1.325069528801662e-07, "loss": 0.9309, "step": 47651 }, { "epoch": 0.9, "learning_rate": 1.3245788263146846e-07, "loss": 0.8053, "step": 47652 }, { "epoch": 0.9, "learning_rate": 1.3240882122310034e-07, "loss": 0.8256, "step": 47653 }, { "epoch": 0.9, "learning_rate": 1.3235976865524498e-07, "loss": 0.7183, "step": 47654 }, { "epoch": 0.9, "learning_rate": 1.3231072492808583e-07, "loss": 1.1516, "step": 47655 }, { "epoch": 0.9, "learning_rate": 1.3226169004180612e-07, "loss": 0.936, "step": 47656 }, { "epoch": 0.9, "learning_rate": 1.3221266399658788e-07, "loss": 0.8837, "step": 47657 }, { "epoch": 0.9, "learning_rate": 1.3216364679261572e-07, "loss": 0.9814, "step": 47658 }, { "epoch": 0.9, "learning_rate": 1.3211463843007145e-07, "loss": 1.0747, "step": 47659 }, { "epoch": 0.9, "learning_rate": 1.320656389091382e-07, "loss": 0.7584, "step": 47660 }, { "epoch": 0.9, "learning_rate": 1.3201664823000005e-07, "loss": 0.8668, "step": 47661 }, { "epoch": 0.9, "learning_rate": 1.3196766639283875e-07, "loss": 1.0673, "step": 47662 }, { "epoch": 0.9, "learning_rate": 1.3191869339783753e-07, "loss": 0.8538, "step": 47663 }, { "epoch": 0.9, "learning_rate": 1.3186972924517927e-07, "loss": 0.7105, "step": 47664 }, { "epoch": 0.9, "learning_rate": 1.318207739350469e-07, "loss": 0.9596, "step": 47665 }, { "epoch": 0.9, "learning_rate": 1.3177182746762328e-07, "loss": 0.7864, "step": 47666 }, { "epoch": 0.9, "learning_rate": 1.3172288984309084e-07, "loss": 0.83, "step": 47667 }, { "epoch": 0.9, "learning_rate": 1.3167396106163299e-07, "loss": 0.9415, "step": 47668 }, { "epoch": 0.9, "learning_rate": 1.3162504112343126e-07, "loss": 1.118, "step": 47669 }, { "epoch": 0.9, "learning_rate": 1.3157613002866943e-07, "loss": 0.748, "step": 47670 }, { "epoch": 0.9, "learning_rate": 1.315272277775298e-07, "loss": 0.8724, "step": 47671 }, { "epoch": 0.9, "learning_rate": 1.3147833437019448e-07, "loss": 1.0429, "step": 47672 }, { "epoch": 0.9, "learning_rate": 1.3142944980684663e-07, "loss": 0.7796, "step": 47673 }, { "epoch": 0.9, "learning_rate": 1.3138057408766864e-07, "loss": 1.0872, "step": 47674 }, { "epoch": 0.9, "learning_rate": 1.3133170721284283e-07, "loss": 0.9241, "step": 47675 }, { "epoch": 0.9, "learning_rate": 1.3128284918255186e-07, "loss": 0.7608, "step": 47676 }, { "epoch": 0.9, "learning_rate": 1.312339999969786e-07, "loss": 0.9972, "step": 47677 }, { "epoch": 0.9, "learning_rate": 1.3118515965630406e-07, "loss": 1.0417, "step": 47678 }, { "epoch": 0.9, "learning_rate": 1.3113632816071226e-07, "loss": 0.8397, "step": 47679 }, { "epoch": 0.9, "learning_rate": 1.310875055103844e-07, "loss": 0.922, "step": 47680 }, { "epoch": 0.9, "learning_rate": 1.3103869170550288e-07, "loss": 0.7885, "step": 47681 }, { "epoch": 0.9, "learning_rate": 1.3098988674625113e-07, "loss": 1.0624, "step": 47682 }, { "epoch": 0.9, "learning_rate": 1.3094109063280986e-07, "loss": 0.9364, "step": 47683 }, { "epoch": 0.9, "learning_rate": 1.3089230336536196e-07, "loss": 1.027, "step": 47684 }, { "epoch": 0.9, "learning_rate": 1.3084352494408982e-07, "loss": 0.9457, "step": 47685 }, { "epoch": 0.9, "learning_rate": 1.307947553691749e-07, "loss": 0.9678, "step": 47686 }, { "epoch": 0.9, "learning_rate": 1.307459946407999e-07, "loss": 1.1401, "step": 47687 }, { "epoch": 0.9, "learning_rate": 1.3069724275914685e-07, "loss": 1.0452, "step": 47688 }, { "epoch": 0.9, "learning_rate": 1.3064849972439785e-07, "loss": 0.9012, "step": 47689 }, { "epoch": 0.9, "learning_rate": 1.3059976553673414e-07, "loss": 0.837, "step": 47690 }, { "epoch": 0.9, "learning_rate": 1.305510401963389e-07, "loss": 0.898, "step": 47691 }, { "epoch": 0.9, "learning_rate": 1.3050232370339312e-07, "loss": 0.851, "step": 47692 }, { "epoch": 0.9, "learning_rate": 1.3045361605807882e-07, "loss": 1.0188, "step": 47693 }, { "epoch": 0.9, "learning_rate": 1.3040491726057814e-07, "loss": 0.9689, "step": 47694 }, { "epoch": 0.9, "learning_rate": 1.3035622731107312e-07, "loss": 0.8531, "step": 47695 }, { "epoch": 0.9, "learning_rate": 1.30307546209745e-07, "loss": 0.9585, "step": 47696 }, { "epoch": 0.9, "learning_rate": 1.3025887395677588e-07, "loss": 0.9475, "step": 47697 }, { "epoch": 0.9, "learning_rate": 1.3021021055234785e-07, "loss": 0.7557, "step": 47698 }, { "epoch": 0.9, "learning_rate": 1.3016155599664154e-07, "loss": 0.8465, "step": 47699 }, { "epoch": 0.9, "learning_rate": 1.3011291028983992e-07, "loss": 0.9314, "step": 47700 }, { "epoch": 0.9, "learning_rate": 1.3006427343212392e-07, "loss": 0.9409, "step": 47701 }, { "epoch": 0.9, "learning_rate": 1.300156454236748e-07, "loss": 0.7475, "step": 47702 }, { "epoch": 0.9, "learning_rate": 1.2996702626467517e-07, "loss": 0.8457, "step": 47703 }, { "epoch": 0.9, "learning_rate": 1.2991841595530574e-07, "loss": 0.9615, "step": 47704 }, { "epoch": 0.9, "learning_rate": 1.2986981449574832e-07, "loss": 0.7759, "step": 47705 }, { "epoch": 0.9, "learning_rate": 1.2982122188618412e-07, "loss": 0.9517, "step": 47706 }, { "epoch": 0.9, "learning_rate": 1.2977263812679524e-07, "loss": 0.8965, "step": 47707 }, { "epoch": 0.9, "learning_rate": 1.2972406321776237e-07, "loss": 0.8723, "step": 47708 }, { "epoch": 0.9, "learning_rate": 1.2967549715926703e-07, "loss": 0.9491, "step": 47709 }, { "epoch": 0.9, "learning_rate": 1.296269399514913e-07, "loss": 0.8948, "step": 47710 }, { "epoch": 0.9, "learning_rate": 1.2957839159461526e-07, "loss": 0.8112, "step": 47711 }, { "epoch": 0.9, "learning_rate": 1.2952985208882135e-07, "loss": 1.0044, "step": 47712 }, { "epoch": 0.9, "learning_rate": 1.2948132143428993e-07, "loss": 1.0198, "step": 47713 }, { "epoch": 0.9, "learning_rate": 1.2943279963120252e-07, "loss": 0.8368, "step": 47714 }, { "epoch": 0.9, "learning_rate": 1.2938428667974068e-07, "loss": 0.9774, "step": 47715 }, { "epoch": 0.9, "learning_rate": 1.2933578258008505e-07, "loss": 0.7864, "step": 47716 }, { "epoch": 0.9, "learning_rate": 1.2928728733241664e-07, "loss": 1.0359, "step": 47717 }, { "epoch": 0.9, "learning_rate": 1.292388009369172e-07, "loss": 0.9871, "step": 47718 }, { "epoch": 0.9, "learning_rate": 1.2919032339376747e-07, "loss": 1.2524, "step": 47719 }, { "epoch": 0.9, "learning_rate": 1.2914185470314784e-07, "loss": 0.9113, "step": 47720 }, { "epoch": 0.9, "learning_rate": 1.2909339486524064e-07, "loss": 0.8972, "step": 47721 }, { "epoch": 0.9, "learning_rate": 1.2904494388022548e-07, "loss": 0.8775, "step": 47722 }, { "epoch": 0.9, "learning_rate": 1.2899650174828359e-07, "loss": 0.8443, "step": 47723 }, { "epoch": 0.9, "learning_rate": 1.289480684695965e-07, "loss": 0.8173, "step": 47724 }, { "epoch": 0.9, "learning_rate": 1.2889964404434464e-07, "loss": 1.1691, "step": 47725 }, { "epoch": 0.9, "learning_rate": 1.2885122847270836e-07, "loss": 0.9187, "step": 47726 }, { "epoch": 0.9, "learning_rate": 1.2880282175486926e-07, "loss": 0.8394, "step": 47727 }, { "epoch": 0.9, "learning_rate": 1.2875442389100768e-07, "loss": 0.7604, "step": 47728 }, { "epoch": 0.9, "learning_rate": 1.2870603488130436e-07, "loss": 0.7824, "step": 47729 }, { "epoch": 0.9, "learning_rate": 1.2865765472593993e-07, "loss": 0.9964, "step": 47730 }, { "epoch": 0.9, "learning_rate": 1.2860928342509543e-07, "loss": 1.1407, "step": 47731 }, { "epoch": 0.9, "learning_rate": 1.285609209789504e-07, "loss": 0.9249, "step": 47732 }, { "epoch": 0.9, "learning_rate": 1.2851256738768693e-07, "loss": 0.7902, "step": 47733 }, { "epoch": 0.9, "learning_rate": 1.2846422265148455e-07, "loss": 0.9138, "step": 47734 }, { "epoch": 0.9, "learning_rate": 1.2841588677052402e-07, "loss": 0.8056, "step": 47735 }, { "epoch": 0.9, "learning_rate": 1.2836755974498598e-07, "loss": 1.0331, "step": 47736 }, { "epoch": 0.9, "learning_rate": 1.283192415750506e-07, "loss": 1.0698, "step": 47737 }, { "epoch": 0.9, "learning_rate": 1.2827093226089855e-07, "loss": 0.9316, "step": 47738 }, { "epoch": 0.9, "learning_rate": 1.2822263180270994e-07, "loss": 0.7982, "step": 47739 }, { "epoch": 0.9, "learning_rate": 1.2817434020066577e-07, "loss": 0.7941, "step": 47740 }, { "epoch": 0.9, "learning_rate": 1.2812605745494533e-07, "loss": 0.7542, "step": 47741 }, { "epoch": 0.9, "learning_rate": 1.2807778356573015e-07, "loss": 0.9659, "step": 47742 }, { "epoch": 0.9, "learning_rate": 1.2802951853319923e-07, "loss": 1.0299, "step": 47743 }, { "epoch": 0.9, "learning_rate": 1.27981262357533e-07, "loss": 0.9139, "step": 47744 }, { "epoch": 0.9, "learning_rate": 1.2793301503891297e-07, "loss": 0.951, "step": 47745 }, { "epoch": 0.9, "learning_rate": 1.278847765775179e-07, "loss": 0.8624, "step": 47746 }, { "epoch": 0.9, "learning_rate": 1.2783654697352848e-07, "loss": 0.9547, "step": 47747 }, { "epoch": 0.9, "learning_rate": 1.2778832622712429e-07, "loss": 0.8931, "step": 47748 }, { "epoch": 0.9, "learning_rate": 1.2774011433848572e-07, "loss": 0.8834, "step": 47749 }, { "epoch": 0.9, "learning_rate": 1.2769191130779345e-07, "loss": 0.9908, "step": 47750 }, { "epoch": 0.9, "learning_rate": 1.2764371713522598e-07, "loss": 0.7824, "step": 47751 }, { "epoch": 0.9, "learning_rate": 1.2759553182096513e-07, "loss": 0.9504, "step": 47752 }, { "epoch": 0.9, "learning_rate": 1.275473553651893e-07, "loss": 0.9391, "step": 47753 }, { "epoch": 0.9, "learning_rate": 1.274991877680787e-07, "loss": 0.9228, "step": 47754 }, { "epoch": 0.9, "learning_rate": 1.2745102902981365e-07, "loss": 0.783, "step": 47755 }, { "epoch": 0.9, "learning_rate": 1.2740287915057353e-07, "loss": 0.9807, "step": 47756 }, { "epoch": 0.9, "learning_rate": 1.2735473813053844e-07, "loss": 0.8952, "step": 47757 }, { "epoch": 0.9, "learning_rate": 1.2730660596988826e-07, "loss": 0.8272, "step": 47758 }, { "epoch": 0.9, "learning_rate": 1.2725848266880254e-07, "loss": 0.8549, "step": 47759 }, { "epoch": 0.9, "learning_rate": 1.2721036822746003e-07, "loss": 0.6797, "step": 47760 }, { "epoch": 0.9, "learning_rate": 1.2716226264604225e-07, "loss": 1.0311, "step": 47761 }, { "epoch": 0.9, "learning_rate": 1.2711416592472741e-07, "loss": 1.1985, "step": 47762 }, { "epoch": 0.9, "learning_rate": 1.2706607806369537e-07, "loss": 0.9257, "step": 47763 }, { "epoch": 0.9, "learning_rate": 1.2701799906312595e-07, "loss": 0.8597, "step": 47764 }, { "epoch": 0.9, "learning_rate": 1.2696992892319848e-07, "loss": 0.8549, "step": 47765 }, { "epoch": 0.9, "learning_rate": 1.2692186764409253e-07, "loss": 0.8685, "step": 47766 }, { "epoch": 0.9, "learning_rate": 1.268738152259877e-07, "loss": 0.7052, "step": 47767 }, { "epoch": 0.9, "learning_rate": 1.268257716690635e-07, "loss": 1.0081, "step": 47768 }, { "epoch": 0.9, "learning_rate": 1.2677773697349877e-07, "loss": 0.988, "step": 47769 }, { "epoch": 0.9, "learning_rate": 1.26729711139473e-07, "loss": 0.9319, "step": 47770 }, { "epoch": 0.9, "learning_rate": 1.2668169416716642e-07, "loss": 1.0262, "step": 47771 }, { "epoch": 0.9, "learning_rate": 1.2663368605675687e-07, "loss": 0.715, "step": 47772 }, { "epoch": 0.9, "learning_rate": 1.2658568680842505e-07, "loss": 0.7017, "step": 47773 }, { "epoch": 0.9, "learning_rate": 1.2653769642234913e-07, "loss": 0.9664, "step": 47774 }, { "epoch": 0.9, "learning_rate": 1.2648971489870877e-07, "loss": 1.1641, "step": 47775 }, { "epoch": 0.9, "learning_rate": 1.264417422376829e-07, "loss": 0.9388, "step": 47776 }, { "epoch": 0.9, "learning_rate": 1.2639377843945089e-07, "loss": 0.9624, "step": 47777 }, { "epoch": 0.9, "learning_rate": 1.2634582350419173e-07, "loss": 1.0375, "step": 47778 }, { "epoch": 0.9, "learning_rate": 1.2629787743208444e-07, "loss": 0.9421, "step": 47779 }, { "epoch": 0.9, "learning_rate": 1.2624994022330862e-07, "loss": 0.8134, "step": 47780 }, { "epoch": 0.9, "learning_rate": 1.2620201187804186e-07, "loss": 1.0025, "step": 47781 }, { "epoch": 0.9, "learning_rate": 1.2615409239646465e-07, "loss": 0.761, "step": 47782 }, { "epoch": 0.9, "learning_rate": 1.261061817787551e-07, "loss": 0.9591, "step": 47783 }, { "epoch": 0.9, "learning_rate": 1.2605828002509201e-07, "loss": 0.9008, "step": 47784 }, { "epoch": 0.9, "learning_rate": 1.2601038713565466e-07, "loss": 0.8564, "step": 47785 }, { "epoch": 0.9, "learning_rate": 1.259625031106218e-07, "loss": 0.8982, "step": 47786 }, { "epoch": 0.9, "learning_rate": 1.2591462795017218e-07, "loss": 1.0527, "step": 47787 }, { "epoch": 0.9, "learning_rate": 1.2586676165448452e-07, "loss": 1.0905, "step": 47788 }, { "epoch": 0.9, "learning_rate": 1.2581890422373787e-07, "loss": 0.8427, "step": 47789 }, { "epoch": 0.9, "learning_rate": 1.2577105565811015e-07, "loss": 0.9338, "step": 47790 }, { "epoch": 0.9, "learning_rate": 1.2572321595778063e-07, "loss": 0.873, "step": 47791 }, { "epoch": 0.9, "learning_rate": 1.2567538512292837e-07, "loss": 0.7134, "step": 47792 }, { "epoch": 0.9, "learning_rate": 1.256275631537304e-07, "loss": 1.033, "step": 47793 }, { "epoch": 0.9, "learning_rate": 1.255797500503672e-07, "loss": 0.962, "step": 47794 }, { "epoch": 0.9, "learning_rate": 1.2553194581301608e-07, "loss": 1.0287, "step": 47795 }, { "epoch": 0.9, "learning_rate": 1.254841504418558e-07, "loss": 0.8365, "step": 47796 }, { "epoch": 0.9, "learning_rate": 1.254363639370651e-07, "loss": 0.9046, "step": 47797 }, { "epoch": 0.9, "learning_rate": 1.2538858629882218e-07, "loss": 0.9796, "step": 47798 }, { "epoch": 0.9, "learning_rate": 1.253408175273052e-07, "loss": 0.9344, "step": 47799 }, { "epoch": 0.9, "learning_rate": 1.2529305762269294e-07, "loss": 1.0828, "step": 47800 }, { "epoch": 0.9, "learning_rate": 1.2524530658516388e-07, "loss": 0.8179, "step": 47801 }, { "epoch": 0.9, "learning_rate": 1.2519756441489562e-07, "loss": 0.886, "step": 47802 }, { "epoch": 0.9, "learning_rate": 1.251498311120672e-07, "loss": 0.6463, "step": 47803 }, { "epoch": 0.9, "learning_rate": 1.2510210667685624e-07, "loss": 0.7576, "step": 47804 }, { "epoch": 0.9, "learning_rate": 1.2505439110944123e-07, "loss": 0.9565, "step": 47805 }, { "epoch": 0.9, "learning_rate": 1.2500668441000036e-07, "loss": 1.0664, "step": 47806 }, { "epoch": 0.9, "learning_rate": 1.249589865787118e-07, "loss": 1.1221, "step": 47807 }, { "epoch": 0.9, "learning_rate": 1.2491129761575348e-07, "loss": 0.8106, "step": 47808 }, { "epoch": 0.9, "learning_rate": 1.2486361752130332e-07, "loss": 0.8129, "step": 47809 }, { "epoch": 0.9, "learning_rate": 1.2481594629554034e-07, "loss": 0.8255, "step": 47810 }, { "epoch": 0.9, "learning_rate": 1.2476828393864077e-07, "loss": 0.7274, "step": 47811 }, { "epoch": 0.9, "learning_rate": 1.2472063045078392e-07, "loss": 0.9756, "step": 47812 }, { "epoch": 0.9, "learning_rate": 1.2467298583214798e-07, "loss": 0.9773, "step": 47813 }, { "epoch": 0.9, "learning_rate": 1.2462535008290948e-07, "loss": 0.7428, "step": 47814 }, { "epoch": 0.9, "learning_rate": 1.2457772320324775e-07, "loss": 0.8471, "step": 47815 }, { "epoch": 0.9, "learning_rate": 1.245301051933398e-07, "loss": 1.0265, "step": 47816 }, { "epoch": 0.9, "learning_rate": 1.244824960533636e-07, "loss": 0.8565, "step": 47817 }, { "epoch": 0.9, "learning_rate": 1.2443489578349677e-07, "loss": 1.0551, "step": 47818 }, { "epoch": 0.9, "learning_rate": 1.243873043839172e-07, "loss": 1.1605, "step": 47819 }, { "epoch": 0.9, "learning_rate": 1.2433972185480258e-07, "loss": 0.6844, "step": 47820 }, { "epoch": 0.9, "learning_rate": 1.242921481963308e-07, "loss": 0.7697, "step": 47821 }, { "epoch": 0.9, "learning_rate": 1.2424458340867946e-07, "loss": 0.8521, "step": 47822 }, { "epoch": 0.9, "learning_rate": 1.241970274920254e-07, "loss": 0.6817, "step": 47823 }, { "epoch": 0.9, "learning_rate": 1.2414948044654736e-07, "loss": 0.7289, "step": 47824 }, { "epoch": 0.9, "learning_rate": 1.241019422724221e-07, "loss": 1.1923, "step": 47825 }, { "epoch": 0.9, "learning_rate": 1.2405441296982707e-07, "loss": 0.9551, "step": 47826 }, { "epoch": 0.9, "learning_rate": 1.240068925389404e-07, "loss": 0.8694, "step": 47827 }, { "epoch": 0.9, "learning_rate": 1.2395938097993888e-07, "loss": 0.7719, "step": 47828 }, { "epoch": 0.9, "learning_rate": 1.2391187829300043e-07, "loss": 0.7434, "step": 47829 }, { "epoch": 0.9, "learning_rate": 1.238643844783019e-07, "loss": 0.8091, "step": 47830 }, { "epoch": 0.9, "learning_rate": 1.2381689953602143e-07, "loss": 1.0897, "step": 47831 }, { "epoch": 0.9, "learning_rate": 1.2376942346633502e-07, "loss": 0.7001, "step": 47832 }, { "epoch": 0.9, "learning_rate": 1.2372195626942112e-07, "loss": 0.7458, "step": 47833 }, { "epoch": 0.9, "learning_rate": 1.2367449794545683e-07, "loss": 0.9824, "step": 47834 }, { "epoch": 0.9, "learning_rate": 1.2362704849461866e-07, "loss": 0.8972, "step": 47835 }, { "epoch": 0.9, "learning_rate": 1.235796079170845e-07, "loss": 1.0307, "step": 47836 }, { "epoch": 0.9, "learning_rate": 1.235321762130312e-07, "loss": 1.073, "step": 47837 }, { "epoch": 0.9, "learning_rate": 1.2348475338263583e-07, "loss": 0.9811, "step": 47838 }, { "epoch": 0.9, "learning_rate": 1.2343733942607545e-07, "loss": 0.84, "step": 47839 }, { "epoch": 0.9, "learning_rate": 1.2338993434352741e-07, "loss": 1.0448, "step": 47840 }, { "epoch": 0.9, "learning_rate": 1.2334253813516829e-07, "loss": 0.8254, "step": 47841 }, { "epoch": 0.9, "learning_rate": 1.2329515080117539e-07, "loss": 0.8848, "step": 47842 }, { "epoch": 0.9, "learning_rate": 1.2324777234172553e-07, "loss": 0.955, "step": 47843 }, { "epoch": 0.9, "learning_rate": 1.2320040275699524e-07, "loss": 1.0189, "step": 47844 }, { "epoch": 0.9, "learning_rate": 1.2315304204716244e-07, "loss": 0.8254, "step": 47845 }, { "epoch": 0.9, "learning_rate": 1.231056902124028e-07, "loss": 0.9067, "step": 47846 }, { "epoch": 0.9, "learning_rate": 1.2305834725289373e-07, "loss": 0.8861, "step": 47847 }, { "epoch": 0.9, "learning_rate": 1.2301101316881198e-07, "loss": 0.8315, "step": 47848 }, { "epoch": 0.9, "learning_rate": 1.2296368796033437e-07, "loss": 0.8823, "step": 47849 }, { "epoch": 0.9, "learning_rate": 1.2291637162763716e-07, "loss": 1.2076, "step": 47850 }, { "epoch": 0.9, "learning_rate": 1.228690641708974e-07, "loss": 0.9377, "step": 47851 }, { "epoch": 0.9, "learning_rate": 1.2282176559029219e-07, "loss": 0.984, "step": 47852 }, { "epoch": 0.9, "learning_rate": 1.2277447588599666e-07, "loss": 0.7614, "step": 47853 }, { "epoch": 0.9, "learning_rate": 1.2272719505818876e-07, "loss": 0.7913, "step": 47854 }, { "epoch": 0.9, "learning_rate": 1.2267992310704524e-07, "loss": 0.9663, "step": 47855 }, { "epoch": 0.9, "learning_rate": 1.22632660032741e-07, "loss": 0.884, "step": 47856 }, { "epoch": 0.9, "learning_rate": 1.2258540583545448e-07, "loss": 0.8356, "step": 47857 }, { "epoch": 0.9, "learning_rate": 1.2253816051536055e-07, "loss": 0.8238, "step": 47858 }, { "epoch": 0.9, "learning_rate": 1.224909240726363e-07, "loss": 0.7624, "step": 47859 }, { "epoch": 0.9, "learning_rate": 1.2244369650745825e-07, "loss": 0.7337, "step": 47860 }, { "epoch": 0.9, "learning_rate": 1.2239647782000237e-07, "loss": 0.7991, "step": 47861 }, { "epoch": 0.9, "learning_rate": 1.223492680104449e-07, "loss": 0.889, "step": 47862 }, { "epoch": 0.9, "learning_rate": 1.2230206707896265e-07, "loss": 0.9976, "step": 47863 }, { "epoch": 0.9, "learning_rate": 1.2225487502573186e-07, "loss": 0.7435, "step": 47864 }, { "epoch": 0.9, "learning_rate": 1.2220769185092794e-07, "loss": 0.7067, "step": 47865 }, { "epoch": 0.9, "learning_rate": 1.2216051755472802e-07, "loss": 0.8248, "step": 47866 }, { "epoch": 0.9, "learning_rate": 1.2211335213730773e-07, "loss": 0.6921, "step": 47867 }, { "epoch": 0.9, "learning_rate": 1.2206619559884308e-07, "loss": 1.2856, "step": 47868 }, { "epoch": 0.9, "learning_rate": 1.220190479395103e-07, "loss": 1.0348, "step": 47869 }, { "epoch": 0.9, "learning_rate": 1.2197190915948565e-07, "loss": 0.8289, "step": 47870 }, { "epoch": 0.9, "learning_rate": 1.2192477925894509e-07, "loss": 0.877, "step": 47871 }, { "epoch": 0.9, "learning_rate": 1.218776582380643e-07, "loss": 0.7798, "step": 47872 }, { "epoch": 0.9, "learning_rate": 1.2183054609701984e-07, "loss": 0.7351, "step": 47873 }, { "epoch": 0.9, "learning_rate": 1.2178344283598625e-07, "loss": 1.1701, "step": 47874 }, { "epoch": 0.9, "learning_rate": 1.2173634845514092e-07, "loss": 1.0853, "step": 47875 }, { "epoch": 0.9, "learning_rate": 1.2168926295465954e-07, "loss": 0.8413, "step": 47876 }, { "epoch": 0.9, "learning_rate": 1.2164218633471697e-07, "loss": 0.7819, "step": 47877 }, { "epoch": 0.9, "learning_rate": 1.2159511859549e-07, "loss": 0.9781, "step": 47878 }, { "epoch": 0.9, "learning_rate": 1.215480597371535e-07, "loss": 0.9253, "step": 47879 }, { "epoch": 0.9, "learning_rate": 1.2150100975988398e-07, "loss": 0.886, "step": 47880 }, { "epoch": 0.9, "learning_rate": 1.2145396866385634e-07, "loss": 1.0847, "step": 47881 }, { "epoch": 0.9, "learning_rate": 1.2140693644924706e-07, "loss": 0.9467, "step": 47882 }, { "epoch": 0.9, "learning_rate": 1.2135991311623102e-07, "loss": 0.7496, "step": 47883 }, { "epoch": 0.9, "learning_rate": 1.2131289866498447e-07, "loss": 0.9182, "step": 47884 }, { "epoch": 0.9, "learning_rate": 1.2126589309568283e-07, "loss": 0.7764, "step": 47885 }, { "epoch": 0.9, "learning_rate": 1.2121889640850066e-07, "loss": 0.9662, "step": 47886 }, { "epoch": 0.9, "learning_rate": 1.2117190860361477e-07, "loss": 0.9813, "step": 47887 }, { "epoch": 0.9, "learning_rate": 1.2112492968119975e-07, "loss": 1.0661, "step": 47888 }, { "epoch": 0.9, "learning_rate": 1.2107795964143132e-07, "loss": 0.7709, "step": 47889 }, { "epoch": 0.9, "learning_rate": 1.2103099848448512e-07, "loss": 0.8973, "step": 47890 }, { "epoch": 0.9, "learning_rate": 1.2098404621053605e-07, "loss": 0.7536, "step": 47891 }, { "epoch": 0.9, "learning_rate": 1.209371028197595e-07, "loss": 0.8838, "step": 47892 }, { "epoch": 0.9, "learning_rate": 1.2089016831233093e-07, "loss": 1.1216, "step": 47893 }, { "epoch": 0.9, "learning_rate": 1.2084324268842595e-07, "loss": 0.8236, "step": 47894 }, { "epoch": 0.9, "learning_rate": 1.207963259482184e-07, "loss": 0.9042, "step": 47895 }, { "epoch": 0.9, "learning_rate": 1.20749418091885e-07, "loss": 0.7341, "step": 47896 }, { "epoch": 0.9, "learning_rate": 1.2070251911960068e-07, "loss": 0.7119, "step": 47897 }, { "epoch": 0.9, "learning_rate": 1.2065562903153943e-07, "loss": 0.7653, "step": 47898 }, { "epoch": 0.9, "learning_rate": 1.206087478278778e-07, "loss": 0.8229, "step": 47899 }, { "epoch": 0.9, "learning_rate": 1.2056187550878978e-07, "loss": 1.1957, "step": 47900 }, { "epoch": 0.9, "learning_rate": 1.2051501207445082e-07, "loss": 0.8341, "step": 47901 }, { "epoch": 0.9, "learning_rate": 1.2046815752503605e-07, "loss": 0.8077, "step": 47902 }, { "epoch": 0.9, "learning_rate": 1.2042131186072003e-07, "loss": 0.7909, "step": 47903 }, { "epoch": 0.9, "learning_rate": 1.2037447508167766e-07, "loss": 0.8247, "step": 47904 }, { "epoch": 0.9, "learning_rate": 1.203276471880843e-07, "loss": 0.9177, "step": 47905 }, { "epoch": 0.9, "learning_rate": 1.202808281801149e-07, "loss": 0.9727, "step": 47906 }, { "epoch": 0.9, "learning_rate": 1.202340180579431e-07, "loss": 0.8629, "step": 47907 }, { "epoch": 0.9, "learning_rate": 1.2018721682174523e-07, "loss": 0.8909, "step": 47908 }, { "epoch": 0.9, "learning_rate": 1.2014042447169498e-07, "loss": 0.8035, "step": 47909 }, { "epoch": 0.9, "learning_rate": 1.2009364100796755e-07, "loss": 0.8058, "step": 47910 }, { "epoch": 0.9, "learning_rate": 1.200468664307375e-07, "loss": 0.7608, "step": 47911 }, { "epoch": 0.9, "learning_rate": 1.2000010074017938e-07, "loss": 0.9528, "step": 47912 }, { "epoch": 0.9, "learning_rate": 1.1995334393646778e-07, "loss": 0.8336, "step": 47913 }, { "epoch": 0.9, "learning_rate": 1.1990659601977762e-07, "loss": 0.9719, "step": 47914 }, { "epoch": 0.9, "learning_rate": 1.1985985699028342e-07, "loss": 0.8373, "step": 47915 }, { "epoch": 0.9, "learning_rate": 1.1981312684815894e-07, "loss": 0.7396, "step": 47916 }, { "epoch": 0.9, "learning_rate": 1.197664055935796e-07, "loss": 0.8216, "step": 47917 }, { "epoch": 0.9, "learning_rate": 1.1971969322672e-07, "loss": 0.8374, "step": 47918 }, { "epoch": 0.9, "learning_rate": 1.1967298974775333e-07, "loss": 1.0486, "step": 47919 }, { "epoch": 0.9, "learning_rate": 1.1962629515685526e-07, "loss": 0.8533, "step": 47920 }, { "epoch": 0.9, "learning_rate": 1.1957960945419955e-07, "loss": 1.0474, "step": 47921 }, { "epoch": 0.9, "learning_rate": 1.1953293263996024e-07, "loss": 0.8667, "step": 47922 }, { "epoch": 0.9, "learning_rate": 1.194862647143122e-07, "loss": 0.7433, "step": 47923 }, { "epoch": 0.9, "learning_rate": 1.194396056774294e-07, "loss": 0.9407, "step": 47924 }, { "epoch": 0.9, "learning_rate": 1.193929555294862e-07, "loss": 1.1719, "step": 47925 }, { "epoch": 0.9, "learning_rate": 1.1934631427065664e-07, "loss": 0.8212, "step": 47926 }, { "epoch": 0.9, "learning_rate": 1.1929968190111552e-07, "loss": 0.7979, "step": 47927 }, { "epoch": 0.9, "learning_rate": 1.1925305842103553e-07, "loss": 0.8408, "step": 47928 }, { "epoch": 0.9, "learning_rate": 1.1920644383059205e-07, "loss": 0.7799, "step": 47929 }, { "epoch": 0.9, "learning_rate": 1.1915983812995885e-07, "loss": 0.8322, "step": 47930 }, { "epoch": 0.9, "learning_rate": 1.191132413193094e-07, "loss": 0.8365, "step": 47931 }, { "epoch": 0.9, "learning_rate": 1.1906665339881829e-07, "loss": 0.8904, "step": 47932 }, { "epoch": 0.9, "learning_rate": 1.1902007436865925e-07, "loss": 0.8142, "step": 47933 }, { "epoch": 0.9, "learning_rate": 1.1897350422900633e-07, "loss": 0.9316, "step": 47934 }, { "epoch": 0.9, "learning_rate": 1.1892694298003327e-07, "loss": 0.868, "step": 47935 }, { "epoch": 0.9, "learning_rate": 1.1888039062191437e-07, "loss": 0.6324, "step": 47936 }, { "epoch": 0.9, "learning_rate": 1.1883384715482254e-07, "loss": 1.1022, "step": 47937 }, { "epoch": 0.9, "learning_rate": 1.1878731257893239e-07, "loss": 1.0867, "step": 47938 }, { "epoch": 0.9, "learning_rate": 1.1874078689441765e-07, "loss": 0.8314, "step": 47939 }, { "epoch": 0.9, "learning_rate": 1.1869427010145095e-07, "loss": 0.8596, "step": 47940 }, { "epoch": 0.9, "learning_rate": 1.1864776220020774e-07, "loss": 0.787, "step": 47941 }, { "epoch": 0.9, "learning_rate": 1.1860126319086035e-07, "loss": 0.8351, "step": 47942 }, { "epoch": 0.9, "learning_rate": 1.1855477307358309e-07, "loss": 0.8612, "step": 47943 }, { "epoch": 0.9, "learning_rate": 1.185082918485489e-07, "loss": 0.828, "step": 47944 }, { "epoch": 0.9, "learning_rate": 1.1846181951593205e-07, "loss": 0.8199, "step": 47945 }, { "epoch": 0.9, "learning_rate": 1.1841535607590548e-07, "loss": 0.9459, "step": 47946 }, { "epoch": 0.9, "learning_rate": 1.1836890152864322e-07, "loss": 0.9059, "step": 47947 }, { "epoch": 0.9, "learning_rate": 1.1832245587431845e-07, "loss": 0.7971, "step": 47948 }, { "epoch": 0.9, "learning_rate": 1.1827601911310438e-07, "loss": 0.9803, "step": 47949 }, { "epoch": 0.9, "learning_rate": 1.1822959124517503e-07, "loss": 1.2101, "step": 47950 }, { "epoch": 0.9, "learning_rate": 1.1818317227070303e-07, "loss": 0.8685, "step": 47951 }, { "epoch": 0.9, "learning_rate": 1.1813676218986187e-07, "loss": 0.8992, "step": 47952 }, { "epoch": 0.9, "learning_rate": 1.1809036100282528e-07, "loss": 0.7888, "step": 47953 }, { "epoch": 0.9, "learning_rate": 1.180439687097662e-07, "loss": 0.8796, "step": 47954 }, { "epoch": 0.9, "learning_rate": 1.1799758531085781e-07, "loss": 0.8102, "step": 47955 }, { "epoch": 0.9, "learning_rate": 1.1795121080627359e-07, "loss": 1.0637, "step": 47956 }, { "epoch": 0.9, "learning_rate": 1.1790484519618673e-07, "loss": 0.9924, "step": 47957 }, { "epoch": 0.9, "learning_rate": 1.178584884807693e-07, "loss": 0.6889, "step": 47958 }, { "epoch": 0.9, "learning_rate": 1.1781214066019592e-07, "loss": 0.8146, "step": 47959 }, { "epoch": 0.9, "learning_rate": 1.177658017346392e-07, "loss": 0.718, "step": 47960 }, { "epoch": 0.9, "learning_rate": 1.1771947170427096e-07, "loss": 0.7431, "step": 47961 }, { "epoch": 0.9, "learning_rate": 1.1767315056926604e-07, "loss": 1.1215, "step": 47962 }, { "epoch": 0.9, "learning_rate": 1.1762683832979627e-07, "loss": 0.9059, "step": 47963 }, { "epoch": 0.9, "learning_rate": 1.1758053498603483e-07, "loss": 0.7559, "step": 47964 }, { "epoch": 0.9, "learning_rate": 1.1753424053815465e-07, "loss": 0.7053, "step": 47965 }, { "epoch": 0.9, "learning_rate": 1.1748795498632865e-07, "loss": 0.963, "step": 47966 }, { "epoch": 0.9, "learning_rate": 1.1744167833072917e-07, "loss": 0.7769, "step": 47967 }, { "epoch": 0.91, "learning_rate": 1.173954105715297e-07, "loss": 1.037, "step": 47968 }, { "epoch": 0.91, "learning_rate": 1.1734915170890315e-07, "loss": 0.9252, "step": 47969 }, { "epoch": 0.91, "learning_rate": 1.1730290174302106e-07, "loss": 0.6988, "step": 47970 }, { "epoch": 0.91, "learning_rate": 1.1725666067405744e-07, "loss": 1.0099, "step": 47971 }, { "epoch": 0.91, "learning_rate": 1.1721042850218411e-07, "loss": 0.7554, "step": 47972 }, { "epoch": 0.91, "learning_rate": 1.1716420522757399e-07, "loss": 0.9036, "step": 47973 }, { "epoch": 0.91, "learning_rate": 1.1711799085039971e-07, "loss": 0.873, "step": 47974 }, { "epoch": 0.91, "learning_rate": 1.1707178537083391e-07, "loss": 1.0922, "step": 47975 }, { "epoch": 0.91, "learning_rate": 1.1702558878904868e-07, "loss": 0.9507, "step": 47976 }, { "epoch": 0.91, "learning_rate": 1.1697940110521694e-07, "loss": 0.9713, "step": 47977 }, { "epoch": 0.91, "learning_rate": 1.1693322231951159e-07, "loss": 0.997, "step": 47978 }, { "epoch": 0.91, "learning_rate": 1.1688705243210392e-07, "loss": 0.8017, "step": 47979 }, { "epoch": 0.91, "learning_rate": 1.1684089144316679e-07, "loss": 0.9887, "step": 47980 }, { "epoch": 0.91, "learning_rate": 1.1679473935287344e-07, "loss": 0.9594, "step": 47981 }, { "epoch": 0.91, "learning_rate": 1.1674859616139483e-07, "loss": 0.954, "step": 47982 }, { "epoch": 0.91, "learning_rate": 1.1670246186890416e-07, "loss": 0.8138, "step": 47983 }, { "epoch": 0.91, "learning_rate": 1.1665633647557322e-07, "loss": 0.8534, "step": 47984 }, { "epoch": 0.91, "learning_rate": 1.1661021998157468e-07, "loss": 0.9305, "step": 47985 }, { "epoch": 0.91, "learning_rate": 1.1656411238708033e-07, "loss": 0.8878, "step": 47986 }, { "epoch": 0.91, "learning_rate": 1.1651801369226251e-07, "loss": 1.1089, "step": 47987 }, { "epoch": 0.91, "learning_rate": 1.1647192389729362e-07, "loss": 0.8771, "step": 47988 }, { "epoch": 0.91, "learning_rate": 1.1642584300234517e-07, "loss": 0.9096, "step": 47989 }, { "epoch": 0.91, "learning_rate": 1.1637977100758979e-07, "loss": 0.8383, "step": 47990 }, { "epoch": 0.91, "learning_rate": 1.1633370791319903e-07, "loss": 0.9594, "step": 47991 }, { "epoch": 0.91, "learning_rate": 1.1628765371934525e-07, "loss": 0.7591, "step": 47992 }, { "epoch": 0.91, "learning_rate": 1.1624160842620024e-07, "loss": 1.0081, "step": 47993 }, { "epoch": 0.91, "learning_rate": 1.1619557203393583e-07, "loss": 1.1251, "step": 47994 }, { "epoch": 0.91, "learning_rate": 1.1614954454272437e-07, "loss": 0.9201, "step": 47995 }, { "epoch": 0.91, "learning_rate": 1.161035259527371e-07, "loss": 0.9349, "step": 47996 }, { "epoch": 0.91, "learning_rate": 1.1605751626414668e-07, "loss": 0.9398, "step": 47997 }, { "epoch": 0.91, "learning_rate": 1.1601151547712381e-07, "loss": 0.772, "step": 47998 }, { "epoch": 0.91, "learning_rate": 1.1596552359184137e-07, "loss": 1.0466, "step": 47999 }, { "epoch": 0.91, "learning_rate": 1.1591954060847011e-07, "loss": 1.2602, "step": 48000 }, { "epoch": 0.91, "learning_rate": 1.1587356652718207e-07, "loss": 0.9785, "step": 48001 }, { "epoch": 0.91, "learning_rate": 1.1582760134814963e-07, "loss": 0.9758, "step": 48002 }, { "epoch": 0.91, "learning_rate": 1.1578164507154349e-07, "loss": 0.7284, "step": 48003 }, { "epoch": 0.91, "learning_rate": 1.1573569769753573e-07, "loss": 0.8496, "step": 48004 }, { "epoch": 0.91, "learning_rate": 1.1568975922629761e-07, "loss": 0.808, "step": 48005 }, { "epoch": 0.91, "learning_rate": 1.1564382965800091e-07, "loss": 1.0912, "step": 48006 }, { "epoch": 0.91, "learning_rate": 1.1559790899281692e-07, "loss": 0.92, "step": 48007 }, { "epoch": 0.91, "learning_rate": 1.1555199723091715e-07, "loss": 0.7837, "step": 48008 }, { "epoch": 0.91, "learning_rate": 1.1550609437247367e-07, "loss": 1.032, "step": 48009 }, { "epoch": 0.91, "learning_rate": 1.1546020041765665e-07, "loss": 1.029, "step": 48010 }, { "epoch": 0.91, "learning_rate": 1.1541431536663872e-07, "loss": 0.8645, "step": 48011 }, { "epoch": 0.91, "learning_rate": 1.1536843921959028e-07, "loss": 1.1542, "step": 48012 }, { "epoch": 0.91, "learning_rate": 1.1532257197668289e-07, "loss": 1.0328, "step": 48013 }, { "epoch": 0.91, "learning_rate": 1.1527671363808806e-07, "loss": 0.8776, "step": 48014 }, { "epoch": 0.91, "learning_rate": 1.1523086420397677e-07, "loss": 0.8833, "step": 48015 }, { "epoch": 0.91, "learning_rate": 1.1518502367452055e-07, "loss": 0.8976, "step": 48016 }, { "epoch": 0.91, "learning_rate": 1.151391920498901e-07, "loss": 0.7353, "step": 48017 }, { "epoch": 0.91, "learning_rate": 1.1509336933025722e-07, "loss": 1.157, "step": 48018 }, { "epoch": 0.91, "learning_rate": 1.1504755551579178e-07, "loss": 0.94, "step": 48019 }, { "epoch": 0.91, "learning_rate": 1.150017506066664e-07, "loss": 0.9291, "step": 48020 }, { "epoch": 0.91, "learning_rate": 1.1495595460305098e-07, "loss": 0.8078, "step": 48021 }, { "epoch": 0.91, "learning_rate": 1.1491016750511646e-07, "loss": 0.9758, "step": 48022 }, { "epoch": 0.91, "learning_rate": 1.1486438931303495e-07, "loss": 0.8328, "step": 48023 }, { "epoch": 0.91, "learning_rate": 1.1481862002697659e-07, "loss": 0.8521, "step": 48024 }, { "epoch": 0.91, "learning_rate": 1.1477285964711205e-07, "loss": 0.9639, "step": 48025 }, { "epoch": 0.91, "learning_rate": 1.1472710817361288e-07, "loss": 0.9513, "step": 48026 }, { "epoch": 0.91, "learning_rate": 1.1468136560664923e-07, "loss": 1.0034, "step": 48027 }, { "epoch": 0.91, "learning_rate": 1.1463563194639233e-07, "loss": 0.8645, "step": 48028 }, { "epoch": 0.91, "learning_rate": 1.1458990719301288e-07, "loss": 0.9429, "step": 48029 }, { "epoch": 0.91, "learning_rate": 1.1454419134668188e-07, "loss": 1.0164, "step": 48030 }, { "epoch": 0.91, "learning_rate": 1.1449848440756917e-07, "loss": 1.0617, "step": 48031 }, { "epoch": 0.91, "learning_rate": 1.1445278637584656e-07, "loss": 0.8441, "step": 48032 }, { "epoch": 0.91, "learning_rate": 1.1440709725168365e-07, "loss": 1.0323, "step": 48033 }, { "epoch": 0.91, "learning_rate": 1.1436141703525166e-07, "loss": 0.8659, "step": 48034 }, { "epoch": 0.91, "learning_rate": 1.1431574572672105e-07, "loss": 1.0207, "step": 48035 }, { "epoch": 0.91, "learning_rate": 1.1427008332626222e-07, "loss": 0.9102, "step": 48036 }, { "epoch": 0.91, "learning_rate": 1.1422442983404558e-07, "loss": 1.137, "step": 48037 }, { "epoch": 0.91, "learning_rate": 1.1417878525024184e-07, "loss": 0.8274, "step": 48038 }, { "epoch": 0.91, "learning_rate": 1.1413314957502198e-07, "loss": 0.8763, "step": 48039 }, { "epoch": 0.91, "learning_rate": 1.1408752280855472e-07, "loss": 0.9233, "step": 48040 }, { "epoch": 0.91, "learning_rate": 1.1404190495101247e-07, "loss": 0.8702, "step": 48041 }, { "epoch": 0.91, "learning_rate": 1.1399629600256423e-07, "loss": 0.7387, "step": 48042 }, { "epoch": 0.91, "learning_rate": 1.1395069596338015e-07, "loss": 0.9553, "step": 48043 }, { "epoch": 0.91, "learning_rate": 1.1390510483363177e-07, "loss": 1.0231, "step": 48044 }, { "epoch": 0.91, "learning_rate": 1.1385952261348838e-07, "loss": 0.8539, "step": 48045 }, { "epoch": 0.91, "learning_rate": 1.1381394930312011e-07, "loss": 0.9764, "step": 48046 }, { "epoch": 0.91, "learning_rate": 1.1376838490269743e-07, "loss": 0.9391, "step": 48047 }, { "epoch": 0.91, "learning_rate": 1.1372282941239072e-07, "loss": 0.952, "step": 48048 }, { "epoch": 0.91, "learning_rate": 1.1367728283236956e-07, "loss": 0.8267, "step": 48049 }, { "epoch": 0.91, "learning_rate": 1.1363174516280412e-07, "loss": 1.0775, "step": 48050 }, { "epoch": 0.91, "learning_rate": 1.1358621640386508e-07, "loss": 0.765, "step": 48051 }, { "epoch": 0.91, "learning_rate": 1.1354069655572148e-07, "loss": 0.8423, "step": 48052 }, { "epoch": 0.91, "learning_rate": 1.13495185618544e-07, "loss": 1.0861, "step": 48053 }, { "epoch": 0.91, "learning_rate": 1.1344968359250225e-07, "loss": 0.8381, "step": 48054 }, { "epoch": 0.91, "learning_rate": 1.1340419047776635e-07, "loss": 1.097, "step": 48055 }, { "epoch": 0.91, "learning_rate": 1.1335870627450563e-07, "loss": 1.1815, "step": 48056 }, { "epoch": 0.91, "learning_rate": 1.1331323098289076e-07, "loss": 0.8152, "step": 48057 }, { "epoch": 0.91, "learning_rate": 1.132677646030908e-07, "loss": 0.8257, "step": 48058 }, { "epoch": 0.91, "learning_rate": 1.1322230713527588e-07, "loss": 1.0801, "step": 48059 }, { "epoch": 0.91, "learning_rate": 1.1317685857961613e-07, "loss": 0.7786, "step": 48060 }, { "epoch": 0.91, "learning_rate": 1.1313141893628005e-07, "loss": 0.9291, "step": 48061 }, { "epoch": 0.91, "learning_rate": 1.1308598820543858e-07, "loss": 1.1534, "step": 48062 }, { "epoch": 0.91, "learning_rate": 1.130405663872608e-07, "loss": 0.9516, "step": 48063 }, { "epoch": 0.91, "learning_rate": 1.1299515348191598e-07, "loss": 0.9782, "step": 48064 }, { "epoch": 0.91, "learning_rate": 1.1294974948957454e-07, "loss": 0.7885, "step": 48065 }, { "epoch": 0.91, "learning_rate": 1.1290435441040553e-07, "loss": 0.965, "step": 48066 }, { "epoch": 0.91, "learning_rate": 1.1285896824457826e-07, "loss": 0.8252, "step": 48067 }, { "epoch": 0.91, "learning_rate": 1.128135909922623e-07, "loss": 0.8659, "step": 48068 }, { "epoch": 0.91, "learning_rate": 1.1276822265362725e-07, "loss": 1.1503, "step": 48069 }, { "epoch": 0.91, "learning_rate": 1.1272286322884268e-07, "loss": 0.9544, "step": 48070 }, { "epoch": 0.91, "learning_rate": 1.1267751271807764e-07, "loss": 0.8151, "step": 48071 }, { "epoch": 0.91, "learning_rate": 1.1263217112150171e-07, "loss": 1.0796, "step": 48072 }, { "epoch": 0.91, "learning_rate": 1.1258683843928364e-07, "loss": 0.8541, "step": 48073 }, { "epoch": 0.91, "learning_rate": 1.1254151467159358e-07, "loss": 0.9496, "step": 48074 }, { "epoch": 0.91, "learning_rate": 1.1249619981860027e-07, "loss": 0.9827, "step": 48075 }, { "epoch": 0.91, "learning_rate": 1.1245089388047275e-07, "loss": 0.9511, "step": 48076 }, { "epoch": 0.91, "learning_rate": 1.1240559685738034e-07, "loss": 0.7865, "step": 48077 }, { "epoch": 0.91, "learning_rate": 1.1236030874949233e-07, "loss": 0.8065, "step": 48078 }, { "epoch": 0.91, "learning_rate": 1.1231502955697748e-07, "loss": 0.9107, "step": 48079 }, { "epoch": 0.91, "learning_rate": 1.1226975928000539e-07, "loss": 0.7784, "step": 48080 }, { "epoch": 0.91, "learning_rate": 1.1222449791874506e-07, "loss": 1.0002, "step": 48081 }, { "epoch": 0.91, "learning_rate": 1.1217924547336472e-07, "loss": 1.0429, "step": 48082 }, { "epoch": 0.91, "learning_rate": 1.1213400194403423e-07, "loss": 0.7631, "step": 48083 }, { "epoch": 0.91, "learning_rate": 1.1208876733092206e-07, "loss": 0.8811, "step": 48084 }, { "epoch": 0.91, "learning_rate": 1.1204354163419667e-07, "loss": 0.9553, "step": 48085 }, { "epoch": 0.91, "learning_rate": 1.1199832485402823e-07, "loss": 0.8111, "step": 48086 }, { "epoch": 0.91, "learning_rate": 1.1195311699058464e-07, "loss": 0.8646, "step": 48087 }, { "epoch": 0.91, "learning_rate": 1.1190791804403467e-07, "loss": 0.8547, "step": 48088 }, { "epoch": 0.91, "learning_rate": 1.1186272801454761e-07, "loss": 1.0245, "step": 48089 }, { "epoch": 0.91, "learning_rate": 1.1181754690229168e-07, "loss": 0.869, "step": 48090 }, { "epoch": 0.91, "learning_rate": 1.117723747074359e-07, "loss": 0.999, "step": 48091 }, { "epoch": 0.91, "learning_rate": 1.1172721143014876e-07, "loss": 0.8537, "step": 48092 }, { "epoch": 0.91, "learning_rate": 1.1168205707059926e-07, "loss": 1.0911, "step": 48093 }, { "epoch": 0.91, "learning_rate": 1.1163691162895535e-07, "loss": 0.97, "step": 48094 }, { "epoch": 0.91, "learning_rate": 1.1159177510538632e-07, "loss": 0.8008, "step": 48095 }, { "epoch": 0.91, "learning_rate": 1.115466475000604e-07, "loss": 0.8564, "step": 48096 }, { "epoch": 0.91, "learning_rate": 1.1150152881314574e-07, "loss": 1.0414, "step": 48097 }, { "epoch": 0.91, "learning_rate": 1.1145641904481114e-07, "loss": 0.8691, "step": 48098 }, { "epoch": 0.91, "learning_rate": 1.1141131819522532e-07, "loss": 0.9519, "step": 48099 }, { "epoch": 0.91, "learning_rate": 1.1136622626455623e-07, "loss": 1.1779, "step": 48100 }, { "epoch": 0.91, "learning_rate": 1.1132114325297233e-07, "loss": 0.9694, "step": 48101 }, { "epoch": 0.91, "learning_rate": 1.1127606916064237e-07, "loss": 0.7859, "step": 48102 }, { "epoch": 0.91, "learning_rate": 1.1123100398773373e-07, "loss": 0.9226, "step": 48103 }, { "epoch": 0.91, "learning_rate": 1.1118594773441599e-07, "loss": 0.9774, "step": 48104 }, { "epoch": 0.91, "learning_rate": 1.1114090040085651e-07, "loss": 0.8921, "step": 48105 }, { "epoch": 0.91, "learning_rate": 1.1109586198722294e-07, "loss": 0.9418, "step": 48106 }, { "epoch": 0.91, "learning_rate": 1.1105083249368515e-07, "loss": 0.8979, "step": 48107 }, { "epoch": 0.91, "learning_rate": 1.1100581192040994e-07, "loss": 0.7881, "step": 48108 }, { "epoch": 0.91, "learning_rate": 1.109608002675655e-07, "loss": 0.7872, "step": 48109 }, { "epoch": 0.91, "learning_rate": 1.1091579753532062e-07, "loss": 1.1662, "step": 48110 }, { "epoch": 0.91, "learning_rate": 1.1087080372384262e-07, "loss": 0.835, "step": 48111 }, { "epoch": 0.91, "learning_rate": 1.1082581883329974e-07, "loss": 0.9617, "step": 48112 }, { "epoch": 0.91, "learning_rate": 1.1078084286386014e-07, "loss": 0.9379, "step": 48113 }, { "epoch": 0.91, "learning_rate": 1.1073587581569178e-07, "loss": 0.8269, "step": 48114 }, { "epoch": 0.91, "learning_rate": 1.1069091768896201e-07, "loss": 0.9082, "step": 48115 }, { "epoch": 0.91, "learning_rate": 1.1064596848383957e-07, "loss": 0.8773, "step": 48116 }, { "epoch": 0.91, "learning_rate": 1.1060102820049157e-07, "loss": 0.861, "step": 48117 }, { "epoch": 0.91, "learning_rate": 1.1055609683908592e-07, "loss": 1.1879, "step": 48118 }, { "epoch": 0.91, "learning_rate": 1.1051117439979081e-07, "loss": 1.1177, "step": 48119 }, { "epoch": 0.91, "learning_rate": 1.1046626088277363e-07, "loss": 0.9191, "step": 48120 }, { "epoch": 0.91, "learning_rate": 1.10421356288202e-07, "loss": 0.9808, "step": 48121 }, { "epoch": 0.91, "learning_rate": 1.1037646061624385e-07, "loss": 1.0198, "step": 48122 }, { "epoch": 0.91, "learning_rate": 1.1033157386706711e-07, "loss": 0.662, "step": 48123 }, { "epoch": 0.91, "learning_rate": 1.102866960408383e-07, "loss": 1.0885, "step": 48124 }, { "epoch": 0.91, "learning_rate": 1.1024182713772591e-07, "loss": 1.1147, "step": 48125 }, { "epoch": 0.91, "learning_rate": 1.1019696715789785e-07, "loss": 0.8431, "step": 48126 }, { "epoch": 0.91, "learning_rate": 1.101521161015201e-07, "loss": 0.9718, "step": 48127 }, { "epoch": 0.91, "learning_rate": 1.1010727396876198e-07, "loss": 0.8543, "step": 48128 }, { "epoch": 0.91, "learning_rate": 1.1006244075978944e-07, "loss": 0.8929, "step": 48129 }, { "epoch": 0.91, "learning_rate": 1.1001761647477071e-07, "loss": 0.8039, "step": 48130 }, { "epoch": 0.91, "learning_rate": 1.0997280111387287e-07, "loss": 0.999, "step": 48131 }, { "epoch": 0.91, "learning_rate": 1.0992799467726328e-07, "loss": 0.8267, "step": 48132 }, { "epoch": 0.91, "learning_rate": 1.0988319716510932e-07, "loss": 0.7792, "step": 48133 }, { "epoch": 0.91, "learning_rate": 1.0983840857757805e-07, "loss": 0.7737, "step": 48134 }, { "epoch": 0.91, "learning_rate": 1.0979362891483742e-07, "loss": 1.0089, "step": 48135 }, { "epoch": 0.91, "learning_rate": 1.0974885817705339e-07, "loss": 0.9335, "step": 48136 }, { "epoch": 0.91, "learning_rate": 1.0970409636439444e-07, "loss": 1.1638, "step": 48137 }, { "epoch": 0.91, "learning_rate": 1.0965934347702683e-07, "loss": 0.8687, "step": 48138 }, { "epoch": 0.91, "learning_rate": 1.0961459951511765e-07, "loss": 0.8572, "step": 48139 }, { "epoch": 0.91, "learning_rate": 1.0956986447883456e-07, "loss": 1.0786, "step": 48140 }, { "epoch": 0.91, "learning_rate": 1.0952513836834433e-07, "loss": 0.7123, "step": 48141 }, { "epoch": 0.91, "learning_rate": 1.094804211838138e-07, "loss": 0.8746, "step": 48142 }, { "epoch": 0.91, "learning_rate": 1.0943571292541034e-07, "loss": 0.899, "step": 48143 }, { "epoch": 0.91, "learning_rate": 1.0939101359330073e-07, "loss": 1.0022, "step": 48144 }, { "epoch": 0.91, "learning_rate": 1.0934632318765098e-07, "loss": 0.8915, "step": 48145 }, { "epoch": 0.91, "learning_rate": 1.0930164170862928e-07, "loss": 0.858, "step": 48146 }, { "epoch": 0.91, "learning_rate": 1.0925696915640244e-07, "loss": 0.8019, "step": 48147 }, { "epoch": 0.91, "learning_rate": 1.0921230553113588e-07, "loss": 0.8453, "step": 48148 }, { "epoch": 0.91, "learning_rate": 1.0916765083299808e-07, "loss": 0.727, "step": 48149 }, { "epoch": 0.91, "learning_rate": 1.0912300506215445e-07, "loss": 1.0464, "step": 48150 }, { "epoch": 0.91, "learning_rate": 1.0907836821877237e-07, "loss": 0.7028, "step": 48151 }, { "epoch": 0.91, "learning_rate": 1.0903374030301811e-07, "loss": 0.7782, "step": 48152 }, { "epoch": 0.91, "learning_rate": 1.0898912131505874e-07, "loss": 0.9423, "step": 48153 }, { "epoch": 0.91, "learning_rate": 1.0894451125506078e-07, "loss": 0.8644, "step": 48154 }, { "epoch": 0.91, "learning_rate": 1.0889991012319051e-07, "loss": 1.0368, "step": 48155 }, { "epoch": 0.91, "learning_rate": 1.0885531791961528e-07, "loss": 0.9673, "step": 48156 }, { "epoch": 0.91, "learning_rate": 1.0881073464449998e-07, "loss": 0.8995, "step": 48157 }, { "epoch": 0.91, "learning_rate": 1.0876616029801306e-07, "loss": 1.0858, "step": 48158 }, { "epoch": 0.91, "learning_rate": 1.0872159488031942e-07, "loss": 0.9006, "step": 48159 }, { "epoch": 0.91, "learning_rate": 1.086770383915861e-07, "loss": 0.764, "step": 48160 }, { "epoch": 0.91, "learning_rate": 1.086324908319794e-07, "loss": 0.7648, "step": 48161 }, { "epoch": 0.91, "learning_rate": 1.0858795220166557e-07, "loss": 1.0778, "step": 48162 }, { "epoch": 0.91, "learning_rate": 1.0854342250081112e-07, "loss": 0.9354, "step": 48163 }, { "epoch": 0.91, "learning_rate": 1.0849890172958206e-07, "loss": 0.8474, "step": 48164 }, { "epoch": 0.91, "learning_rate": 1.0845438988814517e-07, "loss": 0.9924, "step": 48165 }, { "epoch": 0.91, "learning_rate": 1.0840988697666587e-07, "loss": 0.9339, "step": 48166 }, { "epoch": 0.91, "learning_rate": 1.0836539299531073e-07, "loss": 0.9384, "step": 48167 }, { "epoch": 0.91, "learning_rate": 1.0832090794424627e-07, "loss": 0.9261, "step": 48168 }, { "epoch": 0.91, "learning_rate": 1.0827643182363762e-07, "loss": 0.943, "step": 48169 }, { "epoch": 0.91, "learning_rate": 1.0823196463365215e-07, "loss": 0.9154, "step": 48170 }, { "epoch": 0.91, "learning_rate": 1.0818750637445475e-07, "loss": 0.8571, "step": 48171 }, { "epoch": 0.91, "learning_rate": 1.0814305704621192e-07, "loss": 0.9139, "step": 48172 }, { "epoch": 0.91, "learning_rate": 1.0809861664908939e-07, "loss": 0.8136, "step": 48173 }, { "epoch": 0.91, "learning_rate": 1.0805418518325366e-07, "loss": 1.0793, "step": 48174 }, { "epoch": 0.91, "learning_rate": 1.0800976264886992e-07, "loss": 0.9888, "step": 48175 }, { "epoch": 0.91, "learning_rate": 1.0796534904610467e-07, "loss": 0.7034, "step": 48176 }, { "epoch": 0.91, "learning_rate": 1.0792094437512363e-07, "loss": 0.7151, "step": 48177 }, { "epoch": 0.91, "learning_rate": 1.0787654863609166e-07, "loss": 0.8915, "step": 48178 }, { "epoch": 0.91, "learning_rate": 1.0783216182917611e-07, "loss": 0.8447, "step": 48179 }, { "epoch": 0.91, "learning_rate": 1.0778778395454159e-07, "loss": 0.9376, "step": 48180 }, { "epoch": 0.91, "learning_rate": 1.0774341501235436e-07, "loss": 1.0801, "step": 48181 }, { "epoch": 0.91, "learning_rate": 1.0769905500277956e-07, "loss": 1.0126, "step": 48182 }, { "epoch": 0.91, "learning_rate": 1.0765470392598316e-07, "loss": 0.812, "step": 48183 }, { "epoch": 0.91, "learning_rate": 1.0761036178213086e-07, "loss": 0.7721, "step": 48184 }, { "epoch": 0.91, "learning_rate": 1.0756602857138809e-07, "loss": 0.9965, "step": 48185 }, { "epoch": 0.91, "learning_rate": 1.0752170429392084e-07, "loss": 0.9455, "step": 48186 }, { "epoch": 0.91, "learning_rate": 1.0747738894989341e-07, "loss": 1.2304, "step": 48187 }, { "epoch": 0.91, "learning_rate": 1.0743308253947232e-07, "loss": 0.8853, "step": 48188 }, { "epoch": 0.91, "learning_rate": 1.0738878506282301e-07, "loss": 0.9581, "step": 48189 }, { "epoch": 0.91, "learning_rate": 1.0734449652011008e-07, "loss": 0.9173, "step": 48190 }, { "epoch": 0.91, "learning_rate": 1.0730021691150034e-07, "loss": 0.926, "step": 48191 }, { "epoch": 0.91, "learning_rate": 1.0725594623715752e-07, "loss": 0.7781, "step": 48192 }, { "epoch": 0.91, "learning_rate": 1.072116844972479e-07, "loss": 0.7478, "step": 48193 }, { "epoch": 0.91, "learning_rate": 1.0716743169193633e-07, "loss": 1.03, "step": 48194 }, { "epoch": 0.91, "learning_rate": 1.0712318782138825e-07, "loss": 0.7181, "step": 48195 }, { "epoch": 0.91, "learning_rate": 1.0707895288576881e-07, "loss": 0.8047, "step": 48196 }, { "epoch": 0.91, "learning_rate": 1.0703472688524314e-07, "loss": 0.8654, "step": 48197 }, { "epoch": 0.91, "learning_rate": 1.0699050981997694e-07, "loss": 0.6892, "step": 48198 }, { "epoch": 0.91, "learning_rate": 1.0694630169013398e-07, "loss": 0.9467, "step": 48199 }, { "epoch": 0.91, "learning_rate": 1.0690210249588079e-07, "loss": 0.8566, "step": 48200 }, { "epoch": 0.91, "learning_rate": 1.0685791223738167e-07, "loss": 0.9844, "step": 48201 }, { "epoch": 0.91, "learning_rate": 1.0681373091480152e-07, "loss": 0.9858, "step": 48202 }, { "epoch": 0.91, "learning_rate": 1.0676955852830545e-07, "loss": 0.8212, "step": 48203 }, { "epoch": 0.91, "learning_rate": 1.0672539507805863e-07, "loss": 0.6853, "step": 48204 }, { "epoch": 0.91, "learning_rate": 1.066812405642259e-07, "loss": 1.0361, "step": 48205 }, { "epoch": 0.91, "learning_rate": 1.0663709498697188e-07, "loss": 0.9895, "step": 48206 }, { "epoch": 0.91, "learning_rate": 1.0659295834646199e-07, "loss": 0.8067, "step": 48207 }, { "epoch": 0.91, "learning_rate": 1.0654883064285971e-07, "loss": 0.9115, "step": 48208 }, { "epoch": 0.91, "learning_rate": 1.0650471187633127e-07, "loss": 0.9011, "step": 48209 }, { "epoch": 0.91, "learning_rate": 1.0646060204704101e-07, "loss": 0.7864, "step": 48210 }, { "epoch": 0.91, "learning_rate": 1.0641650115515295e-07, "loss": 0.9823, "step": 48211 }, { "epoch": 0.91, "learning_rate": 1.0637240920083308e-07, "loss": 1.0604, "step": 48212 }, { "epoch": 0.91, "learning_rate": 1.063283261842446e-07, "loss": 0.9208, "step": 48213 }, { "epoch": 0.91, "learning_rate": 1.0628425210555293e-07, "loss": 0.6311, "step": 48214 }, { "epoch": 0.91, "learning_rate": 1.0624018696492267e-07, "loss": 0.7529, "step": 48215 }, { "epoch": 0.91, "learning_rate": 1.0619613076251784e-07, "loss": 1.0714, "step": 48216 }, { "epoch": 0.91, "learning_rate": 1.0615208349850359e-07, "loss": 0.9068, "step": 48217 }, { "epoch": 0.91, "learning_rate": 1.0610804517304369e-07, "loss": 0.9223, "step": 48218 }, { "epoch": 0.91, "learning_rate": 1.0606401578630327e-07, "loss": 1.1348, "step": 48219 }, { "epoch": 0.91, "learning_rate": 1.0601999533844637e-07, "loss": 0.5855, "step": 48220 }, { "epoch": 0.91, "learning_rate": 1.0597598382963731e-07, "loss": 1.0594, "step": 48221 }, { "epoch": 0.91, "learning_rate": 1.059319812600404e-07, "loss": 0.7449, "step": 48222 }, { "epoch": 0.91, "learning_rate": 1.0588798762982022e-07, "loss": 0.8025, "step": 48223 }, { "epoch": 0.91, "learning_rate": 1.0584400293914082e-07, "loss": 0.8635, "step": 48224 }, { "epoch": 0.91, "learning_rate": 1.0580002718816652e-07, "loss": 1.1457, "step": 48225 }, { "epoch": 0.91, "learning_rate": 1.0575606037706188e-07, "loss": 0.9633, "step": 48226 }, { "epoch": 0.91, "learning_rate": 1.0571210250599013e-07, "loss": 0.869, "step": 48227 }, { "epoch": 0.91, "learning_rate": 1.056681535751164e-07, "loss": 0.9951, "step": 48228 }, { "epoch": 0.91, "learning_rate": 1.0562421358460418e-07, "loss": 0.7542, "step": 48229 }, { "epoch": 0.91, "learning_rate": 1.055802825346175e-07, "loss": 0.8235, "step": 48230 }, { "epoch": 0.91, "learning_rate": 1.0553636042532095e-07, "loss": 1.2396, "step": 48231 }, { "epoch": 0.91, "learning_rate": 1.0549244725687829e-07, "loss": 0.9232, "step": 48232 }, { "epoch": 0.91, "learning_rate": 1.05448543029453e-07, "loss": 0.9681, "step": 48233 }, { "epoch": 0.91, "learning_rate": 1.0540464774320968e-07, "loss": 0.9554, "step": 48234 }, { "epoch": 0.91, "learning_rate": 1.0536076139831209e-07, "loss": 0.9282, "step": 48235 }, { "epoch": 0.91, "learning_rate": 1.0531688399492396e-07, "loss": 0.8658, "step": 48236 }, { "epoch": 0.91, "learning_rate": 1.0527301553320906e-07, "loss": 1.0218, "step": 48237 }, { "epoch": 0.91, "learning_rate": 1.0522915601333144e-07, "loss": 0.9628, "step": 48238 }, { "epoch": 0.91, "learning_rate": 1.051853054354543e-07, "loss": 0.7637, "step": 48239 }, { "epoch": 0.91, "learning_rate": 1.0514146379974249e-07, "loss": 0.8328, "step": 48240 }, { "epoch": 0.91, "learning_rate": 1.0509763110635868e-07, "loss": 0.9715, "step": 48241 }, { "epoch": 0.91, "learning_rate": 1.0505380735546689e-07, "loss": 0.7347, "step": 48242 }, { "epoch": 0.91, "learning_rate": 1.050099925472306e-07, "loss": 1.0667, "step": 48243 }, { "epoch": 0.91, "learning_rate": 1.0496618668181385e-07, "loss": 0.9724, "step": 48244 }, { "epoch": 0.91, "learning_rate": 1.0492238975937957e-07, "loss": 0.7714, "step": 48245 }, { "epoch": 0.91, "learning_rate": 1.0487860178009179e-07, "loss": 0.8414, "step": 48246 }, { "epoch": 0.91, "learning_rate": 1.0483482274411428e-07, "loss": 0.8224, "step": 48247 }, { "epoch": 0.91, "learning_rate": 1.0479105265160938e-07, "loss": 0.8372, "step": 48248 }, { "epoch": 0.91, "learning_rate": 1.0474729150274198e-07, "loss": 1.0609, "step": 48249 }, { "epoch": 0.91, "learning_rate": 1.0470353929767446e-07, "loss": 0.8314, "step": 48250 }, { "epoch": 0.91, "learning_rate": 1.0465979603657e-07, "loss": 0.8064, "step": 48251 }, { "epoch": 0.91, "learning_rate": 1.0461606171959321e-07, "loss": 0.9429, "step": 48252 }, { "epoch": 0.91, "learning_rate": 1.0457233634690616e-07, "loss": 0.8021, "step": 48253 }, { "epoch": 0.91, "learning_rate": 1.0452861991867264e-07, "loss": 0.7254, "step": 48254 }, { "epoch": 0.91, "learning_rate": 1.0448491243505581e-07, "loss": 0.923, "step": 48255 }, { "epoch": 0.91, "learning_rate": 1.0444121389621891e-07, "loss": 1.048, "step": 48256 }, { "epoch": 0.91, "learning_rate": 1.0439752430232487e-07, "loss": 0.9157, "step": 48257 }, { "epoch": 0.91, "learning_rate": 1.0435384365353712e-07, "loss": 0.8225, "step": 48258 }, { "epoch": 0.91, "learning_rate": 1.043101719500192e-07, "loss": 0.8322, "step": 48259 }, { "epoch": 0.91, "learning_rate": 1.0426650919193287e-07, "loss": 0.8161, "step": 48260 }, { "epoch": 0.91, "learning_rate": 1.0422285537944249e-07, "loss": 0.8687, "step": 48261 }, { "epoch": 0.91, "learning_rate": 1.0417921051271013e-07, "loss": 1.0752, "step": 48262 }, { "epoch": 0.91, "learning_rate": 1.0413557459189927e-07, "loss": 0.9805, "step": 48263 }, { "epoch": 0.91, "learning_rate": 1.0409194761717257e-07, "loss": 0.9849, "step": 48264 }, { "epoch": 0.91, "learning_rate": 1.0404832958869321e-07, "loss": 0.6933, "step": 48265 }, { "epoch": 0.91, "learning_rate": 1.0400472050662413e-07, "loss": 0.8018, "step": 48266 }, { "epoch": 0.91, "learning_rate": 1.0396112037112771e-07, "loss": 0.8999, "step": 48267 }, { "epoch": 0.91, "learning_rate": 1.0391752918236741e-07, "loss": 0.8759, "step": 48268 }, { "epoch": 0.91, "learning_rate": 1.0387394694050479e-07, "loss": 1.0567, "step": 48269 }, { "epoch": 0.91, "learning_rate": 1.0383037364570413e-07, "loss": 0.9913, "step": 48270 }, { "epoch": 0.91, "learning_rate": 1.0378680929812701e-07, "loss": 0.8061, "step": 48271 }, { "epoch": 0.91, "learning_rate": 1.0374325389793633e-07, "loss": 0.8357, "step": 48272 }, { "epoch": 0.91, "learning_rate": 1.0369970744529528e-07, "loss": 0.813, "step": 48273 }, { "epoch": 0.91, "learning_rate": 1.0365616994036598e-07, "loss": 0.9761, "step": 48274 }, { "epoch": 0.91, "learning_rate": 1.0361264138331078e-07, "loss": 1.1363, "step": 48275 }, { "epoch": 0.91, "learning_rate": 1.0356912177429262e-07, "loss": 0.9709, "step": 48276 }, { "epoch": 0.91, "learning_rate": 1.0352561111347415e-07, "loss": 0.9071, "step": 48277 }, { "epoch": 0.91, "learning_rate": 1.0348210940101716e-07, "loss": 0.8862, "step": 48278 }, { "epoch": 0.91, "learning_rate": 1.0343861663708487e-07, "loss": 0.7679, "step": 48279 }, { "epoch": 0.91, "learning_rate": 1.0339513282183938e-07, "loss": 1.1415, "step": 48280 }, { "epoch": 0.91, "learning_rate": 1.0335165795544222e-07, "loss": 1.1226, "step": 48281 }, { "epoch": 0.91, "learning_rate": 1.0330819203805742e-07, "loss": 0.9737, "step": 48282 }, { "epoch": 0.91, "learning_rate": 1.0326473506984596e-07, "loss": 0.8682, "step": 48283 }, { "epoch": 0.91, "learning_rate": 1.0322128705097024e-07, "loss": 0.8922, "step": 48284 }, { "epoch": 0.91, "learning_rate": 1.0317784798159314e-07, "loss": 0.7222, "step": 48285 }, { "epoch": 0.91, "learning_rate": 1.0313441786187623e-07, "loss": 0.7791, "step": 48286 }, { "epoch": 0.91, "learning_rate": 1.0309099669198186e-07, "loss": 1.0426, "step": 48287 }, { "epoch": 0.91, "learning_rate": 1.0304758447207241e-07, "loss": 0.9833, "step": 48288 }, { "epoch": 0.91, "learning_rate": 1.0300418120230998e-07, "loss": 0.7879, "step": 48289 }, { "epoch": 0.91, "learning_rate": 1.0296078688285582e-07, "loss": 0.7497, "step": 48290 }, { "epoch": 0.91, "learning_rate": 1.0291740151387342e-07, "loss": 0.7065, "step": 48291 }, { "epoch": 0.91, "learning_rate": 1.0287402509552318e-07, "loss": 1.0294, "step": 48292 }, { "epoch": 0.91, "learning_rate": 1.0283065762796778e-07, "loss": 1.0406, "step": 48293 }, { "epoch": 0.91, "learning_rate": 1.0278729911136987e-07, "loss": 0.9419, "step": 48294 }, { "epoch": 0.91, "learning_rate": 1.027439495458904e-07, "loss": 0.9441, "step": 48295 }, { "epoch": 0.91, "learning_rate": 1.0270060893169148e-07, "loss": 1.037, "step": 48296 }, { "epoch": 0.91, "learning_rate": 1.0265727726893494e-07, "loss": 0.8713, "step": 48297 }, { "epoch": 0.91, "learning_rate": 1.0261395455778283e-07, "loss": 0.699, "step": 48298 }, { "epoch": 0.91, "learning_rate": 1.0257064079839646e-07, "loss": 0.9457, "step": 48299 }, { "epoch": 0.91, "learning_rate": 1.0252733599093789e-07, "loss": 1.0824, "step": 48300 }, { "epoch": 0.91, "learning_rate": 1.0248404013556895e-07, "loss": 0.7321, "step": 48301 }, { "epoch": 0.91, "learning_rate": 1.0244075323245062e-07, "loss": 0.8391, "step": 48302 }, { "epoch": 0.91, "learning_rate": 1.0239747528174554e-07, "loss": 0.8084, "step": 48303 }, { "epoch": 0.91, "learning_rate": 1.0235420628361442e-07, "loss": 0.8934, "step": 48304 }, { "epoch": 0.91, "learning_rate": 1.0231094623821936e-07, "loss": 1.1064, "step": 48305 }, { "epoch": 0.91, "learning_rate": 1.0226769514572161e-07, "loss": 0.9725, "step": 48306 }, { "epoch": 0.91, "learning_rate": 1.022244530062827e-07, "loss": 1.0496, "step": 48307 }, { "epoch": 0.91, "learning_rate": 1.0218121982006418e-07, "loss": 0.955, "step": 48308 }, { "epoch": 0.91, "learning_rate": 1.0213799558722759e-07, "loss": 1.002, "step": 48309 }, { "epoch": 0.91, "learning_rate": 1.0209478030793446e-07, "loss": 0.908, "step": 48310 }, { "epoch": 0.91, "learning_rate": 1.0205157398234522e-07, "loss": 0.9038, "step": 48311 }, { "epoch": 0.91, "learning_rate": 1.0200837661062251e-07, "loss": 1.1122, "step": 48312 }, { "epoch": 0.91, "learning_rate": 1.0196518819292678e-07, "loss": 0.8781, "step": 48313 }, { "epoch": 0.91, "learning_rate": 1.0192200872941927e-07, "loss": 0.798, "step": 48314 }, { "epoch": 0.91, "learning_rate": 1.0187883822026179e-07, "loss": 1.0032, "step": 48315 }, { "epoch": 0.91, "learning_rate": 1.0183567666561506e-07, "loss": 0.7398, "step": 48316 }, { "epoch": 0.91, "learning_rate": 1.0179252406564033e-07, "loss": 0.8712, "step": 48317 }, { "epoch": 0.91, "learning_rate": 1.0174938042049886e-07, "loss": 1.049, "step": 48318 }, { "epoch": 0.91, "learning_rate": 1.0170624573035164e-07, "loss": 0.9901, "step": 48319 }, { "epoch": 0.91, "learning_rate": 1.0166311999535994e-07, "loss": 0.9717, "step": 48320 }, { "epoch": 0.91, "learning_rate": 1.0162000321568444e-07, "loss": 0.8828, "step": 48321 }, { "epoch": 0.91, "learning_rate": 1.0157689539148641e-07, "loss": 0.8767, "step": 48322 }, { "epoch": 0.91, "learning_rate": 1.0153379652292655e-07, "loss": 0.825, "step": 48323 }, { "epoch": 0.91, "learning_rate": 1.0149070661016614e-07, "loss": 1.2122, "step": 48324 }, { "epoch": 0.91, "learning_rate": 1.0144762565336585e-07, "loss": 1.3283, "step": 48325 }, { "epoch": 0.91, "learning_rate": 1.0140455365268642e-07, "loss": 0.8519, "step": 48326 }, { "epoch": 0.91, "learning_rate": 1.013614906082891e-07, "loss": 0.9718, "step": 48327 }, { "epoch": 0.91, "learning_rate": 1.013184365203343e-07, "loss": 0.9377, "step": 48328 }, { "epoch": 0.91, "learning_rate": 1.0127539138898273e-07, "loss": 0.9189, "step": 48329 }, { "epoch": 0.91, "learning_rate": 1.012323552143954e-07, "loss": 0.8341, "step": 48330 }, { "epoch": 0.91, "learning_rate": 1.0118932799673325e-07, "loss": 0.9706, "step": 48331 }, { "epoch": 0.91, "learning_rate": 1.011463097361562e-07, "loss": 0.9962, "step": 48332 }, { "epoch": 0.91, "learning_rate": 1.0110330043282546e-07, "loss": 0.8158, "step": 48333 }, { "epoch": 0.91, "learning_rate": 1.0106030008690149e-07, "loss": 0.6497, "step": 48334 }, { "epoch": 0.91, "learning_rate": 1.0101730869854442e-07, "loss": 0.8339, "step": 48335 }, { "epoch": 0.91, "learning_rate": 1.0097432626791553e-07, "loss": 0.8558, "step": 48336 }, { "epoch": 0.91, "learning_rate": 1.0093135279517497e-07, "loss": 1.0114, "step": 48337 }, { "epoch": 0.91, "learning_rate": 1.0088838828048314e-07, "loss": 1.0868, "step": 48338 }, { "epoch": 0.91, "learning_rate": 1.0084543272400049e-07, "loss": 0.5442, "step": 48339 }, { "epoch": 0.91, "learning_rate": 1.0080248612588717e-07, "loss": 0.8967, "step": 48340 }, { "epoch": 0.91, "learning_rate": 1.0075954848630415e-07, "loss": 1.004, "step": 48341 }, { "epoch": 0.91, "learning_rate": 1.007166198054113e-07, "loss": 0.9406, "step": 48342 }, { "epoch": 0.91, "learning_rate": 1.0067370008336935e-07, "loss": 1.0401, "step": 48343 }, { "epoch": 0.91, "learning_rate": 1.0063078932033732e-07, "loss": 0.9572, "step": 48344 }, { "epoch": 0.91, "learning_rate": 1.005878875164773e-07, "loss": 0.7591, "step": 48345 }, { "epoch": 0.91, "learning_rate": 1.0054499467194833e-07, "loss": 1.0609, "step": 48346 }, { "epoch": 0.91, "learning_rate": 1.0050211078691057e-07, "loss": 0.9205, "step": 48347 }, { "epoch": 0.91, "learning_rate": 1.0045923586152446e-07, "loss": 1.0984, "step": 48348 }, { "epoch": 0.91, "learning_rate": 1.0041636989594983e-07, "loss": 1.061, "step": 48349 }, { "epoch": 0.91, "learning_rate": 1.0037351289034714e-07, "loss": 1.1781, "step": 48350 }, { "epoch": 0.91, "learning_rate": 1.0033066484487596e-07, "loss": 1.1046, "step": 48351 }, { "epoch": 0.91, "learning_rate": 1.0028782575969676e-07, "loss": 0.8206, "step": 48352 }, { "epoch": 0.91, "learning_rate": 1.0024499563496882e-07, "loss": 0.8136, "step": 48353 }, { "epoch": 0.91, "learning_rate": 1.0020217447085312e-07, "loss": 0.8613, "step": 48354 }, { "epoch": 0.91, "learning_rate": 1.0015936226750844e-07, "loss": 0.8684, "step": 48355 }, { "epoch": 0.91, "learning_rate": 1.0011655902509492e-07, "loss": 1.1271, "step": 48356 }, { "epoch": 0.91, "learning_rate": 1.0007376474377328e-07, "loss": 0.8642, "step": 48357 }, { "epoch": 0.91, "learning_rate": 1.0003097942370227e-07, "loss": 0.8628, "step": 48358 }, { "epoch": 0.91, "learning_rate": 9.998820306504204e-08, "loss": 0.8735, "step": 48359 }, { "epoch": 0.91, "learning_rate": 9.994543566795217e-08, "loss": 0.7222, "step": 48360 }, { "epoch": 0.91, "learning_rate": 9.990267723259228e-08, "loss": 0.8481, "step": 48361 }, { "epoch": 0.91, "learning_rate": 9.985992775912252e-08, "loss": 0.9852, "step": 48362 }, { "epoch": 0.91, "learning_rate": 9.981718724770218e-08, "loss": 1.1206, "step": 48363 }, { "epoch": 0.91, "learning_rate": 9.977445569849087e-08, "loss": 0.9988, "step": 48364 }, { "epoch": 0.91, "learning_rate": 9.973173311164791e-08, "loss": 0.8202, "step": 48365 }, { "epoch": 0.91, "learning_rate": 9.968901948733345e-08, "loss": 0.9412, "step": 48366 }, { "epoch": 0.91, "learning_rate": 9.964631482570625e-08, "loss": 1.02, "step": 48367 }, { "epoch": 0.91, "learning_rate": 9.960361912692617e-08, "loss": 0.9967, "step": 48368 }, { "epoch": 0.91, "learning_rate": 9.956093239115283e-08, "loss": 0.9355, "step": 48369 }, { "epoch": 0.91, "learning_rate": 9.951825461854498e-08, "loss": 0.7735, "step": 48370 }, { "epoch": 0.91, "learning_rate": 9.947558580926276e-08, "loss": 0.8141, "step": 48371 }, { "epoch": 0.91, "learning_rate": 9.943292596346494e-08, "loss": 0.9014, "step": 48372 }, { "epoch": 0.91, "learning_rate": 9.939027508131111e-08, "loss": 0.9798, "step": 48373 }, { "epoch": 0.91, "learning_rate": 9.934763316295976e-08, "loss": 0.9681, "step": 48374 }, { "epoch": 0.91, "learning_rate": 9.93050002085716e-08, "loss": 1.255, "step": 48375 }, { "epoch": 0.91, "learning_rate": 9.926237621830454e-08, "loss": 0.8792, "step": 48376 }, { "epoch": 0.91, "learning_rate": 9.921976119231791e-08, "loss": 0.9507, "step": 48377 }, { "epoch": 0.91, "learning_rate": 9.917715513077159e-08, "loss": 0.8766, "step": 48378 }, { "epoch": 0.91, "learning_rate": 9.913455803382404e-08, "loss": 0.8519, "step": 48379 }, { "epoch": 0.91, "learning_rate": 9.909196990163434e-08, "loss": 0.6889, "step": 48380 }, { "epoch": 0.91, "learning_rate": 9.904939073436149e-08, "loss": 0.9185, "step": 48381 }, { "epoch": 0.91, "learning_rate": 9.900682053216453e-08, "loss": 0.8716, "step": 48382 }, { "epoch": 0.91, "learning_rate": 9.896425929520281e-08, "loss": 1.0204, "step": 48383 }, { "epoch": 0.91, "learning_rate": 9.89217070236348e-08, "loss": 0.7845, "step": 48384 }, { "epoch": 0.91, "learning_rate": 9.88791637176198e-08, "loss": 0.9309, "step": 48385 }, { "epoch": 0.91, "learning_rate": 9.883662937731575e-08, "loss": 0.85, "step": 48386 }, { "epoch": 0.91, "learning_rate": 9.879410400288253e-08, "loss": 0.7742, "step": 48387 }, { "epoch": 0.91, "learning_rate": 9.875158759447862e-08, "loss": 0.9727, "step": 48388 }, { "epoch": 0.91, "learning_rate": 9.870908015226222e-08, "loss": 0.7082, "step": 48389 }, { "epoch": 0.91, "learning_rate": 9.866658167639293e-08, "loss": 0.882, "step": 48390 }, { "epoch": 0.91, "learning_rate": 9.862409216702868e-08, "loss": 0.7991, "step": 48391 }, { "epoch": 0.91, "learning_rate": 9.85816116243285e-08, "loss": 0.952, "step": 48392 }, { "epoch": 0.91, "learning_rate": 9.853914004845089e-08, "loss": 0.9075, "step": 48393 }, { "epoch": 0.91, "learning_rate": 9.849667743955488e-08, "loss": 0.9504, "step": 48394 }, { "epoch": 0.91, "learning_rate": 9.845422379779812e-08, "loss": 0.7231, "step": 48395 }, { "epoch": 0.91, "learning_rate": 9.841177912334021e-08, "loss": 1.0042, "step": 48396 }, { "epoch": 0.91, "learning_rate": 9.836934341633881e-08, "loss": 0.801, "step": 48397 }, { "epoch": 0.91, "learning_rate": 9.832691667695237e-08, "loss": 0.9166, "step": 48398 }, { "epoch": 0.91, "learning_rate": 9.828449890533997e-08, "loss": 1.1026, "step": 48399 }, { "epoch": 0.91, "learning_rate": 9.824209010165953e-08, "loss": 1.0179, "step": 48400 }, { "epoch": 0.91, "learning_rate": 9.819969026606952e-08, "loss": 0.9408, "step": 48401 }, { "epoch": 0.91, "learning_rate": 9.815729939872814e-08, "loss": 1.0344, "step": 48402 }, { "epoch": 0.91, "learning_rate": 9.811491749979362e-08, "loss": 0.7507, "step": 48403 }, { "epoch": 0.91, "learning_rate": 9.807254456942444e-08, "loss": 0.6716, "step": 48404 }, { "epoch": 0.91, "learning_rate": 9.80301806077788e-08, "loss": 0.9714, "step": 48405 }, { "epoch": 0.91, "learning_rate": 9.798782561501518e-08, "loss": 1.2877, "step": 48406 }, { "epoch": 0.91, "learning_rate": 9.79454795912907e-08, "loss": 0.9777, "step": 48407 }, { "epoch": 0.91, "learning_rate": 9.790314253676465e-08, "loss": 0.7611, "step": 48408 }, { "epoch": 0.91, "learning_rate": 9.78608144515944e-08, "loss": 0.9039, "step": 48409 }, { "epoch": 0.91, "learning_rate": 9.781849533593818e-08, "loss": 0.758, "step": 48410 }, { "epoch": 0.91, "learning_rate": 9.777618518995419e-08, "loss": 0.7696, "step": 48411 }, { "epoch": 0.91, "learning_rate": 9.773388401380007e-08, "loss": 1.2276, "step": 48412 }, { "epoch": 0.91, "learning_rate": 9.769159180763404e-08, "loss": 0.8382, "step": 48413 }, { "epoch": 0.91, "learning_rate": 9.764930857161403e-08, "loss": 1.0003, "step": 48414 }, { "epoch": 0.91, "learning_rate": 9.760703430589825e-08, "loss": 0.6259, "step": 48415 }, { "epoch": 0.91, "learning_rate": 9.756476901064322e-08, "loss": 0.8786, "step": 48416 }, { "epoch": 0.91, "learning_rate": 9.752251268600854e-08, "loss": 0.8939, "step": 48417 }, { "epoch": 0.91, "learning_rate": 9.748026533215077e-08, "loss": 1.2435, "step": 48418 }, { "epoch": 0.91, "learning_rate": 9.743802694922754e-08, "loss": 1.1766, "step": 48419 }, { "epoch": 0.91, "learning_rate": 9.739579753739792e-08, "loss": 0.8542, "step": 48420 }, { "epoch": 0.91, "learning_rate": 9.735357709681842e-08, "loss": 0.8707, "step": 48421 }, { "epoch": 0.91, "learning_rate": 9.73113656276467e-08, "loss": 0.8752, "step": 48422 }, { "epoch": 0.91, "learning_rate": 9.726916313004098e-08, "loss": 0.7263, "step": 48423 }, { "epoch": 0.91, "learning_rate": 9.722696960415834e-08, "loss": 1.062, "step": 48424 }, { "epoch": 0.91, "learning_rate": 9.718478505015672e-08, "loss": 0.9792, "step": 48425 }, { "epoch": 0.91, "learning_rate": 9.714260946819321e-08, "loss": 1.1863, "step": 48426 }, { "epoch": 0.91, "learning_rate": 9.710044285842601e-08, "loss": 0.7292, "step": 48427 }, { "epoch": 0.91, "learning_rate": 9.70582852210114e-08, "loss": 1.0305, "step": 48428 }, { "epoch": 0.91, "learning_rate": 9.701613655610814e-08, "loss": 0.9194, "step": 48429 }, { "epoch": 0.91, "learning_rate": 9.697399686387248e-08, "loss": 0.9592, "step": 48430 }, { "epoch": 0.91, "learning_rate": 9.693186614446237e-08, "loss": 0.849, "step": 48431 }, { "epoch": 0.91, "learning_rate": 9.688974439803517e-08, "loss": 1.1005, "step": 48432 }, { "epoch": 0.91, "learning_rate": 9.68476316247477e-08, "loss": 0.8604, "step": 48433 }, { "epoch": 0.91, "learning_rate": 9.68055278247576e-08, "loss": 0.9262, "step": 48434 }, { "epoch": 0.91, "learning_rate": 9.6763432998222e-08, "loss": 0.9003, "step": 48435 }, { "epoch": 0.91, "learning_rate": 9.672134714529824e-08, "loss": 0.8071, "step": 48436 }, { "epoch": 0.91, "learning_rate": 9.667927026614288e-08, "loss": 0.9531, "step": 48437 }, { "epoch": 0.91, "learning_rate": 9.663720236091384e-08, "loss": 1.0601, "step": 48438 }, { "epoch": 0.91, "learning_rate": 9.659514342976767e-08, "loss": 0.8953, "step": 48439 }, { "epoch": 0.91, "learning_rate": 9.65530934728609e-08, "loss": 0.8441, "step": 48440 }, { "epoch": 0.91, "learning_rate": 9.651105249035231e-08, "loss": 0.9509, "step": 48441 }, { "epoch": 0.91, "learning_rate": 9.646902048239704e-08, "loss": 0.8724, "step": 48442 }, { "epoch": 0.91, "learning_rate": 9.642699744915302e-08, "loss": 1.0427, "step": 48443 }, { "epoch": 0.91, "learning_rate": 9.638498339077679e-08, "loss": 1.0105, "step": 48444 }, { "epoch": 0.91, "learning_rate": 9.634297830742517e-08, "loss": 0.7381, "step": 48445 }, { "epoch": 0.91, "learning_rate": 9.630098219925526e-08, "loss": 0.7168, "step": 48446 }, { "epoch": 0.91, "learning_rate": 9.625899506642388e-08, "loss": 0.7052, "step": 48447 }, { "epoch": 0.91, "learning_rate": 9.621701690908813e-08, "loss": 0.9051, "step": 48448 }, { "epoch": 0.91, "learning_rate": 9.617504772740372e-08, "loss": 0.9706, "step": 48449 }, { "epoch": 0.91, "learning_rate": 9.613308752152827e-08, "loss": 1.2686, "step": 48450 }, { "epoch": 0.91, "learning_rate": 9.609113629161809e-08, "loss": 0.6819, "step": 48451 }, { "epoch": 0.91, "learning_rate": 9.60491940378297e-08, "loss": 0.818, "step": 48452 }, { "epoch": 0.91, "learning_rate": 9.600726076032018e-08, "loss": 0.8926, "step": 48453 }, { "epoch": 0.91, "learning_rate": 9.596533645924583e-08, "loss": 0.7475, "step": 48454 }, { "epoch": 0.91, "learning_rate": 9.592342113476316e-08, "loss": 0.8156, "step": 48455 }, { "epoch": 0.91, "learning_rate": 9.588151478702845e-08, "loss": 0.877, "step": 48456 }, { "epoch": 0.91, "learning_rate": 9.583961741619907e-08, "loss": 0.9442, "step": 48457 }, { "epoch": 0.91, "learning_rate": 9.579772902243046e-08, "loss": 0.8043, "step": 48458 }, { "epoch": 0.91, "learning_rate": 9.575584960587942e-08, "loss": 0.9902, "step": 48459 }, { "epoch": 0.91, "learning_rate": 9.571397916670222e-08, "loss": 0.9666, "step": 48460 }, { "epoch": 0.91, "learning_rate": 9.567211770505541e-08, "loss": 1.0696, "step": 48461 }, { "epoch": 0.91, "learning_rate": 9.563026522109525e-08, "loss": 1.0259, "step": 48462 }, { "epoch": 0.91, "learning_rate": 9.558842171497773e-08, "loss": 0.893, "step": 48463 }, { "epoch": 0.91, "learning_rate": 9.554658718685994e-08, "loss": 0.8636, "step": 48464 }, { "epoch": 0.91, "learning_rate": 9.550476163689649e-08, "loss": 0.7157, "step": 48465 }, { "epoch": 0.91, "learning_rate": 9.5462945065245e-08, "loss": 0.7526, "step": 48466 }, { "epoch": 0.91, "learning_rate": 9.542113747206149e-08, "loss": 0.8936, "step": 48467 }, { "epoch": 0.91, "learning_rate": 9.537933885750139e-08, "loss": 1.0648, "step": 48468 }, { "epoch": 0.91, "learning_rate": 9.533754922172123e-08, "loss": 0.9532, "step": 48469 }, { "epoch": 0.91, "learning_rate": 9.5295768564877e-08, "loss": 0.6158, "step": 48470 }, { "epoch": 0.91, "learning_rate": 9.525399688712439e-08, "loss": 0.8139, "step": 48471 }, { "epoch": 0.91, "learning_rate": 9.521223418861969e-08, "loss": 0.7993, "step": 48472 }, { "epoch": 0.91, "learning_rate": 9.517048046951888e-08, "loss": 0.7543, "step": 48473 }, { "epoch": 0.91, "learning_rate": 9.512873572997766e-08, "loss": 1.1453, "step": 48474 }, { "epoch": 0.91, "learning_rate": 9.508699997015202e-08, "loss": 0.9536, "step": 48475 }, { "epoch": 0.91, "learning_rate": 9.504527319019824e-08, "loss": 0.9787, "step": 48476 }, { "epoch": 0.91, "learning_rate": 9.50035553902709e-08, "loss": 0.8642, "step": 48477 }, { "epoch": 0.91, "learning_rate": 9.496184657052738e-08, "loss": 0.8105, "step": 48478 }, { "epoch": 0.91, "learning_rate": 9.492014673112199e-08, "loss": 0.6366, "step": 48479 }, { "epoch": 0.91, "learning_rate": 9.487845587221101e-08, "loss": 0.857, "step": 48480 }, { "epoch": 0.91, "learning_rate": 9.483677399395042e-08, "loss": 0.8873, "step": 48481 }, { "epoch": 0.91, "learning_rate": 9.479510109649536e-08, "loss": 0.8688, "step": 48482 }, { "epoch": 0.91, "learning_rate": 9.475343718000157e-08, "loss": 0.94, "step": 48483 }, { "epoch": 0.91, "learning_rate": 9.471178224462502e-08, "loss": 0.7961, "step": 48484 }, { "epoch": 0.91, "learning_rate": 9.467013629052086e-08, "loss": 0.7324, "step": 48485 }, { "epoch": 0.91, "learning_rate": 9.462849931784423e-08, "loss": 0.9171, "step": 48486 }, { "epoch": 0.91, "learning_rate": 9.458687132675142e-08, "loss": 1.11, "step": 48487 }, { "epoch": 0.91, "learning_rate": 9.454525231739786e-08, "loss": 0.976, "step": 48488 }, { "epoch": 0.91, "learning_rate": 9.450364228993759e-08, "loss": 0.7663, "step": 48489 }, { "epoch": 0.91, "learning_rate": 9.446204124452796e-08, "loss": 0.7148, "step": 48490 }, { "epoch": 0.91, "learning_rate": 9.442044918132276e-08, "loss": 0.9905, "step": 48491 }, { "epoch": 0.91, "learning_rate": 9.437886610047798e-08, "loss": 0.866, "step": 48492 }, { "epoch": 0.91, "learning_rate": 9.433729200214874e-08, "loss": 0.8987, "step": 48493 }, { "epoch": 0.91, "learning_rate": 9.429572688649024e-08, "loss": 1.0311, "step": 48494 }, { "epoch": 0.91, "learning_rate": 9.425417075365761e-08, "loss": 1.0034, "step": 48495 }, { "epoch": 0.91, "learning_rate": 9.421262360380657e-08, "loss": 0.7304, "step": 48496 }, { "epoch": 0.91, "learning_rate": 9.417108543709169e-08, "loss": 0.8135, "step": 48497 }, { "epoch": 0.92, "learning_rate": 9.412955625366788e-08, "loss": 0.9116, "step": 48498 }, { "epoch": 0.92, "learning_rate": 9.408803605369082e-08, "loss": 1.0574, "step": 48499 }, { "epoch": 0.92, "learning_rate": 9.404652483731542e-08, "loss": 1.1025, "step": 48500 }, { "epoch": 0.92, "learning_rate": 9.400502260469624e-08, "loss": 1.0026, "step": 48501 }, { "epoch": 0.92, "learning_rate": 9.396352935598846e-08, "loss": 0.768, "step": 48502 }, { "epoch": 0.92, "learning_rate": 9.392204509134723e-08, "loss": 0.975, "step": 48503 }, { "epoch": 0.92, "learning_rate": 9.388056981092742e-08, "loss": 0.7379, "step": 48504 }, { "epoch": 0.92, "learning_rate": 9.383910351488363e-08, "loss": 0.9501, "step": 48505 }, { "epoch": 0.92, "learning_rate": 9.379764620337129e-08, "loss": 1.1008, "step": 48506 }, { "epoch": 0.92, "learning_rate": 9.375619787654389e-08, "loss": 0.8184, "step": 48507 }, { "epoch": 0.92, "learning_rate": 9.371475853455769e-08, "loss": 0.799, "step": 48508 }, { "epoch": 0.92, "learning_rate": 9.367332817756675e-08, "loss": 0.8963, "step": 48509 }, { "epoch": 0.92, "learning_rate": 9.363190680572564e-08, "loss": 0.7426, "step": 48510 }, { "epoch": 0.92, "learning_rate": 9.359049441918955e-08, "loss": 0.7625, "step": 48511 }, { "epoch": 0.92, "learning_rate": 9.354909101811249e-08, "loss": 0.8372, "step": 48512 }, { "epoch": 0.92, "learning_rate": 9.350769660264936e-08, "loss": 1.1647, "step": 48513 }, { "epoch": 0.92, "learning_rate": 9.346631117295473e-08, "loss": 0.8625, "step": 48514 }, { "epoch": 0.92, "learning_rate": 9.342493472918295e-08, "loss": 0.9969, "step": 48515 }, { "epoch": 0.92, "learning_rate": 9.33835672714889e-08, "loss": 0.7522, "step": 48516 }, { "epoch": 0.92, "learning_rate": 9.334220880002687e-08, "loss": 0.8332, "step": 48517 }, { "epoch": 0.92, "learning_rate": 9.330085931495148e-08, "loss": 0.8954, "step": 48518 }, { "epoch": 0.92, "learning_rate": 9.32595188164162e-08, "loss": 1.0916, "step": 48519 }, { "epoch": 0.92, "learning_rate": 9.321818730457649e-08, "loss": 1.0347, "step": 48520 }, { "epoch": 0.92, "learning_rate": 9.317686477958637e-08, "loss": 0.8428, "step": 48521 }, { "epoch": 0.92, "learning_rate": 9.31355512415999e-08, "loss": 0.9717, "step": 48522 }, { "epoch": 0.92, "learning_rate": 9.309424669077139e-08, "loss": 0.6081, "step": 48523 }, { "epoch": 0.92, "learning_rate": 9.305295112725516e-08, "loss": 0.8642, "step": 48524 }, { "epoch": 0.92, "learning_rate": 9.301166455120552e-08, "loss": 1.3464, "step": 48525 }, { "epoch": 0.92, "learning_rate": 9.297038696277655e-08, "loss": 0.73, "step": 48526 }, { "epoch": 0.92, "learning_rate": 9.292911836212254e-08, "loss": 0.8708, "step": 48527 }, { "epoch": 0.92, "learning_rate": 9.288785874939671e-08, "loss": 0.6992, "step": 48528 }, { "epoch": 0.92, "learning_rate": 9.284660812475448e-08, "loss": 0.967, "step": 48529 }, { "epoch": 0.92, "learning_rate": 9.28053664883491e-08, "loss": 0.7871, "step": 48530 }, { "epoch": 0.92, "learning_rate": 9.276413384033428e-08, "loss": 1.0272, "step": 48531 }, { "epoch": 0.92, "learning_rate": 9.272291018086493e-08, "loss": 0.9662, "step": 48532 }, { "epoch": 0.92, "learning_rate": 9.268169551009427e-08, "loss": 0.802, "step": 48533 }, { "epoch": 0.92, "learning_rate": 9.26404898281763e-08, "loss": 1.0751, "step": 48534 }, { "epoch": 0.92, "learning_rate": 9.259929313526483e-08, "loss": 0.8307, "step": 48535 }, { "epoch": 0.92, "learning_rate": 9.255810543151361e-08, "loss": 0.9946, "step": 48536 }, { "epoch": 0.92, "learning_rate": 9.251692671707696e-08, "loss": 1.3762, "step": 48537 }, { "epoch": 0.92, "learning_rate": 9.24757569921081e-08, "loss": 0.9349, "step": 48538 }, { "epoch": 0.92, "learning_rate": 9.243459625676132e-08, "loss": 0.9174, "step": 48539 }, { "epoch": 0.92, "learning_rate": 9.239344451118932e-08, "loss": 0.8884, "step": 48540 }, { "epoch": 0.92, "learning_rate": 9.235230175554694e-08, "loss": 0.6896, "step": 48541 }, { "epoch": 0.92, "learning_rate": 9.231116798998713e-08, "loss": 0.8781, "step": 48542 }, { "epoch": 0.92, "learning_rate": 9.227004321466338e-08, "loss": 1.0032, "step": 48543 }, { "epoch": 0.92, "learning_rate": 9.222892742972945e-08, "loss": 0.9638, "step": 48544 }, { "epoch": 0.92, "learning_rate": 9.21878206353391e-08, "loss": 0.7626, "step": 48545 }, { "epoch": 0.92, "learning_rate": 9.214672283164528e-08, "loss": 0.6745, "step": 48546 }, { "epoch": 0.92, "learning_rate": 9.210563401880201e-08, "loss": 0.9155, "step": 48547 }, { "epoch": 0.92, "learning_rate": 9.20645541969628e-08, "loss": 0.8457, "step": 48548 }, { "epoch": 0.92, "learning_rate": 9.202348336628003e-08, "loss": 0.796, "step": 48549 }, { "epoch": 0.92, "learning_rate": 9.1982421526908e-08, "loss": 0.946, "step": 48550 }, { "epoch": 0.92, "learning_rate": 9.194136867900022e-08, "loss": 1.0879, "step": 48551 }, { "epoch": 0.92, "learning_rate": 9.190032482270877e-08, "loss": 0.9353, "step": 48552 }, { "epoch": 0.92, "learning_rate": 9.185928995818827e-08, "loss": 0.9099, "step": 48553 }, { "epoch": 0.92, "learning_rate": 9.181826408559108e-08, "loss": 0.846, "step": 48554 }, { "epoch": 0.92, "learning_rate": 9.17772472050707e-08, "loss": 0.9262, "step": 48555 }, { "epoch": 0.92, "learning_rate": 9.173623931678033e-08, "loss": 0.9572, "step": 48556 }, { "epoch": 0.92, "learning_rate": 9.169524042087291e-08, "loss": 1.0261, "step": 48557 }, { "epoch": 0.92, "learning_rate": 9.165425051750165e-08, "loss": 0.9222, "step": 48558 }, { "epoch": 0.92, "learning_rate": 9.161326960681948e-08, "loss": 0.9954, "step": 48559 }, { "epoch": 0.92, "learning_rate": 9.157229768897991e-08, "loss": 0.8288, "step": 48560 }, { "epoch": 0.92, "learning_rate": 9.1531334764135e-08, "loss": 0.7789, "step": 48561 }, { "epoch": 0.92, "learning_rate": 9.149038083243855e-08, "loss": 1.1037, "step": 48562 }, { "epoch": 0.92, "learning_rate": 9.14494358940432e-08, "loss": 1.0827, "step": 48563 }, { "epoch": 0.92, "learning_rate": 9.140849994910161e-08, "loss": 0.8934, "step": 48564 }, { "epoch": 0.92, "learning_rate": 9.1367572997767e-08, "loss": 0.8264, "step": 48565 }, { "epoch": 0.92, "learning_rate": 9.1326655040192e-08, "loss": 1.0678, "step": 48566 }, { "epoch": 0.92, "learning_rate": 9.128574607652929e-08, "loss": 0.9952, "step": 48567 }, { "epoch": 0.92, "learning_rate": 9.12448461069318e-08, "loss": 1.0538, "step": 48568 }, { "epoch": 0.92, "learning_rate": 9.120395513155245e-08, "loss": 1.0938, "step": 48569 }, { "epoch": 0.92, "learning_rate": 9.116307315054307e-08, "loss": 0.8115, "step": 48570 }, { "epoch": 0.92, "learning_rate": 9.112220016405743e-08, "loss": 0.7672, "step": 48571 }, { "epoch": 0.92, "learning_rate": 9.10813361722479e-08, "loss": 0.9597, "step": 48572 }, { "epoch": 0.92, "learning_rate": 9.104048117526604e-08, "loss": 0.8965, "step": 48573 }, { "epoch": 0.92, "learning_rate": 9.099963517326588e-08, "loss": 1.2323, "step": 48574 }, { "epoch": 0.92, "learning_rate": 9.095879816639869e-08, "loss": 0.877, "step": 48575 }, { "epoch": 0.92, "learning_rate": 9.091797015481768e-08, "loss": 0.9269, "step": 48576 }, { "epoch": 0.92, "learning_rate": 9.087715113867496e-08, "loss": 0.8527, "step": 48577 }, { "epoch": 0.92, "learning_rate": 9.083634111812346e-08, "loss": 0.8639, "step": 48578 }, { "epoch": 0.92, "learning_rate": 9.079554009331471e-08, "loss": 0.7404, "step": 48579 }, { "epoch": 0.92, "learning_rate": 9.075474806440193e-08, "loss": 0.8445, "step": 48580 }, { "epoch": 0.92, "learning_rate": 9.071396503153723e-08, "loss": 1.106, "step": 48581 }, { "epoch": 0.92, "learning_rate": 9.067319099487215e-08, "loss": 0.8736, "step": 48582 }, { "epoch": 0.92, "learning_rate": 9.06324259545599e-08, "loss": 0.9458, "step": 48583 }, { "epoch": 0.92, "learning_rate": 9.059166991075202e-08, "loss": 0.8083, "step": 48584 }, { "epoch": 0.92, "learning_rate": 9.055092286360117e-08, "loss": 0.8177, "step": 48585 }, { "epoch": 0.92, "learning_rate": 9.051018481325919e-08, "loss": 0.8444, "step": 48586 }, { "epoch": 0.92, "learning_rate": 9.046945575987842e-08, "loss": 1.0659, "step": 48587 }, { "epoch": 0.92, "learning_rate": 9.042873570361072e-08, "loss": 1.0092, "step": 48588 }, { "epoch": 0.92, "learning_rate": 9.038802464460816e-08, "loss": 0.8372, "step": 48589 }, { "epoch": 0.92, "learning_rate": 9.034732258302342e-08, "loss": 0.8836, "step": 48590 }, { "epoch": 0.92, "learning_rate": 9.030662951900692e-08, "loss": 0.8749, "step": 48591 }, { "epoch": 0.92, "learning_rate": 9.026594545271217e-08, "loss": 0.784, "step": 48592 }, { "epoch": 0.92, "learning_rate": 9.022527038429068e-08, "loss": 1.0663, "step": 48593 }, { "epoch": 0.92, "learning_rate": 9.018460431389347e-08, "loss": 0.8807, "step": 48594 }, { "epoch": 0.92, "learning_rate": 9.014394724167402e-08, "loss": 0.818, "step": 48595 }, { "epoch": 0.92, "learning_rate": 9.010329916778249e-08, "loss": 0.8961, "step": 48596 }, { "epoch": 0.92, "learning_rate": 9.006266009237153e-08, "loss": 0.7375, "step": 48597 }, { "epoch": 0.92, "learning_rate": 9.002203001559267e-08, "loss": 0.8311, "step": 48598 }, { "epoch": 0.92, "learning_rate": 8.998140893759749e-08, "loss": 0.8252, "step": 48599 }, { "epoch": 0.92, "learning_rate": 8.994079685853808e-08, "loss": 1.0735, "step": 48600 }, { "epoch": 0.92, "learning_rate": 8.990019377856568e-08, "loss": 0.8594, "step": 48601 }, { "epoch": 0.92, "learning_rate": 8.985959969783242e-08, "loss": 0.9522, "step": 48602 }, { "epoch": 0.92, "learning_rate": 8.9819014616489e-08, "loss": 0.6071, "step": 48603 }, { "epoch": 0.92, "learning_rate": 8.977843853468809e-08, "loss": 0.8256, "step": 48604 }, { "epoch": 0.92, "learning_rate": 8.973787145258012e-08, "loss": 0.936, "step": 48605 }, { "epoch": 0.92, "learning_rate": 8.969731337031718e-08, "loss": 1.0518, "step": 48606 }, { "epoch": 0.92, "learning_rate": 8.965676428805053e-08, "loss": 0.9116, "step": 48607 }, { "epoch": 0.92, "learning_rate": 8.961622420593146e-08, "loss": 0.8835, "step": 48608 }, { "epoch": 0.92, "learning_rate": 8.95756931241118e-08, "loss": 0.9114, "step": 48609 }, { "epoch": 0.92, "learning_rate": 8.953517104274251e-08, "loss": 0.7813, "step": 48610 }, { "epoch": 0.92, "learning_rate": 8.949465796197515e-08, "loss": 0.8884, "step": 48611 }, { "epoch": 0.92, "learning_rate": 8.945415388196043e-08, "loss": 1.2246, "step": 48612 }, { "epoch": 0.92, "learning_rate": 8.941365880285019e-08, "loss": 0.9486, "step": 48613 }, { "epoch": 0.92, "learning_rate": 8.937317272479568e-08, "loss": 0.9203, "step": 48614 }, { "epoch": 0.92, "learning_rate": 8.933269564794705e-08, "loss": 0.9499, "step": 48615 }, { "epoch": 0.92, "learning_rate": 8.929222757245726e-08, "loss": 0.6597, "step": 48616 }, { "epoch": 0.92, "learning_rate": 8.925176849847589e-08, "loss": 0.7803, "step": 48617 }, { "epoch": 0.92, "learning_rate": 8.921131842615422e-08, "loss": 1.0627, "step": 48618 }, { "epoch": 0.92, "learning_rate": 8.917087735564406e-08, "loss": 0.9842, "step": 48619 }, { "epoch": 0.92, "learning_rate": 8.913044528709557e-08, "loss": 0.8886, "step": 48620 }, { "epoch": 0.92, "learning_rate": 8.909002222066033e-08, "loss": 0.7188, "step": 48621 }, { "epoch": 0.92, "learning_rate": 8.904960815648872e-08, "loss": 0.769, "step": 48622 }, { "epoch": 0.92, "learning_rate": 8.900920309473232e-08, "loss": 0.7476, "step": 48623 }, { "epoch": 0.92, "learning_rate": 8.896880703554129e-08, "loss": 0.9316, "step": 48624 }, { "epoch": 0.92, "learning_rate": 8.892841997906714e-08, "loss": 1.0343, "step": 48625 }, { "epoch": 0.92, "learning_rate": 8.888804192546036e-08, "loss": 0.8763, "step": 48626 }, { "epoch": 0.92, "learning_rate": 8.884767287487134e-08, "loss": 0.8182, "step": 48627 }, { "epoch": 0.92, "learning_rate": 8.880731282745136e-08, "loss": 0.847, "step": 48628 }, { "epoch": 0.92, "learning_rate": 8.876696178335087e-08, "loss": 0.8717, "step": 48629 }, { "epoch": 0.92, "learning_rate": 8.872661974272085e-08, "loss": 0.9291, "step": 48630 }, { "epoch": 0.92, "learning_rate": 8.868628670571144e-08, "loss": 1.0134, "step": 48631 }, { "epoch": 0.92, "learning_rate": 8.864596267247394e-08, "loss": 0.91, "step": 48632 }, { "epoch": 0.92, "learning_rate": 8.860564764315794e-08, "loss": 0.8705, "step": 48633 }, { "epoch": 0.92, "learning_rate": 8.85653416179147e-08, "loss": 0.885, "step": 48634 }, { "epoch": 0.92, "learning_rate": 8.852504459689465e-08, "loss": 0.8036, "step": 48635 }, { "epoch": 0.92, "learning_rate": 8.848475658024797e-08, "loss": 0.8005, "step": 48636 }, { "epoch": 0.92, "learning_rate": 8.844447756812564e-08, "loss": 0.9079, "step": 48637 }, { "epoch": 0.92, "learning_rate": 8.840420756067725e-08, "loss": 0.8992, "step": 48638 }, { "epoch": 0.92, "learning_rate": 8.83639465580538e-08, "loss": 0.8757, "step": 48639 }, { "epoch": 0.92, "learning_rate": 8.832369456040546e-08, "loss": 0.9921, "step": 48640 }, { "epoch": 0.92, "learning_rate": 8.828345156788237e-08, "loss": 0.9877, "step": 48641 }, { "epoch": 0.92, "learning_rate": 8.824321758063498e-08, "loss": 0.6738, "step": 48642 }, { "epoch": 0.92, "learning_rate": 8.820299259881343e-08, "loss": 1.329, "step": 48643 }, { "epoch": 0.92, "learning_rate": 8.816277662256817e-08, "loss": 0.9796, "step": 48644 }, { "epoch": 0.92, "learning_rate": 8.81225696520488e-08, "loss": 0.8504, "step": 48645 }, { "epoch": 0.92, "learning_rate": 8.80823716874063e-08, "loss": 0.8739, "step": 48646 }, { "epoch": 0.92, "learning_rate": 8.804218272879001e-08, "loss": 1.1534, "step": 48647 }, { "epoch": 0.92, "learning_rate": 8.800200277635008e-08, "loss": 0.7855, "step": 48648 }, { "epoch": 0.92, "learning_rate": 8.796183183023693e-08, "loss": 0.906, "step": 48649 }, { "epoch": 0.92, "learning_rate": 8.79216698906002e-08, "loss": 0.9989, "step": 48650 }, { "epoch": 0.92, "learning_rate": 8.788151695759001e-08, "loss": 0.8688, "step": 48651 }, { "epoch": 0.92, "learning_rate": 8.784137303135654e-08, "loss": 0.9613, "step": 48652 }, { "epoch": 0.92, "learning_rate": 8.780123811204938e-08, "loss": 0.9205, "step": 48653 }, { "epoch": 0.92, "learning_rate": 8.776111219981814e-08, "loss": 0.7756, "step": 48654 }, { "epoch": 0.92, "learning_rate": 8.772099529481298e-08, "loss": 1.0198, "step": 48655 }, { "epoch": 0.92, "learning_rate": 8.768088739718406e-08, "loss": 1.2809, "step": 48656 }, { "epoch": 0.92, "learning_rate": 8.764078850708013e-08, "loss": 0.9662, "step": 48657 }, { "epoch": 0.92, "learning_rate": 8.76006986246522e-08, "loss": 0.9502, "step": 48658 }, { "epoch": 0.92, "learning_rate": 8.756061775004876e-08, "loss": 0.7743, "step": 48659 }, { "epoch": 0.92, "learning_rate": 8.752054588342024e-08, "loss": 0.9501, "step": 48660 }, { "epoch": 0.92, "learning_rate": 8.748048302491597e-08, "loss": 0.84, "step": 48661 }, { "epoch": 0.92, "learning_rate": 8.744042917468582e-08, "loss": 1.0147, "step": 48662 }, { "epoch": 0.92, "learning_rate": 8.740038433287884e-08, "loss": 1.0239, "step": 48663 }, { "epoch": 0.92, "learning_rate": 8.736034849964492e-08, "loss": 1.1106, "step": 48664 }, { "epoch": 0.92, "learning_rate": 8.732032167513366e-08, "loss": 0.8008, "step": 48665 }, { "epoch": 0.92, "learning_rate": 8.72803038594941e-08, "loss": 0.7792, "step": 48666 }, { "epoch": 0.92, "learning_rate": 8.724029505287613e-08, "loss": 0.8109, "step": 48667 }, { "epoch": 0.92, "learning_rate": 8.720029525542878e-08, "loss": 1.0381, "step": 48668 }, { "epoch": 0.92, "learning_rate": 8.716030446730167e-08, "loss": 1.159, "step": 48669 }, { "epoch": 0.92, "learning_rate": 8.712032268864384e-08, "loss": 0.7852, "step": 48670 }, { "epoch": 0.92, "learning_rate": 8.70803499196049e-08, "loss": 0.9135, "step": 48671 }, { "epoch": 0.92, "learning_rate": 8.704038616033389e-08, "loss": 0.78, "step": 48672 }, { "epoch": 0.92, "learning_rate": 8.700043141098013e-08, "loss": 0.8462, "step": 48673 }, { "epoch": 0.92, "learning_rate": 8.696048567169296e-08, "loss": 1.1522, "step": 48674 }, { "epoch": 0.92, "learning_rate": 8.692054894262087e-08, "loss": 1.1157, "step": 48675 }, { "epoch": 0.92, "learning_rate": 8.688062122391345e-08, "loss": 1.0098, "step": 48676 }, { "epoch": 0.92, "learning_rate": 8.684070251572057e-08, "loss": 0.6958, "step": 48677 }, { "epoch": 0.92, "learning_rate": 8.680079281818965e-08, "loss": 0.8073, "step": 48678 }, { "epoch": 0.92, "learning_rate": 8.676089213147109e-08, "loss": 0.7519, "step": 48679 }, { "epoch": 0.92, "learning_rate": 8.672100045571314e-08, "loss": 0.7511, "step": 48680 }, { "epoch": 0.92, "learning_rate": 8.668111779106508e-08, "loss": 1.1846, "step": 48681 }, { "epoch": 0.92, "learning_rate": 8.664124413767572e-08, "loss": 0.7255, "step": 48682 }, { "epoch": 0.92, "learning_rate": 8.660137949569408e-08, "loss": 1.1036, "step": 48683 }, { "epoch": 0.92, "learning_rate": 8.656152386526895e-08, "loss": 0.9304, "step": 48684 }, { "epoch": 0.92, "learning_rate": 8.652167724654853e-08, "loss": 0.8301, "step": 48685 }, { "epoch": 0.92, "learning_rate": 8.648183963968298e-08, "loss": 0.8181, "step": 48686 }, { "epoch": 0.92, "learning_rate": 8.644201104481969e-08, "loss": 0.878, "step": 48687 }, { "epoch": 0.92, "learning_rate": 8.640219146210798e-08, "loss": 0.924, "step": 48688 }, { "epoch": 0.92, "learning_rate": 8.636238089169663e-08, "loss": 0.8934, "step": 48689 }, { "epoch": 0.92, "learning_rate": 8.632257933373411e-08, "loss": 0.9935, "step": 48690 }, { "epoch": 0.92, "learning_rate": 8.628278678836894e-08, "loss": 0.7367, "step": 48691 }, { "epoch": 0.92, "learning_rate": 8.624300325574986e-08, "loss": 0.8676, "step": 48692 }, { "epoch": 0.92, "learning_rate": 8.620322873602565e-08, "loss": 1.0912, "step": 48693 }, { "epoch": 0.92, "learning_rate": 8.616346322934427e-08, "loss": 0.8615, "step": 48694 }, { "epoch": 0.92, "learning_rate": 8.612370673585474e-08, "loss": 0.9245, "step": 48695 }, { "epoch": 0.92, "learning_rate": 8.608395925570529e-08, "loss": 0.6212, "step": 48696 }, { "epoch": 0.92, "learning_rate": 8.604422078904384e-08, "loss": 1.136, "step": 48697 }, { "epoch": 0.92, "learning_rate": 8.600449133601973e-08, "loss": 0.8166, "step": 48698 }, { "epoch": 0.92, "learning_rate": 8.59647708967809e-08, "loss": 0.9119, "step": 48699 }, { "epoch": 0.92, "learning_rate": 8.592505947147528e-08, "loss": 1.2511, "step": 48700 }, { "epoch": 0.92, "learning_rate": 8.588535706025164e-08, "loss": 0.7779, "step": 48701 }, { "epoch": 0.92, "learning_rate": 8.584566366325792e-08, "loss": 0.7893, "step": 48702 }, { "epoch": 0.92, "learning_rate": 8.58059792806426e-08, "loss": 0.9492, "step": 48703 }, { "epoch": 0.92, "learning_rate": 8.576630391255363e-08, "loss": 0.8664, "step": 48704 }, { "epoch": 0.92, "learning_rate": 8.572663755913979e-08, "loss": 0.8272, "step": 48705 }, { "epoch": 0.92, "learning_rate": 8.568698022054788e-08, "loss": 1.1902, "step": 48706 }, { "epoch": 0.92, "learning_rate": 8.564733189692726e-08, "loss": 0.9683, "step": 48707 }, { "epoch": 0.92, "learning_rate": 8.560769258842527e-08, "loss": 0.7045, "step": 48708 }, { "epoch": 0.92, "learning_rate": 8.556806229519016e-08, "loss": 0.8893, "step": 48709 }, { "epoch": 0.92, "learning_rate": 8.552844101737013e-08, "loss": 0.9401, "step": 48710 }, { "epoch": 0.92, "learning_rate": 8.548882875511255e-08, "loss": 0.664, "step": 48711 }, { "epoch": 0.92, "learning_rate": 8.544922550856566e-08, "loss": 1.0079, "step": 48712 }, { "epoch": 0.92, "learning_rate": 8.540963127787738e-08, "loss": 1.0379, "step": 48713 }, { "epoch": 0.92, "learning_rate": 8.537004606319566e-08, "loss": 0.9089, "step": 48714 }, { "epoch": 0.92, "learning_rate": 8.533046986466786e-08, "loss": 0.8471, "step": 48715 }, { "epoch": 0.92, "learning_rate": 8.52909026824425e-08, "loss": 0.6451, "step": 48716 }, { "epoch": 0.92, "learning_rate": 8.525134451666666e-08, "loss": 0.7805, "step": 48717 }, { "epoch": 0.92, "learning_rate": 8.521179536748775e-08, "loss": 1.076, "step": 48718 }, { "epoch": 0.92, "learning_rate": 8.51722552350548e-08, "loss": 1.012, "step": 48719 }, { "epoch": 0.92, "learning_rate": 8.513272411951406e-08, "loss": 0.745, "step": 48720 }, { "epoch": 0.92, "learning_rate": 8.509320202101379e-08, "loss": 0.7467, "step": 48721 }, { "epoch": 0.92, "learning_rate": 8.505368893970162e-08, "loss": 0.9165, "step": 48722 }, { "epoch": 0.92, "learning_rate": 8.501418487572465e-08, "loss": 0.7346, "step": 48723 }, { "epoch": 0.92, "learning_rate": 8.497468982923084e-08, "loss": 1.1207, "step": 48724 }, { "epoch": 0.92, "learning_rate": 8.493520380036757e-08, "loss": 1.1419, "step": 48725 }, { "epoch": 0.92, "learning_rate": 8.489572678928221e-08, "loss": 1.0135, "step": 48726 }, { "epoch": 0.92, "learning_rate": 8.485625879612186e-08, "loss": 0.8376, "step": 48727 }, { "epoch": 0.92, "learning_rate": 8.481679982103475e-08, "loss": 0.7913, "step": 48728 }, { "epoch": 0.92, "learning_rate": 8.477734986416714e-08, "loss": 0.856, "step": 48729 }, { "epoch": 0.92, "learning_rate": 8.473790892566697e-08, "loss": 0.8513, "step": 48730 }, { "epoch": 0.92, "learning_rate": 8.469847700568162e-08, "loss": 0.9683, "step": 48731 }, { "epoch": 0.92, "learning_rate": 8.465905410435765e-08, "loss": 1.008, "step": 48732 }, { "epoch": 0.92, "learning_rate": 8.461964022184299e-08, "loss": 0.9532, "step": 48733 }, { "epoch": 0.92, "learning_rate": 8.458023535828474e-08, "loss": 0.9224, "step": 48734 }, { "epoch": 0.92, "learning_rate": 8.454083951382975e-08, "loss": 0.8329, "step": 48735 }, { "epoch": 0.92, "learning_rate": 8.450145268862481e-08, "loss": 0.851, "step": 48736 }, { "epoch": 0.92, "learning_rate": 8.44620748828176e-08, "loss": 1.0942, "step": 48737 }, { "epoch": 0.92, "learning_rate": 8.442270609655522e-08, "loss": 0.9552, "step": 48738 }, { "epoch": 0.92, "learning_rate": 8.438334632998397e-08, "loss": 0.8629, "step": 48739 }, { "epoch": 0.92, "learning_rate": 8.434399558325173e-08, "loss": 0.925, "step": 48740 }, { "epoch": 0.92, "learning_rate": 8.430465385650455e-08, "loss": 0.7977, "step": 48741 }, { "epoch": 0.92, "learning_rate": 8.426532114988978e-08, "loss": 0.8391, "step": 48742 }, { "epoch": 0.92, "learning_rate": 8.422599746355426e-08, "loss": 0.9697, "step": 48743 }, { "epoch": 0.92, "learning_rate": 8.418668279764481e-08, "loss": 1.0014, "step": 48744 }, { "epoch": 0.92, "learning_rate": 8.414737715230825e-08, "loss": 0.7769, "step": 48745 }, { "epoch": 0.92, "learning_rate": 8.410808052769143e-08, "loss": 0.7638, "step": 48746 }, { "epoch": 0.92, "learning_rate": 8.406879292394088e-08, "loss": 0.7574, "step": 48747 }, { "epoch": 0.92, "learning_rate": 8.402951434120315e-08, "loss": 0.8502, "step": 48748 }, { "epoch": 0.92, "learning_rate": 8.399024477962564e-08, "loss": 0.9492, "step": 48749 }, { "epoch": 0.92, "learning_rate": 8.395098423935404e-08, "loss": 1.1496, "step": 48750 }, { "epoch": 0.92, "learning_rate": 8.391173272053548e-08, "loss": 1.0536, "step": 48751 }, { "epoch": 0.92, "learning_rate": 8.38724902233165e-08, "loss": 0.8541, "step": 48752 }, { "epoch": 0.92, "learning_rate": 8.383325674784337e-08, "loss": 1.1257, "step": 48753 }, { "epoch": 0.92, "learning_rate": 8.379403229426291e-08, "loss": 0.9007, "step": 48754 }, { "epoch": 0.92, "learning_rate": 8.37548168627214e-08, "loss": 0.8347, "step": 48755 }, { "epoch": 0.92, "learning_rate": 8.371561045336568e-08, "loss": 0.8981, "step": 48756 }, { "epoch": 0.92, "learning_rate": 8.367641306634117e-08, "loss": 1.061, "step": 48757 }, { "epoch": 0.92, "learning_rate": 8.363722470179525e-08, "loss": 1.0168, "step": 48758 }, { "epoch": 0.92, "learning_rate": 8.359804535987392e-08, "loss": 0.9518, "step": 48759 }, { "epoch": 0.92, "learning_rate": 8.35588750407229e-08, "loss": 0.7664, "step": 48760 }, { "epoch": 0.92, "learning_rate": 8.351971374448958e-08, "loss": 0.79, "step": 48761 }, { "epoch": 0.92, "learning_rate": 8.348056147131939e-08, "loss": 0.9518, "step": 48762 }, { "epoch": 0.92, "learning_rate": 8.34414182213586e-08, "loss": 0.9796, "step": 48763 }, { "epoch": 0.92, "learning_rate": 8.340228399475319e-08, "loss": 0.8658, "step": 48764 }, { "epoch": 0.92, "learning_rate": 8.336315879165002e-08, "loss": 0.9048, "step": 48765 }, { "epoch": 0.92, "learning_rate": 8.332404261219451e-08, "loss": 0.8803, "step": 48766 }, { "epoch": 0.92, "learning_rate": 8.328493545653265e-08, "loss": 0.7271, "step": 48767 }, { "epoch": 0.92, "learning_rate": 8.324583732481128e-08, "loss": 0.9836, "step": 48768 }, { "epoch": 0.92, "learning_rate": 8.320674821717529e-08, "loss": 1.0796, "step": 48769 }, { "epoch": 0.92, "learning_rate": 8.316766813377175e-08, "loss": 0.8559, "step": 48770 }, { "epoch": 0.92, "learning_rate": 8.312859707474585e-08, "loss": 0.7167, "step": 48771 }, { "epoch": 0.92, "learning_rate": 8.308953504024359e-08, "loss": 0.7951, "step": 48772 }, { "epoch": 0.92, "learning_rate": 8.305048203041094e-08, "loss": 0.9415, "step": 48773 }, { "epoch": 0.92, "learning_rate": 8.301143804539364e-08, "loss": 1.0148, "step": 48774 }, { "epoch": 0.92, "learning_rate": 8.297240308533738e-08, "loss": 1.0091, "step": 48775 }, { "epoch": 0.92, "learning_rate": 8.293337715038818e-08, "loss": 1.0948, "step": 48776 }, { "epoch": 0.92, "learning_rate": 8.289436024069203e-08, "loss": 1.0008, "step": 48777 }, { "epoch": 0.92, "learning_rate": 8.285535235639352e-08, "loss": 0.9752, "step": 48778 }, { "epoch": 0.92, "learning_rate": 8.28163534976395e-08, "loss": 0.8487, "step": 48779 }, { "epoch": 0.92, "learning_rate": 8.277736366457512e-08, "loss": 0.7647, "step": 48780 }, { "epoch": 0.92, "learning_rate": 8.273838285734554e-08, "loss": 1.0947, "step": 48781 }, { "epoch": 0.92, "learning_rate": 8.269941107609731e-08, "loss": 0.9384, "step": 48782 }, { "epoch": 0.92, "learning_rate": 8.266044832097503e-08, "loss": 0.8171, "step": 48783 }, { "epoch": 0.92, "learning_rate": 8.262149459212443e-08, "loss": 0.7815, "step": 48784 }, { "epoch": 0.92, "learning_rate": 8.258254988969122e-08, "loss": 0.8531, "step": 48785 }, { "epoch": 0.92, "learning_rate": 8.254361421382057e-08, "loss": 0.8867, "step": 48786 }, { "epoch": 0.92, "learning_rate": 8.25046875646579e-08, "loss": 0.9346, "step": 48787 }, { "epoch": 0.92, "learning_rate": 8.246576994234867e-08, "loss": 1.143, "step": 48788 }, { "epoch": 0.92, "learning_rate": 8.24268613470383e-08, "loss": 0.9227, "step": 48789 }, { "epoch": 0.92, "learning_rate": 8.238796177887143e-08, "loss": 0.9243, "step": 48790 }, { "epoch": 0.92, "learning_rate": 8.23490712379943e-08, "loss": 0.8406, "step": 48791 }, { "epoch": 0.92, "learning_rate": 8.231018972455152e-08, "loss": 0.7052, "step": 48792 }, { "epoch": 0.92, "learning_rate": 8.227131723868825e-08, "loss": 0.992, "step": 48793 }, { "epoch": 0.92, "learning_rate": 8.223245378054967e-08, "loss": 1.007, "step": 48794 }, { "epoch": 0.92, "learning_rate": 8.219359935028092e-08, "loss": 0.8992, "step": 48795 }, { "epoch": 0.92, "learning_rate": 8.215475394802719e-08, "loss": 0.8898, "step": 48796 }, { "epoch": 0.92, "learning_rate": 8.211591757393361e-08, "loss": 0.8979, "step": 48797 }, { "epoch": 0.92, "learning_rate": 8.207709022814536e-08, "loss": 0.7332, "step": 48798 }, { "epoch": 0.92, "learning_rate": 8.20382719108065e-08, "loss": 1.1927, "step": 48799 }, { "epoch": 0.92, "learning_rate": 8.19994626220627e-08, "loss": 0.9964, "step": 48800 }, { "epoch": 0.92, "learning_rate": 8.196066236205918e-08, "loss": 0.8031, "step": 48801 }, { "epoch": 0.92, "learning_rate": 8.192187113093997e-08, "loss": 0.8422, "step": 48802 }, { "epoch": 0.92, "learning_rate": 8.188308892885078e-08, "loss": 0.8221, "step": 48803 }, { "epoch": 0.92, "learning_rate": 8.184431575593566e-08, "loss": 0.788, "step": 48804 }, { "epoch": 0.92, "learning_rate": 8.180555161233977e-08, "loss": 0.9366, "step": 48805 }, { "epoch": 0.92, "learning_rate": 8.176679649820774e-08, "loss": 0.9547, "step": 48806 }, { "epoch": 0.92, "learning_rate": 8.172805041368442e-08, "loss": 0.71, "step": 48807 }, { "epoch": 0.92, "learning_rate": 8.168931335891444e-08, "loss": 0.8794, "step": 48808 }, { "epoch": 0.92, "learning_rate": 8.165058533404241e-08, "loss": 0.954, "step": 48809 }, { "epoch": 0.92, "learning_rate": 8.161186633921347e-08, "loss": 0.8005, "step": 48810 }, { "epoch": 0.92, "learning_rate": 8.157315637457086e-08, "loss": 0.8964, "step": 48811 }, { "epoch": 0.92, "learning_rate": 8.153445544026028e-08, "loss": 1.066, "step": 48812 }, { "epoch": 0.92, "learning_rate": 8.149576353642608e-08, "loss": 1.0176, "step": 48813 }, { "epoch": 0.92, "learning_rate": 8.145708066321229e-08, "loss": 0.6862, "step": 48814 }, { "epoch": 0.92, "learning_rate": 8.141840682076352e-08, "loss": 0.877, "step": 48815 }, { "epoch": 0.92, "learning_rate": 8.137974200922438e-08, "loss": 0.7337, "step": 48816 }, { "epoch": 0.92, "learning_rate": 8.134108622873893e-08, "loss": 0.7875, "step": 48817 }, { "epoch": 0.92, "learning_rate": 8.130243947945204e-08, "loss": 1.1765, "step": 48818 }, { "epoch": 0.92, "learning_rate": 8.126380176150778e-08, "loss": 1.2664, "step": 48819 }, { "epoch": 0.92, "learning_rate": 8.12251730750499e-08, "loss": 0.8702, "step": 48820 }, { "epoch": 0.92, "learning_rate": 8.118655342022303e-08, "loss": 0.9511, "step": 48821 }, { "epoch": 0.92, "learning_rate": 8.114794279717203e-08, "loss": 0.8323, "step": 48822 }, { "epoch": 0.92, "learning_rate": 8.110934120603958e-08, "loss": 0.7102, "step": 48823 }, { "epoch": 0.92, "learning_rate": 8.10707486469714e-08, "loss": 0.9103, "step": 48824 }, { "epoch": 0.92, "learning_rate": 8.10321651201107e-08, "loss": 1.1979, "step": 48825 }, { "epoch": 0.92, "learning_rate": 8.09935906256018e-08, "loss": 0.9397, "step": 48826 }, { "epoch": 0.92, "learning_rate": 8.09550251635885e-08, "loss": 0.8458, "step": 48827 }, { "epoch": 0.92, "learning_rate": 8.091646873421483e-08, "loss": 1.0066, "step": 48828 }, { "epoch": 0.92, "learning_rate": 8.087792133762512e-08, "loss": 0.7401, "step": 48829 }, { "epoch": 0.92, "learning_rate": 8.083938297396288e-08, "loss": 0.989, "step": 48830 }, { "epoch": 0.92, "learning_rate": 8.08008536433727e-08, "loss": 1.2022, "step": 48831 }, { "epoch": 0.92, "learning_rate": 8.076233334599726e-08, "loss": 0.9604, "step": 48832 }, { "epoch": 0.92, "learning_rate": 8.07238220819817e-08, "loss": 1.0226, "step": 48833 }, { "epoch": 0.92, "learning_rate": 8.0685319851469e-08, "loss": 1.0334, "step": 48834 }, { "epoch": 0.92, "learning_rate": 8.064682665460289e-08, "loss": 0.6852, "step": 48835 }, { "epoch": 0.92, "learning_rate": 8.060834249152771e-08, "loss": 0.757, "step": 48836 }, { "epoch": 0.92, "learning_rate": 8.056986736238642e-08, "loss": 1.2687, "step": 48837 }, { "epoch": 0.92, "learning_rate": 8.053140126732334e-08, "loss": 0.9606, "step": 48838 }, { "epoch": 0.92, "learning_rate": 8.049294420648168e-08, "loss": 0.8461, "step": 48839 }, { "epoch": 0.92, "learning_rate": 8.04544961800055e-08, "loss": 0.9102, "step": 48840 }, { "epoch": 0.92, "learning_rate": 8.041605718803747e-08, "loss": 0.7591, "step": 48841 }, { "epoch": 0.92, "learning_rate": 8.037762723072218e-08, "loss": 0.7068, "step": 48842 }, { "epoch": 0.92, "learning_rate": 8.033920630820286e-08, "loss": 0.8953, "step": 48843 }, { "epoch": 0.92, "learning_rate": 8.030079442062189e-08, "loss": 0.9757, "step": 48844 }, { "epoch": 0.92, "learning_rate": 8.026239156812444e-08, "loss": 0.8517, "step": 48845 }, { "epoch": 0.92, "learning_rate": 8.02239977508526e-08, "loss": 0.8257, "step": 48846 }, { "epoch": 0.92, "learning_rate": 8.018561296895017e-08, "loss": 0.9505, "step": 48847 }, { "epoch": 0.92, "learning_rate": 8.014723722256063e-08, "loss": 0.741, "step": 48848 }, { "epoch": 0.92, "learning_rate": 8.010887051182692e-08, "loss": 0.9717, "step": 48849 }, { "epoch": 0.92, "learning_rate": 8.007051283689254e-08, "loss": 1.2485, "step": 48850 }, { "epoch": 0.92, "learning_rate": 8.003216419790072e-08, "loss": 0.9136, "step": 48851 }, { "epoch": 0.92, "learning_rate": 7.999382459499466e-08, "loss": 0.8079, "step": 48852 }, { "epoch": 0.92, "learning_rate": 7.995549402831731e-08, "loss": 0.869, "step": 48853 }, { "epoch": 0.92, "learning_rate": 7.991717249801218e-08, "loss": 0.777, "step": 48854 }, { "epoch": 0.92, "learning_rate": 7.987886000422191e-08, "loss": 1.08, "step": 48855 }, { "epoch": 0.92, "learning_rate": 7.984055654708972e-08, "loss": 1.0723, "step": 48856 }, { "epoch": 0.92, "learning_rate": 7.980226212675885e-08, "loss": 1.0183, "step": 48857 }, { "epoch": 0.92, "learning_rate": 7.976397674337221e-08, "loss": 0.8661, "step": 48858 }, { "epoch": 0.92, "learning_rate": 7.972570039707251e-08, "loss": 0.9314, "step": 48859 }, { "epoch": 0.92, "learning_rate": 7.968743308800265e-08, "loss": 1.002, "step": 48860 }, { "epoch": 0.92, "learning_rate": 7.964917481630614e-08, "loss": 0.8164, "step": 48861 }, { "epoch": 0.92, "learning_rate": 7.961092558212508e-08, "loss": 1.0093, "step": 48862 }, { "epoch": 0.92, "learning_rate": 7.95726853856027e-08, "loss": 0.9128, "step": 48863 }, { "epoch": 0.92, "learning_rate": 7.953445422688194e-08, "loss": 0.9095, "step": 48864 }, { "epoch": 0.92, "learning_rate": 7.949623210610463e-08, "loss": 0.8239, "step": 48865 }, { "epoch": 0.92, "learning_rate": 7.94580190234151e-08, "loss": 0.9647, "step": 48866 }, { "epoch": 0.92, "learning_rate": 7.941981497895463e-08, "loss": 0.7741, "step": 48867 }, { "epoch": 0.92, "learning_rate": 7.938161997286615e-08, "loss": 1.092, "step": 48868 }, { "epoch": 0.92, "learning_rate": 7.934343400529287e-08, "loss": 0.9599, "step": 48869 }, { "epoch": 0.92, "learning_rate": 7.930525707637666e-08, "loss": 1.0107, "step": 48870 }, { "epoch": 0.92, "learning_rate": 7.926708918626069e-08, "loss": 0.9103, "step": 48871 }, { "epoch": 0.92, "learning_rate": 7.92289303350871e-08, "loss": 0.8737, "step": 48872 }, { "epoch": 0.92, "learning_rate": 7.919078052299855e-08, "loss": 0.7515, "step": 48873 }, { "epoch": 0.92, "learning_rate": 7.915263975013687e-08, "loss": 0.8778, "step": 48874 }, { "epoch": 0.92, "learning_rate": 7.911450801664583e-08, "loss": 1.1484, "step": 48875 }, { "epoch": 0.92, "learning_rate": 7.907638532266642e-08, "loss": 0.8979, "step": 48876 }, { "epoch": 0.92, "learning_rate": 7.903827166834188e-08, "loss": 0.98, "step": 48877 }, { "epoch": 0.92, "learning_rate": 7.900016705381403e-08, "loss": 1.0168, "step": 48878 }, { "epoch": 0.92, "learning_rate": 7.896207147922524e-08, "loss": 0.7162, "step": 48879 }, { "epoch": 0.92, "learning_rate": 7.892398494471793e-08, "loss": 0.9738, "step": 48880 }, { "epoch": 0.92, "learning_rate": 7.888590745043418e-08, "loss": 0.9831, "step": 48881 }, { "epoch": 0.92, "learning_rate": 7.884783899651666e-08, "loss": 0.8239, "step": 48882 }, { "epoch": 0.92, "learning_rate": 7.880977958310637e-08, "loss": 0.8158, "step": 48883 }, { "epoch": 0.92, "learning_rate": 7.877172921034625e-08, "loss": 0.8312, "step": 48884 }, { "epoch": 0.92, "learning_rate": 7.873368787837871e-08, "loss": 0.7937, "step": 48885 }, { "epoch": 0.92, "learning_rate": 7.869565558734499e-08, "loss": 0.714, "step": 48886 }, { "epoch": 0.92, "learning_rate": 7.865763233738777e-08, "loss": 1.3034, "step": 48887 }, { "epoch": 0.92, "learning_rate": 7.861961812864832e-08, "loss": 0.9283, "step": 48888 }, { "epoch": 0.92, "learning_rate": 7.858161296126932e-08, "loss": 1.0517, "step": 48889 }, { "epoch": 0.92, "learning_rate": 7.854361683539202e-08, "loss": 0.7897, "step": 48890 }, { "epoch": 0.92, "learning_rate": 7.850562975115883e-08, "loss": 0.9825, "step": 48891 }, { "epoch": 0.92, "learning_rate": 7.846765170871129e-08, "loss": 0.7848, "step": 48892 }, { "epoch": 0.92, "learning_rate": 7.842968270819123e-08, "loss": 1.0392, "step": 48893 }, { "epoch": 0.92, "learning_rate": 7.839172274974077e-08, "loss": 0.9348, "step": 48894 }, { "epoch": 0.92, "learning_rate": 7.83537718335009e-08, "loss": 1.0999, "step": 48895 }, { "epoch": 0.92, "learning_rate": 7.831582995961429e-08, "loss": 0.8906, "step": 48896 }, { "epoch": 0.92, "learning_rate": 7.827789712822192e-08, "loss": 0.9185, "step": 48897 }, { "epoch": 0.92, "learning_rate": 7.823997333946564e-08, "loss": 0.7517, "step": 48898 }, { "epoch": 0.92, "learning_rate": 7.8202058593487e-08, "loss": 0.9823, "step": 48899 }, { "epoch": 0.92, "learning_rate": 7.816415289042756e-08, "loss": 1.0695, "step": 48900 }, { "epoch": 0.92, "learning_rate": 7.812625623042885e-08, "loss": 0.9374, "step": 48901 }, { "epoch": 0.92, "learning_rate": 7.808836861363273e-08, "loss": 0.8866, "step": 48902 }, { "epoch": 0.92, "learning_rate": 7.805049004018046e-08, "loss": 0.8379, "step": 48903 }, { "epoch": 0.92, "learning_rate": 7.801262051021274e-08, "loss": 0.8189, "step": 48904 }, { "epoch": 0.92, "learning_rate": 7.7974760023872e-08, "loss": 0.9081, "step": 48905 }, { "epoch": 0.92, "learning_rate": 7.793690858129976e-08, "loss": 0.9727, "step": 48906 }, { "epoch": 0.92, "learning_rate": 7.789906618263592e-08, "loss": 0.8108, "step": 48907 }, { "epoch": 0.92, "learning_rate": 7.786123282802344e-08, "loss": 0.7417, "step": 48908 }, { "epoch": 0.92, "learning_rate": 7.782340851760273e-08, "loss": 0.8044, "step": 48909 }, { "epoch": 0.92, "learning_rate": 7.77855932515148e-08, "loss": 0.7937, "step": 48910 }, { "epoch": 0.92, "learning_rate": 7.774778702990149e-08, "loss": 0.8228, "step": 48911 }, { "epoch": 0.92, "learning_rate": 7.77099898529035e-08, "loss": 1.0873, "step": 48912 }, { "epoch": 0.92, "learning_rate": 7.767220172066214e-08, "loss": 1.1075, "step": 48913 }, { "epoch": 0.92, "learning_rate": 7.763442263331866e-08, "loss": 0.9424, "step": 48914 }, { "epoch": 0.92, "learning_rate": 7.759665259101406e-08, "loss": 0.8989, "step": 48915 }, { "epoch": 0.92, "learning_rate": 7.755889159388936e-08, "loss": 0.9691, "step": 48916 }, { "epoch": 0.92, "learning_rate": 7.752113964208524e-08, "loss": 0.9611, "step": 48917 }, { "epoch": 0.92, "learning_rate": 7.748339673574273e-08, "loss": 1.0135, "step": 48918 }, { "epoch": 0.92, "learning_rate": 7.744566287500311e-08, "loss": 1.0183, "step": 48919 }, { "epoch": 0.92, "learning_rate": 7.740793806000735e-08, "loss": 0.8741, "step": 48920 }, { "epoch": 0.92, "learning_rate": 7.737022229089563e-08, "loss": 0.955, "step": 48921 }, { "epoch": 0.92, "learning_rate": 7.733251556780979e-08, "loss": 0.8897, "step": 48922 }, { "epoch": 0.92, "learning_rate": 7.729481789088944e-08, "loss": 0.7149, "step": 48923 }, { "epoch": 0.92, "learning_rate": 7.72571292602764e-08, "loss": 1.0499, "step": 48924 }, { "epoch": 0.92, "learning_rate": 7.721944967611083e-08, "loss": 1.0567, "step": 48925 }, { "epoch": 0.92, "learning_rate": 7.718177913853319e-08, "loss": 0.8753, "step": 48926 }, { "epoch": 0.92, "learning_rate": 7.714411764768503e-08, "loss": 0.8807, "step": 48927 }, { "epoch": 0.92, "learning_rate": 7.710646520370624e-08, "loss": 0.6974, "step": 48928 }, { "epoch": 0.92, "learning_rate": 7.70688218067378e-08, "loss": 0.7625, "step": 48929 }, { "epoch": 0.92, "learning_rate": 7.703118745691989e-08, "loss": 0.881, "step": 48930 }, { "epoch": 0.92, "learning_rate": 7.699356215439324e-08, "loss": 0.9776, "step": 48931 }, { "epoch": 0.92, "learning_rate": 7.695594589929828e-08, "loss": 0.6112, "step": 48932 }, { "epoch": 0.92, "learning_rate": 7.691833869177546e-08, "loss": 0.7745, "step": 48933 }, { "epoch": 0.92, "learning_rate": 7.688074053196576e-08, "loss": 0.9467, "step": 48934 }, { "epoch": 0.92, "learning_rate": 7.684315142000853e-08, "loss": 0.7482, "step": 48935 }, { "epoch": 0.92, "learning_rate": 7.680557135604504e-08, "loss": 0.9458, "step": 48936 }, { "epoch": 0.92, "learning_rate": 7.67680003402152e-08, "loss": 1.2089, "step": 48937 }, { "epoch": 0.92, "learning_rate": 7.673043837265915e-08, "loss": 1.0542, "step": 48938 }, { "epoch": 0.92, "learning_rate": 7.669288545351733e-08, "loss": 0.9757, "step": 48939 }, { "epoch": 0.92, "learning_rate": 7.665534158293019e-08, "loss": 0.86, "step": 48940 }, { "epoch": 0.92, "learning_rate": 7.661780676103736e-08, "loss": 0.9526, "step": 48941 }, { "epoch": 0.92, "learning_rate": 7.658028098797953e-08, "loss": 0.8086, "step": 48942 }, { "epoch": 0.92, "learning_rate": 7.654276426389717e-08, "loss": 0.9348, "step": 48943 }, { "epoch": 0.92, "learning_rate": 7.650525658892905e-08, "loss": 0.882, "step": 48944 }, { "epoch": 0.92, "learning_rate": 7.646775796321643e-08, "loss": 0.9848, "step": 48945 }, { "epoch": 0.92, "learning_rate": 7.643026838689865e-08, "loss": 0.6799, "step": 48946 }, { "epoch": 0.92, "learning_rate": 7.639278786011562e-08, "loss": 0.8077, "step": 48947 }, { "epoch": 0.92, "learning_rate": 7.635531638300831e-08, "loss": 0.8477, "step": 48948 }, { "epoch": 0.92, "learning_rate": 7.631785395571578e-08, "loss": 0.8937, "step": 48949 }, { "epoch": 0.92, "learning_rate": 7.628040057837793e-08, "loss": 1.032, "step": 48950 }, { "epoch": 0.92, "learning_rate": 7.624295625113464e-08, "loss": 1.092, "step": 48951 }, { "epoch": 0.92, "learning_rate": 7.620552097412581e-08, "loss": 0.8857, "step": 48952 }, { "epoch": 0.92, "learning_rate": 7.616809474749159e-08, "loss": 0.8291, "step": 48953 }, { "epoch": 0.92, "learning_rate": 7.613067757137105e-08, "loss": 0.8502, "step": 48954 }, { "epoch": 0.92, "learning_rate": 7.609326944590461e-08, "loss": 0.7241, "step": 48955 }, { "epoch": 0.92, "learning_rate": 7.605587037123108e-08, "loss": 0.9625, "step": 48956 }, { "epoch": 0.92, "learning_rate": 7.601848034749116e-08, "loss": 1.1436, "step": 48957 }, { "epoch": 0.92, "learning_rate": 7.598109937482362e-08, "loss": 0.8005, "step": 48958 }, { "epoch": 0.92, "learning_rate": 7.594372745336836e-08, "loss": 1.0472, "step": 48959 }, { "epoch": 0.92, "learning_rate": 7.590636458326472e-08, "loss": 0.889, "step": 48960 }, { "epoch": 0.92, "learning_rate": 7.586901076465259e-08, "loss": 0.7933, "step": 48961 }, { "epoch": 0.92, "learning_rate": 7.583166599767127e-08, "loss": 0.9354, "step": 48962 }, { "epoch": 0.92, "learning_rate": 7.579433028246013e-08, "loss": 0.9366, "step": 48963 }, { "epoch": 0.92, "learning_rate": 7.575700361915878e-08, "loss": 0.8211, "step": 48964 }, { "epoch": 0.92, "learning_rate": 7.571968600790625e-08, "loss": 0.7887, "step": 48965 }, { "epoch": 0.92, "learning_rate": 7.568237744884216e-08, "loss": 0.9409, "step": 48966 }, { "epoch": 0.92, "learning_rate": 7.564507794210585e-08, "loss": 0.8235, "step": 48967 }, { "epoch": 0.92, "learning_rate": 7.56077874878361e-08, "loss": 0.9481, "step": 48968 }, { "epoch": 0.92, "learning_rate": 7.557050608617306e-08, "loss": 0.9379, "step": 48969 }, { "epoch": 0.92, "learning_rate": 7.553323373725497e-08, "loss": 0.8233, "step": 48970 }, { "epoch": 0.92, "learning_rate": 7.54959704412217e-08, "loss": 1.0161, "step": 48971 }, { "epoch": 0.92, "learning_rate": 7.545871619821204e-08, "loss": 1.0887, "step": 48972 }, { "epoch": 0.92, "learning_rate": 7.542147100836506e-08, "loss": 0.781, "step": 48973 }, { "epoch": 0.92, "learning_rate": 7.538423487182034e-08, "loss": 0.9069, "step": 48974 }, { "epoch": 0.92, "learning_rate": 7.534700778871612e-08, "loss": 1.0028, "step": 48975 }, { "epoch": 0.92, "learning_rate": 7.530978975919229e-08, "loss": 0.9608, "step": 48976 }, { "epoch": 0.92, "learning_rate": 7.527258078338679e-08, "loss": 0.6858, "step": 48977 }, { "epoch": 0.92, "learning_rate": 7.523538086143977e-08, "loss": 0.8563, "step": 48978 }, { "epoch": 0.92, "learning_rate": 7.519818999348921e-08, "loss": 0.5116, "step": 48979 }, { "epoch": 0.92, "learning_rate": 7.516100817967415e-08, "loss": 0.9229, "step": 48980 }, { "epoch": 0.92, "learning_rate": 7.512383542013362e-08, "loss": 1.1, "step": 48981 }, { "epoch": 0.92, "learning_rate": 7.508667171500644e-08, "loss": 1.0546, "step": 48982 }, { "epoch": 0.92, "learning_rate": 7.504951706443109e-08, "loss": 0.8267, "step": 48983 }, { "epoch": 0.92, "learning_rate": 7.501237146854662e-08, "loss": 0.8836, "step": 48984 }, { "epoch": 0.92, "learning_rate": 7.497523492749181e-08, "loss": 0.7731, "step": 48985 }, { "epoch": 0.92, "learning_rate": 7.493810744140462e-08, "loss": 0.9661, "step": 48986 }, { "epoch": 0.92, "learning_rate": 7.490098901042464e-08, "loss": 1.0792, "step": 48987 }, { "epoch": 0.92, "learning_rate": 7.486387963468983e-08, "loss": 1.0298, "step": 48988 }, { "epoch": 0.92, "learning_rate": 7.482677931433868e-08, "loss": 0.8502, "step": 48989 }, { "epoch": 0.92, "learning_rate": 7.478968804951026e-08, "loss": 0.8068, "step": 48990 }, { "epoch": 0.92, "learning_rate": 7.475260584034277e-08, "loss": 0.9866, "step": 48991 }, { "epoch": 0.92, "learning_rate": 7.471553268697473e-08, "loss": 0.7597, "step": 48992 }, { "epoch": 0.92, "learning_rate": 7.467846858954436e-08, "loss": 1.2335, "step": 48993 }, { "epoch": 0.92, "learning_rate": 7.464141354819043e-08, "loss": 0.7579, "step": 48994 }, { "epoch": 0.92, "learning_rate": 7.460436756305089e-08, "loss": 0.8192, "step": 48995 }, { "epoch": 0.92, "learning_rate": 7.456733063426452e-08, "loss": 0.9254, "step": 48996 }, { "epoch": 0.92, "learning_rate": 7.453030276196927e-08, "loss": 0.8932, "step": 48997 }, { "epoch": 0.92, "learning_rate": 7.449328394630334e-08, "loss": 0.8805, "step": 48998 }, { "epoch": 0.92, "learning_rate": 7.445627418740553e-08, "loss": 1.0328, "step": 48999 }, { "epoch": 0.92, "learning_rate": 7.441927348541322e-08, "loss": 0.8857, "step": 49000 }, { "epoch": 0.92, "learning_rate": 7.43822818404652e-08, "loss": 0.9129, "step": 49001 }, { "epoch": 0.92, "learning_rate": 7.434529925269912e-08, "loss": 0.8266, "step": 49002 }, { "epoch": 0.92, "learning_rate": 7.43083257222535e-08, "loss": 0.9282, "step": 49003 }, { "epoch": 0.92, "learning_rate": 7.427136124926626e-08, "loss": 0.6867, "step": 49004 }, { "epoch": 0.92, "learning_rate": 7.423440583387509e-08, "loss": 0.8709, "step": 49005 }, { "epoch": 0.92, "learning_rate": 7.419745947621875e-08, "loss": 1.1339, "step": 49006 }, { "epoch": 0.92, "learning_rate": 7.416052217643438e-08, "loss": 0.7702, "step": 49007 }, { "epoch": 0.92, "learning_rate": 7.412359393466045e-08, "loss": 0.7639, "step": 49008 }, { "epoch": 0.92, "learning_rate": 7.408667475103464e-08, "loss": 0.9428, "step": 49009 }, { "epoch": 0.92, "learning_rate": 7.404976462569435e-08, "loss": 0.9887, "step": 49010 }, { "epoch": 0.92, "learning_rate": 7.401286355877835e-08, "loss": 0.9295, "step": 49011 }, { "epoch": 0.92, "learning_rate": 7.397597155042374e-08, "loss": 1.156, "step": 49012 }, { "epoch": 0.92, "learning_rate": 7.393908860076848e-08, "loss": 0.9007, "step": 49013 }, { "epoch": 0.92, "learning_rate": 7.390221470995024e-08, "loss": 0.8176, "step": 49014 }, { "epoch": 0.92, "learning_rate": 7.386534987810695e-08, "loss": 0.8955, "step": 49015 }, { "epoch": 0.92, "learning_rate": 7.382849410537574e-08, "loss": 0.7135, "step": 49016 }, { "epoch": 0.92, "learning_rate": 7.379164739189482e-08, "loss": 0.8042, "step": 49017 }, { "epoch": 0.92, "learning_rate": 7.375480973780159e-08, "loss": 0.9607, "step": 49018 }, { "epoch": 0.92, "learning_rate": 7.371798114323314e-08, "loss": 0.9204, "step": 49019 }, { "epoch": 0.92, "learning_rate": 7.368116160832772e-08, "loss": 0.8247, "step": 49020 }, { "epoch": 0.92, "learning_rate": 7.364435113322216e-08, "loss": 0.9746, "step": 49021 }, { "epoch": 0.92, "learning_rate": 7.360754971805439e-08, "loss": 0.892, "step": 49022 }, { "epoch": 0.92, "learning_rate": 7.357075736296154e-08, "loss": 0.8104, "step": 49023 }, { "epoch": 0.92, "learning_rate": 7.353397406808099e-08, "loss": 1.1834, "step": 49024 }, { "epoch": 0.92, "learning_rate": 7.349719983355041e-08, "loss": 1.1453, "step": 49025 }, { "epoch": 0.92, "learning_rate": 7.346043465950664e-08, "loss": 0.9406, "step": 49026 }, { "epoch": 0.92, "learning_rate": 7.342367854608761e-08, "loss": 1.0439, "step": 49027 }, { "epoch": 0.93, "learning_rate": 7.338693149342963e-08, "loss": 0.9593, "step": 49028 }, { "epoch": 0.93, "learning_rate": 7.335019350167088e-08, "loss": 0.8365, "step": 49029 }, { "epoch": 0.93, "learning_rate": 7.331346457094796e-08, "loss": 0.9278, "step": 49030 }, { "epoch": 0.93, "learning_rate": 7.327674470139768e-08, "loss": 1.0049, "step": 49031 }, { "epoch": 0.93, "learning_rate": 7.324003389315854e-08, "loss": 0.9717, "step": 49032 }, { "epoch": 0.93, "learning_rate": 7.320333214636599e-08, "loss": 0.7073, "step": 49033 }, { "epoch": 0.93, "learning_rate": 7.316663946115826e-08, "loss": 1.0233, "step": 49034 }, { "epoch": 0.93, "learning_rate": 7.312995583767163e-08, "loss": 0.9292, "step": 49035 }, { "epoch": 0.93, "learning_rate": 7.30932812760432e-08, "loss": 0.8281, "step": 49036 }, { "epoch": 0.93, "learning_rate": 7.305661577641038e-08, "loss": 1.0051, "step": 49037 }, { "epoch": 0.93, "learning_rate": 7.301995933890943e-08, "loss": 0.865, "step": 49038 }, { "epoch": 0.93, "learning_rate": 7.298331196367803e-08, "loss": 0.8823, "step": 49039 }, { "epoch": 0.93, "learning_rate": 7.29466736508519e-08, "loss": 1.0876, "step": 49040 }, { "epoch": 0.93, "learning_rate": 7.291004440056898e-08, "loss": 0.9124, "step": 49041 }, { "epoch": 0.93, "learning_rate": 7.287342421296528e-08, "loss": 0.7873, "step": 49042 }, { "epoch": 0.93, "learning_rate": 7.283681308817792e-08, "loss": 1.0453, "step": 49043 }, { "epoch": 0.93, "learning_rate": 7.280021102634344e-08, "loss": 0.9221, "step": 49044 }, { "epoch": 0.93, "learning_rate": 7.27636180275984e-08, "loss": 0.9588, "step": 49045 }, { "epoch": 0.93, "learning_rate": 7.272703409207965e-08, "loss": 0.8564, "step": 49046 }, { "epoch": 0.93, "learning_rate": 7.269045921992401e-08, "loss": 0.921, "step": 49047 }, { "epoch": 0.93, "learning_rate": 7.265389341126777e-08, "loss": 0.7868, "step": 49048 }, { "epoch": 0.93, "learning_rate": 7.261733666624693e-08, "loss": 0.9702, "step": 49049 }, { "epoch": 0.93, "learning_rate": 7.258078898499915e-08, "loss": 0.7678, "step": 49050 }, { "epoch": 0.93, "learning_rate": 7.254425036765989e-08, "loss": 0.8994, "step": 49051 }, { "epoch": 0.93, "learning_rate": 7.250772081436569e-08, "loss": 0.8536, "step": 49052 }, { "epoch": 0.93, "learning_rate": 7.247120032525395e-08, "loss": 0.7622, "step": 49053 }, { "epoch": 0.93, "learning_rate": 7.243468890045985e-08, "loss": 0.712, "step": 49054 }, { "epoch": 0.93, "learning_rate": 7.239818654012048e-08, "loss": 0.7979, "step": 49055 }, { "epoch": 0.93, "learning_rate": 7.23616932443716e-08, "loss": 1.1395, "step": 49056 }, { "epoch": 0.93, "learning_rate": 7.232520901334971e-08, "loss": 0.9306, "step": 49057 }, { "epoch": 0.93, "learning_rate": 7.228873384719115e-08, "loss": 0.9974, "step": 49058 }, { "epoch": 0.93, "learning_rate": 7.225226774603216e-08, "loss": 0.8506, "step": 49059 }, { "epoch": 0.93, "learning_rate": 7.221581071000877e-08, "loss": 0.8767, "step": 49060 }, { "epoch": 0.93, "learning_rate": 7.217936273925669e-08, "loss": 0.7511, "step": 49061 }, { "epoch": 0.93, "learning_rate": 7.214292383391303e-08, "loss": 0.9886, "step": 49062 }, { "epoch": 0.93, "learning_rate": 7.210649399411296e-08, "loss": 1.0283, "step": 49063 }, { "epoch": 0.93, "learning_rate": 7.207007321999277e-08, "loss": 0.7967, "step": 49064 }, { "epoch": 0.93, "learning_rate": 7.203366151168844e-08, "loss": 0.7977, "step": 49065 }, { "epoch": 0.93, "learning_rate": 7.1997258869336e-08, "loss": 0.7138, "step": 49066 }, { "epoch": 0.93, "learning_rate": 7.196086529307117e-08, "loss": 0.7606, "step": 49067 }, { "epoch": 0.93, "learning_rate": 7.192448078303022e-08, "loss": 1.1602, "step": 49068 }, { "epoch": 0.93, "learning_rate": 7.188810533934915e-08, "loss": 1.0432, "step": 49069 }, { "epoch": 0.93, "learning_rate": 7.185173896216286e-08, "loss": 0.9641, "step": 49070 }, { "epoch": 0.93, "learning_rate": 7.181538165160817e-08, "loss": 0.7381, "step": 49071 }, { "epoch": 0.93, "learning_rate": 7.177903340782028e-08, "loss": 0.7263, "step": 49072 }, { "epoch": 0.93, "learning_rate": 7.174269423093461e-08, "loss": 0.716, "step": 49073 }, { "epoch": 0.93, "learning_rate": 7.1706364121088e-08, "loss": 1.0213, "step": 49074 }, { "epoch": 0.93, "learning_rate": 7.167004307841479e-08, "loss": 0.8741, "step": 49075 }, { "epoch": 0.93, "learning_rate": 7.163373110305155e-08, "loss": 0.8689, "step": 49076 }, { "epoch": 0.93, "learning_rate": 7.159742819513316e-08, "loss": 0.852, "step": 49077 }, { "epoch": 0.93, "learning_rate": 7.15611343547959e-08, "loss": 0.9816, "step": 49078 }, { "epoch": 0.93, "learning_rate": 7.152484958217465e-08, "loss": 0.76, "step": 49079 }, { "epoch": 0.93, "learning_rate": 7.148857387740515e-08, "loss": 0.7089, "step": 49080 }, { "epoch": 0.93, "learning_rate": 7.145230724062313e-08, "loss": 0.8604, "step": 49081 }, { "epoch": 0.93, "learning_rate": 7.141604967196319e-08, "loss": 0.7433, "step": 49082 }, { "epoch": 0.93, "learning_rate": 7.13798011715619e-08, "loss": 0.8705, "step": 49083 }, { "epoch": 0.93, "learning_rate": 7.134356173955359e-08, "loss": 0.7801, "step": 49084 }, { "epoch": 0.93, "learning_rate": 7.130733137607399e-08, "loss": 0.8552, "step": 49085 }, { "epoch": 0.93, "learning_rate": 7.127111008125826e-08, "loss": 0.8464, "step": 49086 }, { "epoch": 0.93, "learning_rate": 7.123489785524185e-08, "loss": 1.115, "step": 49087 }, { "epoch": 0.93, "learning_rate": 7.119869469815993e-08, "loss": 1.1218, "step": 49088 }, { "epoch": 0.93, "learning_rate": 7.116250061014768e-08, "loss": 0.8931, "step": 49089 }, { "epoch": 0.93, "learning_rate": 7.112631559134025e-08, "loss": 0.7849, "step": 49090 }, { "epoch": 0.93, "learning_rate": 7.109013964187227e-08, "loss": 0.8768, "step": 49091 }, { "epoch": 0.93, "learning_rate": 7.105397276187948e-08, "loss": 0.9596, "step": 49092 }, { "epoch": 0.93, "learning_rate": 7.101781495149673e-08, "loss": 1.1226, "step": 49093 }, { "epoch": 0.93, "learning_rate": 7.098166621085867e-08, "loss": 1.0056, "step": 49094 }, { "epoch": 0.93, "learning_rate": 7.094552654010101e-08, "loss": 0.816, "step": 49095 }, { "epoch": 0.93, "learning_rate": 7.090939593935809e-08, "loss": 0.8666, "step": 49096 }, { "epoch": 0.93, "learning_rate": 7.087327440876507e-08, "loss": 0.7518, "step": 49097 }, { "epoch": 0.93, "learning_rate": 7.083716194845686e-08, "loss": 0.9008, "step": 49098 }, { "epoch": 0.93, "learning_rate": 7.080105855856778e-08, "loss": 0.9675, "step": 49099 }, { "epoch": 0.93, "learning_rate": 7.076496423923356e-08, "loss": 1.2108, "step": 49100 }, { "epoch": 0.93, "learning_rate": 7.072887899058828e-08, "loss": 0.8766, "step": 49101 }, { "epoch": 0.93, "learning_rate": 7.069280281276708e-08, "loss": 0.8656, "step": 49102 }, { "epoch": 0.93, "learning_rate": 7.065673570590404e-08, "loss": 0.7086, "step": 49103 }, { "epoch": 0.93, "learning_rate": 7.062067767013459e-08, "loss": 0.6675, "step": 49104 }, { "epoch": 0.93, "learning_rate": 7.058462870559308e-08, "loss": 1.0125, "step": 49105 }, { "epoch": 0.93, "learning_rate": 7.054858881241383e-08, "loss": 1.2609, "step": 49106 }, { "epoch": 0.93, "learning_rate": 7.051255799073175e-08, "loss": 0.9898, "step": 49107 }, { "epoch": 0.93, "learning_rate": 7.047653624068118e-08, "loss": 0.8631, "step": 49108 }, { "epoch": 0.93, "learning_rate": 7.044052356239701e-08, "loss": 0.9266, "step": 49109 }, { "epoch": 0.93, "learning_rate": 7.040451995601327e-08, "loss": 0.8019, "step": 49110 }, { "epoch": 0.93, "learning_rate": 7.03685254216649e-08, "loss": 1.1275, "step": 49111 }, { "epoch": 0.93, "learning_rate": 7.033253995948535e-08, "loss": 1.1369, "step": 49112 }, { "epoch": 0.93, "learning_rate": 7.029656356961012e-08, "loss": 1.1799, "step": 49113 }, { "epoch": 0.93, "learning_rate": 7.026059625217268e-08, "loss": 0.7882, "step": 49114 }, { "epoch": 0.93, "learning_rate": 7.022463800730766e-08, "loss": 0.8954, "step": 49115 }, { "epoch": 0.93, "learning_rate": 7.018868883514967e-08, "loss": 0.6153, "step": 49116 }, { "epoch": 0.93, "learning_rate": 7.01527487358325e-08, "loss": 0.9016, "step": 49117 }, { "epoch": 0.93, "learning_rate": 7.011681770949019e-08, "loss": 0.8996, "step": 49118 }, { "epoch": 0.93, "learning_rate": 7.008089575625737e-08, "loss": 1.1498, "step": 49119 }, { "epoch": 0.93, "learning_rate": 7.00449828762681e-08, "loss": 0.578, "step": 49120 }, { "epoch": 0.93, "learning_rate": 7.000907906965615e-08, "loss": 0.8839, "step": 49121 }, { "epoch": 0.93, "learning_rate": 6.997318433655587e-08, "loss": 0.9942, "step": 49122 }, { "epoch": 0.93, "learning_rate": 6.993729867710159e-08, "loss": 0.8221, "step": 49123 }, { "epoch": 0.93, "learning_rate": 6.990142209142626e-08, "loss": 0.9241, "step": 49124 }, { "epoch": 0.93, "learning_rate": 6.986555457966503e-08, "loss": 1.0355, "step": 49125 }, { "epoch": 0.93, "learning_rate": 6.982969614195117e-08, "loss": 0.9049, "step": 49126 }, { "epoch": 0.93, "learning_rate": 6.979384677841844e-08, "loss": 0.8074, "step": 49127 }, { "epoch": 0.93, "learning_rate": 6.975800648920117e-08, "loss": 0.9852, "step": 49128 }, { "epoch": 0.93, "learning_rate": 6.972217527443315e-08, "loss": 0.8967, "step": 49129 }, { "epoch": 0.93, "learning_rate": 6.968635313424787e-08, "loss": 1.0049, "step": 49130 }, { "epoch": 0.93, "learning_rate": 6.965054006877913e-08, "loss": 1.0499, "step": 49131 }, { "epoch": 0.93, "learning_rate": 6.961473607816128e-08, "loss": 1.0612, "step": 49132 }, { "epoch": 0.93, "learning_rate": 6.957894116252667e-08, "loss": 0.7664, "step": 49133 }, { "epoch": 0.93, "learning_rate": 6.95431553220105e-08, "loss": 0.951, "step": 49134 }, { "epoch": 0.93, "learning_rate": 6.950737855674517e-08, "loss": 1.0493, "step": 49135 }, { "epoch": 0.93, "learning_rate": 6.947161086686472e-08, "loss": 0.8671, "step": 49136 }, { "epoch": 0.93, "learning_rate": 6.943585225250321e-08, "loss": 1.1526, "step": 49137 }, { "epoch": 0.93, "learning_rate": 6.94001027137936e-08, "loss": 0.862, "step": 49138 }, { "epoch": 0.93, "learning_rate": 6.936436225086912e-08, "loss": 0.9849, "step": 49139 }, { "epoch": 0.93, "learning_rate": 6.932863086386382e-08, "loss": 0.7912, "step": 49140 }, { "epoch": 0.93, "learning_rate": 6.929290855291093e-08, "loss": 0.9655, "step": 49141 }, { "epoch": 0.93, "learning_rate": 6.925719531814367e-08, "loss": 0.9406, "step": 49142 }, { "epoch": 0.93, "learning_rate": 6.922149115969556e-08, "loss": 0.8695, "step": 49143 }, { "epoch": 0.93, "learning_rate": 6.918579607770038e-08, "loss": 1.0389, "step": 49144 }, { "epoch": 0.93, "learning_rate": 6.915011007228994e-08, "loss": 0.7733, "step": 49145 }, { "epoch": 0.93, "learning_rate": 6.911443314359944e-08, "loss": 0.656, "step": 49146 }, { "epoch": 0.93, "learning_rate": 6.907876529176045e-08, "loss": 1.2015, "step": 49147 }, { "epoch": 0.93, "learning_rate": 6.904310651690698e-08, "loss": 0.8497, "step": 49148 }, { "epoch": 0.93, "learning_rate": 6.900745681917204e-08, "loss": 0.7736, "step": 49149 }, { "epoch": 0.93, "learning_rate": 6.897181619868881e-08, "loss": 1.0931, "step": 49150 }, { "epoch": 0.93, "learning_rate": 6.893618465559026e-08, "loss": 0.9992, "step": 49151 }, { "epoch": 0.93, "learning_rate": 6.890056219000907e-08, "loss": 0.8542, "step": 49152 }, { "epoch": 0.93, "learning_rate": 6.886494880207928e-08, "loss": 0.7639, "step": 49153 }, { "epoch": 0.93, "learning_rate": 6.882934449193273e-08, "loss": 0.7788, "step": 49154 }, { "epoch": 0.93, "learning_rate": 6.879374925970323e-08, "loss": 0.8104, "step": 49155 }, { "epoch": 0.93, "learning_rate": 6.875816310552313e-08, "loss": 1.1406, "step": 49156 }, { "epoch": 0.93, "learning_rate": 6.872258602952542e-08, "loss": 1.0352, "step": 49157 }, { "epoch": 0.93, "learning_rate": 6.868701803184302e-08, "loss": 0.6844, "step": 49158 }, { "epoch": 0.93, "learning_rate": 6.86514591126089e-08, "loss": 0.9056, "step": 49159 }, { "epoch": 0.93, "learning_rate": 6.861590927195599e-08, "loss": 0.7378, "step": 49160 }, { "epoch": 0.93, "learning_rate": 6.858036851001587e-08, "loss": 0.7853, "step": 49161 }, { "epoch": 0.93, "learning_rate": 6.85448368269226e-08, "loss": 0.7934, "step": 49162 }, { "epoch": 0.93, "learning_rate": 6.850931422280882e-08, "loss": 1.0108, "step": 49163 }, { "epoch": 0.93, "learning_rate": 6.847380069780584e-08, "loss": 0.877, "step": 49164 }, { "epoch": 0.93, "learning_rate": 6.843829625204773e-08, "loss": 0.8555, "step": 49165 }, { "epoch": 0.93, "learning_rate": 6.840280088566631e-08, "loss": 0.7064, "step": 49166 }, { "epoch": 0.93, "learning_rate": 6.836731459879425e-08, "loss": 0.7229, "step": 49167 }, { "epoch": 0.93, "learning_rate": 6.833183739156424e-08, "loss": 1.0068, "step": 49168 }, { "epoch": 0.93, "learning_rate": 6.829636926410837e-08, "loss": 0.9603, "step": 49169 }, { "epoch": 0.93, "learning_rate": 6.826091021655933e-08, "loss": 0.9298, "step": 49170 }, { "epoch": 0.93, "learning_rate": 6.822546024904953e-08, "loss": 0.8769, "step": 49171 }, { "epoch": 0.93, "learning_rate": 6.81900193617116e-08, "loss": 0.8271, "step": 49172 }, { "epoch": 0.93, "learning_rate": 6.815458755467685e-08, "loss": 1.0752, "step": 49173 }, { "epoch": 0.93, "learning_rate": 6.811916482807907e-08, "loss": 0.9084, "step": 49174 }, { "epoch": 0.93, "learning_rate": 6.808375118204952e-08, "loss": 1.152, "step": 49175 }, { "epoch": 0.93, "learning_rate": 6.804834661672033e-08, "loss": 0.9901, "step": 49176 }, { "epoch": 0.93, "learning_rate": 6.801295113222445e-08, "loss": 0.8918, "step": 49177 }, { "epoch": 0.93, "learning_rate": 6.797756472869344e-08, "loss": 0.9762, "step": 49178 }, { "epoch": 0.93, "learning_rate": 6.794218740625969e-08, "loss": 0.9066, "step": 49179 }, { "epoch": 0.93, "learning_rate": 6.790681916505532e-08, "loss": 1.0455, "step": 49180 }, { "epoch": 0.93, "learning_rate": 6.787146000521244e-08, "loss": 1.0131, "step": 49181 }, { "epoch": 0.93, "learning_rate": 6.783610992686235e-08, "loss": 0.8818, "step": 49182 }, { "epoch": 0.93, "learning_rate": 6.780076893013827e-08, "loss": 0.6949, "step": 49183 }, { "epoch": 0.93, "learning_rate": 6.776543701517147e-08, "loss": 0.9478, "step": 49184 }, { "epoch": 0.93, "learning_rate": 6.773011418209352e-08, "loss": 0.6386, "step": 49185 }, { "epoch": 0.93, "learning_rate": 6.769480043103737e-08, "loss": 0.804, "step": 49186 }, { "epoch": 0.93, "learning_rate": 6.765949576213405e-08, "loss": 0.8649, "step": 49187 }, { "epoch": 0.93, "learning_rate": 6.762420017551536e-08, "loss": 0.8989, "step": 49188 }, { "epoch": 0.93, "learning_rate": 6.758891367131343e-08, "loss": 0.8252, "step": 49189 }, { "epoch": 0.93, "learning_rate": 6.75536362496601e-08, "loss": 0.7875, "step": 49190 }, { "epoch": 0.93, "learning_rate": 6.751836791068667e-08, "loss": 0.8664, "step": 49191 }, { "epoch": 0.93, "learning_rate": 6.748310865452523e-08, "loss": 0.8036, "step": 49192 }, { "epoch": 0.93, "learning_rate": 6.744785848130736e-08, "loss": 1.0628, "step": 49193 }, { "epoch": 0.93, "learning_rate": 6.741261739116406e-08, "loss": 1.0306, "step": 49194 }, { "epoch": 0.93, "learning_rate": 6.737738538422828e-08, "loss": 0.8542, "step": 49195 }, { "epoch": 0.93, "learning_rate": 6.734216246063019e-08, "loss": 0.674, "step": 49196 }, { "epoch": 0.93, "learning_rate": 6.730694862050218e-08, "loss": 0.9193, "step": 49197 }, { "epoch": 0.93, "learning_rate": 6.727174386397528e-08, "loss": 0.9038, "step": 49198 }, { "epoch": 0.93, "learning_rate": 6.723654819118102e-08, "loss": 1.076, "step": 49199 }, { "epoch": 0.93, "learning_rate": 6.7201361602251e-08, "loss": 0.7587, "step": 49200 }, { "epoch": 0.93, "learning_rate": 6.716618409731646e-08, "loss": 0.7271, "step": 49201 }, { "epoch": 0.93, "learning_rate": 6.713101567650898e-08, "loss": 0.7948, "step": 49202 }, { "epoch": 0.93, "learning_rate": 6.70958563399593e-08, "loss": 0.9774, "step": 49203 }, { "epoch": 0.93, "learning_rate": 6.706070608779924e-08, "loss": 0.7749, "step": 49204 }, { "epoch": 0.93, "learning_rate": 6.702556492016039e-08, "loss": 1.2442, "step": 49205 }, { "epoch": 0.93, "learning_rate": 6.699043283717261e-08, "loss": 1.002, "step": 49206 }, { "epoch": 0.93, "learning_rate": 6.695530983896886e-08, "loss": 1.1096, "step": 49207 }, { "epoch": 0.93, "learning_rate": 6.692019592567878e-08, "loss": 0.9845, "step": 49208 }, { "epoch": 0.93, "learning_rate": 6.688509109743446e-08, "loss": 0.8538, "step": 49209 }, { "epoch": 0.93, "learning_rate": 6.684999535436637e-08, "loss": 0.6913, "step": 49210 }, { "epoch": 0.93, "learning_rate": 6.681490869660579e-08, "loss": 0.9421, "step": 49211 }, { "epoch": 0.93, "learning_rate": 6.677983112428372e-08, "loss": 1.0934, "step": 49212 }, { "epoch": 0.93, "learning_rate": 6.674476263753116e-08, "loss": 0.96, "step": 49213 }, { "epoch": 0.93, "learning_rate": 6.670970323647941e-08, "loss": 0.9162, "step": 49214 }, { "epoch": 0.93, "learning_rate": 6.667465292125863e-08, "loss": 1.0094, "step": 49215 }, { "epoch": 0.93, "learning_rate": 6.66396116920004e-08, "loss": 0.8282, "step": 49216 }, { "epoch": 0.93, "learning_rate": 6.660457954883487e-08, "loss": 0.7928, "step": 49217 }, { "epoch": 0.93, "learning_rate": 6.656955649189362e-08, "loss": 0.9798, "step": 49218 }, { "epoch": 0.93, "learning_rate": 6.653454252130681e-08, "loss": 1.028, "step": 49219 }, { "epoch": 0.93, "learning_rate": 6.649953763720519e-08, "loss": 0.6763, "step": 49220 }, { "epoch": 0.93, "learning_rate": 6.646454183972e-08, "loss": 0.8189, "step": 49221 }, { "epoch": 0.93, "learning_rate": 6.642955512898147e-08, "loss": 0.8468, "step": 49222 }, { "epoch": 0.93, "learning_rate": 6.639457750512057e-08, "loss": 0.7509, "step": 49223 }, { "epoch": 0.93, "learning_rate": 6.635960896826749e-08, "loss": 1.0093, "step": 49224 }, { "epoch": 0.93, "learning_rate": 6.632464951855294e-08, "loss": 0.986, "step": 49225 }, { "epoch": 0.93, "learning_rate": 6.628969915610795e-08, "loss": 0.968, "step": 49226 }, { "epoch": 0.93, "learning_rate": 6.625475788106183e-08, "loss": 0.7212, "step": 49227 }, { "epoch": 0.93, "learning_rate": 6.621982569354673e-08, "loss": 0.8611, "step": 49228 }, { "epoch": 0.93, "learning_rate": 6.61849025936917e-08, "loss": 1.0344, "step": 49229 }, { "epoch": 0.93, "learning_rate": 6.614998858162775e-08, "loss": 0.8948, "step": 49230 }, { "epoch": 0.93, "learning_rate": 6.611508365748503e-08, "loss": 1.0767, "step": 49231 }, { "epoch": 0.93, "learning_rate": 6.608018782139375e-08, "loss": 1.0251, "step": 49232 }, { "epoch": 0.93, "learning_rate": 6.604530107348461e-08, "loss": 0.9714, "step": 49233 }, { "epoch": 0.93, "learning_rate": 6.60104234138878e-08, "loss": 0.9016, "step": 49234 }, { "epoch": 0.93, "learning_rate": 6.597555484273349e-08, "loss": 0.9464, "step": 49235 }, { "epoch": 0.93, "learning_rate": 6.594069536015158e-08, "loss": 0.968, "step": 49236 }, { "epoch": 0.93, "learning_rate": 6.590584496627278e-08, "loss": 1.0275, "step": 49237 }, { "epoch": 0.93, "learning_rate": 6.587100366122673e-08, "loss": 0.9384, "step": 49238 }, { "epoch": 0.93, "learning_rate": 6.583617144514386e-08, "loss": 1.0605, "step": 49239 }, { "epoch": 0.93, "learning_rate": 6.580134831815382e-08, "loss": 0.6943, "step": 49240 }, { "epoch": 0.93, "learning_rate": 6.576653428038704e-08, "loss": 1.0176, "step": 49241 }, { "epoch": 0.93, "learning_rate": 6.573172933197342e-08, "loss": 0.7794, "step": 49242 }, { "epoch": 0.93, "learning_rate": 6.569693347304285e-08, "loss": 1.0814, "step": 49243 }, { "epoch": 0.93, "learning_rate": 6.56621467037255e-08, "loss": 0.896, "step": 49244 }, { "epoch": 0.93, "learning_rate": 6.562736902415073e-08, "loss": 0.7435, "step": 49245 }, { "epoch": 0.93, "learning_rate": 6.559260043444898e-08, "loss": 0.9391, "step": 49246 }, { "epoch": 0.93, "learning_rate": 6.555784093474988e-08, "loss": 0.8372, "step": 49247 }, { "epoch": 0.93, "learning_rate": 6.552309052518275e-08, "loss": 0.8094, "step": 49248 }, { "epoch": 0.93, "learning_rate": 6.548834920587805e-08, "loss": 0.7158, "step": 49249 }, { "epoch": 0.93, "learning_rate": 6.54536169769654e-08, "loss": 1.166, "step": 49250 }, { "epoch": 0.93, "learning_rate": 6.541889383857386e-08, "loss": 0.9124, "step": 49251 }, { "epoch": 0.93, "learning_rate": 6.538417979083389e-08, "loss": 1.1078, "step": 49252 }, { "epoch": 0.93, "learning_rate": 6.534947483387455e-08, "loss": 0.8765, "step": 49253 }, { "epoch": 0.93, "learning_rate": 6.531477896782546e-08, "loss": 0.8375, "step": 49254 }, { "epoch": 0.93, "learning_rate": 6.52800921928165e-08, "loss": 0.6913, "step": 49255 }, { "epoch": 0.93, "learning_rate": 6.524541450897731e-08, "loss": 1.1091, "step": 49256 }, { "epoch": 0.93, "learning_rate": 6.521074591643667e-08, "loss": 0.9019, "step": 49257 }, { "epoch": 0.93, "learning_rate": 6.517608641532475e-08, "loss": 0.9733, "step": 49258 }, { "epoch": 0.93, "learning_rate": 6.51414360057706e-08, "loss": 0.7734, "step": 49259 }, { "epoch": 0.93, "learning_rate": 6.510679468790359e-08, "loss": 0.9979, "step": 49260 }, { "epoch": 0.93, "learning_rate": 6.507216246185305e-08, "loss": 0.8769, "step": 49261 }, { "epoch": 0.93, "learning_rate": 6.503753932774858e-08, "loss": 0.9731, "step": 49262 }, { "epoch": 0.93, "learning_rate": 6.500292528571927e-08, "loss": 0.9507, "step": 49263 }, { "epoch": 0.93, "learning_rate": 6.496832033589417e-08, "loss": 0.846, "step": 49264 }, { "epoch": 0.93, "learning_rate": 6.493372447840319e-08, "loss": 0.933, "step": 49265 }, { "epoch": 0.93, "learning_rate": 6.489913771337452e-08, "loss": 0.8566, "step": 49266 }, { "epoch": 0.93, "learning_rate": 6.486456004093783e-08, "loss": 0.9152, "step": 49267 }, { "epoch": 0.93, "learning_rate": 6.482999146122271e-08, "loss": 0.973, "step": 49268 }, { "epoch": 0.93, "learning_rate": 6.479543197435712e-08, "loss": 1.0845, "step": 49269 }, { "epoch": 0.93, "learning_rate": 6.476088158047123e-08, "loss": 0.9631, "step": 49270 }, { "epoch": 0.93, "learning_rate": 6.472634027969327e-08, "loss": 0.8304, "step": 49271 }, { "epoch": 0.93, "learning_rate": 6.469180807215258e-08, "loss": 0.7784, "step": 49272 }, { "epoch": 0.93, "learning_rate": 6.465728495797796e-08, "loss": 0.7592, "step": 49273 }, { "epoch": 0.93, "learning_rate": 6.462277093729819e-08, "loss": 0.8939, "step": 49274 }, { "epoch": 0.93, "learning_rate": 6.45882660102426e-08, "loss": 1.1469, "step": 49275 }, { "epoch": 0.93, "learning_rate": 6.45537701769397e-08, "loss": 0.9377, "step": 49276 }, { "epoch": 0.93, "learning_rate": 6.451928343751857e-08, "loss": 0.8995, "step": 49277 }, { "epoch": 0.93, "learning_rate": 6.448480579210714e-08, "loss": 0.7522, "step": 49278 }, { "epoch": 0.93, "learning_rate": 6.445033724083532e-08, "loss": 0.8394, "step": 49279 }, { "epoch": 0.93, "learning_rate": 6.441587778383107e-08, "loss": 1.0018, "step": 49280 }, { "epoch": 0.93, "learning_rate": 6.438142742122316e-08, "loss": 1.097, "step": 49281 }, { "epoch": 0.93, "learning_rate": 6.434698615314038e-08, "loss": 0.8921, "step": 49282 }, { "epoch": 0.93, "learning_rate": 6.431255397971126e-08, "loss": 0.8455, "step": 49283 }, { "epoch": 0.93, "learning_rate": 6.427813090106455e-08, "loss": 0.8119, "step": 49284 }, { "epoch": 0.93, "learning_rate": 6.424371691732851e-08, "loss": 0.8013, "step": 49285 }, { "epoch": 0.93, "learning_rate": 6.42093120286319e-08, "loss": 0.94, "step": 49286 }, { "epoch": 0.93, "learning_rate": 6.41749162351027e-08, "loss": 1.0478, "step": 49287 }, { "epoch": 0.93, "learning_rate": 6.414052953686995e-08, "loss": 1.0341, "step": 49288 }, { "epoch": 0.93, "learning_rate": 6.410615193406189e-08, "loss": 0.9118, "step": 49289 }, { "epoch": 0.93, "learning_rate": 6.40717834268062e-08, "loss": 0.986, "step": 49290 }, { "epoch": 0.93, "learning_rate": 6.40374240152325e-08, "loss": 0.984, "step": 49291 }, { "epoch": 0.93, "learning_rate": 6.40030736994679e-08, "loss": 0.8268, "step": 49292 }, { "epoch": 0.93, "learning_rate": 6.39687324796412e-08, "loss": 0.8029, "step": 49293 }, { "epoch": 0.93, "learning_rate": 6.39344003558806e-08, "loss": 0.9496, "step": 49294 }, { "epoch": 0.93, "learning_rate": 6.390007732831438e-08, "loss": 1.025, "step": 49295 }, { "epoch": 0.93, "learning_rate": 6.386576339707046e-08, "loss": 1.06, "step": 49296 }, { "epoch": 0.93, "learning_rate": 6.383145856227707e-08, "loss": 0.592, "step": 49297 }, { "epoch": 0.93, "learning_rate": 6.379716282406245e-08, "loss": 0.5728, "step": 49298 }, { "epoch": 0.93, "learning_rate": 6.376287618255427e-08, "loss": 0.8752, "step": 49299 }, { "epoch": 0.93, "learning_rate": 6.372859863788106e-08, "loss": 1.0499, "step": 49300 }, { "epoch": 0.93, "learning_rate": 6.369433019017046e-08, "loss": 0.9187, "step": 49301 }, { "epoch": 0.93, "learning_rate": 6.366007083955073e-08, "loss": 0.8397, "step": 49302 }, { "epoch": 0.93, "learning_rate": 6.362582058614925e-08, "loss": 0.8532, "step": 49303 }, { "epoch": 0.93, "learning_rate": 6.359157943009453e-08, "loss": 0.9236, "step": 49304 }, { "epoch": 0.93, "learning_rate": 6.355734737151398e-08, "loss": 0.8189, "step": 49305 }, { "epoch": 0.93, "learning_rate": 6.352312441053554e-08, "loss": 0.8783, "step": 49306 }, { "epoch": 0.93, "learning_rate": 6.348891054728745e-08, "loss": 0.9652, "step": 49307 }, { "epoch": 0.93, "learning_rate": 6.345470578189655e-08, "loss": 0.7659, "step": 49308 }, { "epoch": 0.93, "learning_rate": 6.342051011449136e-08, "loss": 0.8155, "step": 49309 }, { "epoch": 0.93, "learning_rate": 6.338632354519924e-08, "loss": 0.9059, "step": 49310 }, { "epoch": 0.93, "learning_rate": 6.335214607414763e-08, "loss": 0.8147, "step": 49311 }, { "epoch": 0.93, "learning_rate": 6.331797770146502e-08, "loss": 1.0665, "step": 49312 }, { "epoch": 0.93, "learning_rate": 6.328381842727799e-08, "loss": 1.062, "step": 49313 }, { "epoch": 0.93, "learning_rate": 6.324966825171446e-08, "loss": 0.785, "step": 49314 }, { "epoch": 0.93, "learning_rate": 6.321552717490187e-08, "loss": 0.9214, "step": 49315 }, { "epoch": 0.93, "learning_rate": 6.318139519696787e-08, "loss": 0.6585, "step": 49316 }, { "epoch": 0.93, "learning_rate": 6.314727231803985e-08, "loss": 0.8476, "step": 49317 }, { "epoch": 0.93, "learning_rate": 6.311315853824495e-08, "loss": 1.0356, "step": 49318 }, { "epoch": 0.93, "learning_rate": 6.30790538577114e-08, "loss": 0.9335, "step": 49319 }, { "epoch": 0.93, "learning_rate": 6.30449582765652e-08, "loss": 0.9344, "step": 49320 }, { "epoch": 0.93, "learning_rate": 6.301087179493514e-08, "loss": 0.7756, "step": 49321 }, { "epoch": 0.93, "learning_rate": 6.297679441294724e-08, "loss": 0.8338, "step": 49322 }, { "epoch": 0.93, "learning_rate": 6.294272613072943e-08, "loss": 0.951, "step": 49323 }, { "epoch": 0.93, "learning_rate": 6.290866694840886e-08, "loss": 0.8565, "step": 49324 }, { "epoch": 0.93, "learning_rate": 6.287461686611235e-08, "loss": 1.1682, "step": 49325 }, { "epoch": 0.93, "learning_rate": 6.284057588396757e-08, "loss": 0.9062, "step": 49326 }, { "epoch": 0.93, "learning_rate": 6.280654400210112e-08, "loss": 0.9599, "step": 49327 }, { "epoch": 0.93, "learning_rate": 6.277252122064065e-08, "loss": 1.0212, "step": 49328 }, { "epoch": 0.93, "learning_rate": 6.273850753971244e-08, "loss": 0.8621, "step": 49329 }, { "epoch": 0.93, "learning_rate": 6.27045029594442e-08, "loss": 0.8312, "step": 49330 }, { "epoch": 0.93, "learning_rate": 6.267050747996273e-08, "loss": 0.9751, "step": 49331 }, { "epoch": 0.93, "learning_rate": 6.263652110139435e-08, "loss": 0.9432, "step": 49332 }, { "epoch": 0.93, "learning_rate": 6.260254382386698e-08, "loss": 0.9458, "step": 49333 }, { "epoch": 0.93, "learning_rate": 6.256857564750668e-08, "loss": 0.9, "step": 49334 }, { "epoch": 0.93, "learning_rate": 6.253461657244081e-08, "loss": 1.1384, "step": 49335 }, { "epoch": 0.93, "learning_rate": 6.250066659879567e-08, "loss": 0.8061, "step": 49336 }, { "epoch": 0.93, "learning_rate": 6.246672572669837e-08, "loss": 0.957, "step": 49337 }, { "epoch": 0.93, "learning_rate": 6.243279395627577e-08, "loss": 0.9621, "step": 49338 }, { "epoch": 0.93, "learning_rate": 6.239887128765415e-08, "loss": 0.8078, "step": 49339 }, { "epoch": 0.93, "learning_rate": 6.23649577209609e-08, "loss": 0.7693, "step": 49340 }, { "epoch": 0.93, "learning_rate": 6.23310532563215e-08, "loss": 0.7645, "step": 49341 }, { "epoch": 0.93, "learning_rate": 6.229715789386359e-08, "loss": 0.7515, "step": 49342 }, { "epoch": 0.93, "learning_rate": 6.22632716337132e-08, "loss": 0.9297, "step": 49343 }, { "epoch": 0.93, "learning_rate": 6.222939447599691e-08, "loss": 1.0653, "step": 49344 }, { "epoch": 0.93, "learning_rate": 6.219552642084153e-08, "loss": 0.8787, "step": 49345 }, { "epoch": 0.93, "learning_rate": 6.216166746837337e-08, "loss": 0.8339, "step": 49346 }, { "epoch": 0.93, "learning_rate": 6.212781761871872e-08, "loss": 0.8241, "step": 49347 }, { "epoch": 0.93, "learning_rate": 6.209397687200385e-08, "loss": 0.8594, "step": 49348 }, { "epoch": 0.93, "learning_rate": 6.206014522835563e-08, "loss": 0.8031, "step": 49349 }, { "epoch": 0.93, "learning_rate": 6.202632268789976e-08, "loss": 1.0476, "step": 49350 }, { "epoch": 0.93, "learning_rate": 6.199250925076311e-08, "loss": 0.8813, "step": 49351 }, { "epoch": 0.93, "learning_rate": 6.195870491707167e-08, "loss": 1.0494, "step": 49352 }, { "epoch": 0.93, "learning_rate": 6.192490968695147e-08, "loss": 0.7571, "step": 49353 }, { "epoch": 0.93, "learning_rate": 6.189112356052934e-08, "loss": 0.7656, "step": 49354 }, { "epoch": 0.93, "learning_rate": 6.185734653793046e-08, "loss": 1.1076, "step": 49355 }, { "epoch": 0.93, "learning_rate": 6.182357861928167e-08, "loss": 0.9995, "step": 49356 }, { "epoch": 0.93, "learning_rate": 6.178981980470899e-08, "loss": 1.132, "step": 49357 }, { "epoch": 0.93, "learning_rate": 6.175607009433843e-08, "loss": 0.8081, "step": 49358 }, { "epoch": 0.93, "learning_rate": 6.17223294882957e-08, "loss": 0.7353, "step": 49359 }, { "epoch": 0.93, "learning_rate": 6.168859798670712e-08, "loss": 0.7437, "step": 49360 }, { "epoch": 0.93, "learning_rate": 6.165487558969895e-08, "loss": 0.9173, "step": 49361 }, { "epoch": 0.93, "learning_rate": 6.162116229739612e-08, "loss": 1.0761, "step": 49362 }, { "epoch": 0.93, "learning_rate": 6.158745810992545e-08, "loss": 0.982, "step": 49363 }, { "epoch": 0.93, "learning_rate": 6.155376302741239e-08, "loss": 0.8524, "step": 49364 }, { "epoch": 0.93, "learning_rate": 6.152007704998242e-08, "loss": 0.8202, "step": 49365 }, { "epoch": 0.93, "learning_rate": 6.148640017776236e-08, "loss": 0.7996, "step": 49366 }, { "epoch": 0.93, "learning_rate": 6.145273241087684e-08, "loss": 0.9366, "step": 49367 }, { "epoch": 0.93, "learning_rate": 6.141907374945244e-08, "loss": 1.1094, "step": 49368 }, { "epoch": 0.93, "learning_rate": 6.138542419361404e-08, "loss": 1.1483, "step": 49369 }, { "epoch": 0.93, "learning_rate": 6.135178374348793e-08, "loss": 1.1093, "step": 49370 }, { "epoch": 0.93, "learning_rate": 6.13181523991993e-08, "loss": 0.8218, "step": 49371 }, { "epoch": 0.93, "learning_rate": 6.128453016087416e-08, "loss": 0.9484, "step": 49372 }, { "epoch": 0.93, "learning_rate": 6.125091702863795e-08, "loss": 0.8923, "step": 49373 }, { "epoch": 0.93, "learning_rate": 6.121731300261558e-08, "loss": 0.881, "step": 49374 }, { "epoch": 0.93, "learning_rate": 6.118371808293332e-08, "loss": 0.8669, "step": 49375 }, { "epoch": 0.93, "learning_rate": 6.115013226971639e-08, "loss": 0.967, "step": 49376 }, { "epoch": 0.93, "learning_rate": 6.111655556308965e-08, "loss": 1.0048, "step": 49377 }, { "epoch": 0.93, "learning_rate": 6.108298796317913e-08, "loss": 0.8791, "step": 49378 }, { "epoch": 0.93, "learning_rate": 6.104942947011e-08, "loss": 1.0674, "step": 49379 }, { "epoch": 0.93, "learning_rate": 6.101588008400744e-08, "loss": 0.6902, "step": 49380 }, { "epoch": 0.93, "learning_rate": 6.098233980499691e-08, "loss": 1.0657, "step": 49381 }, { "epoch": 0.93, "learning_rate": 6.094880863320385e-08, "loss": 0.9416, "step": 49382 }, { "epoch": 0.93, "learning_rate": 6.091528656875261e-08, "loss": 0.9426, "step": 49383 }, { "epoch": 0.93, "learning_rate": 6.088177361176923e-08, "loss": 0.7058, "step": 49384 }, { "epoch": 0.93, "learning_rate": 6.084826976237829e-08, "loss": 0.9624, "step": 49385 }, { "epoch": 0.93, "learning_rate": 6.081477502070527e-08, "loss": 0.6918, "step": 49386 }, { "epoch": 0.93, "learning_rate": 6.078128938687506e-08, "loss": 1.2325, "step": 49387 }, { "epoch": 0.93, "learning_rate": 6.074781286101255e-08, "loss": 1.0519, "step": 49388 }, { "epoch": 0.93, "learning_rate": 6.071434544324323e-08, "loss": 0.8051, "step": 49389 }, { "epoch": 0.93, "learning_rate": 6.068088713369142e-08, "loss": 0.8176, "step": 49390 }, { "epoch": 0.93, "learning_rate": 6.064743793248257e-08, "loss": 0.6359, "step": 49391 }, { "epoch": 0.93, "learning_rate": 6.061399783974159e-08, "loss": 0.7949, "step": 49392 }, { "epoch": 0.93, "learning_rate": 6.058056685559255e-08, "loss": 1.078, "step": 49393 }, { "epoch": 0.93, "learning_rate": 6.054714498016174e-08, "loss": 0.8202, "step": 49394 }, { "epoch": 0.93, "learning_rate": 6.051373221357237e-08, "loss": 1.1481, "step": 49395 }, { "epoch": 0.93, "learning_rate": 6.04803285559502e-08, "loss": 0.7637, "step": 49396 }, { "epoch": 0.93, "learning_rate": 6.044693400741986e-08, "loss": 1.0168, "step": 49397 }, { "epoch": 0.93, "learning_rate": 6.041354856810566e-08, "loss": 0.8616, "step": 49398 }, { "epoch": 0.93, "learning_rate": 6.038017223813253e-08, "loss": 1.0029, "step": 49399 }, { "epoch": 0.93, "learning_rate": 6.03468050176248e-08, "loss": 0.7533, "step": 49400 }, { "epoch": 0.93, "learning_rate": 6.031344690670764e-08, "loss": 0.8385, "step": 49401 }, { "epoch": 0.93, "learning_rate": 6.028009790550488e-08, "loss": 0.8334, "step": 49402 }, { "epoch": 0.93, "learning_rate": 6.024675801414192e-08, "loss": 0.9199, "step": 49403 }, { "epoch": 0.93, "learning_rate": 6.021342723274259e-08, "loss": 0.8643, "step": 49404 }, { "epoch": 0.93, "learning_rate": 6.01801055614315e-08, "loss": 0.8577, "step": 49405 }, { "epoch": 0.93, "learning_rate": 6.0146793000333e-08, "loss": 1.2428, "step": 49406 }, { "epoch": 0.93, "learning_rate": 6.011348954957142e-08, "loss": 0.969, "step": 49407 }, { "epoch": 0.93, "learning_rate": 6.008019520927166e-08, "loss": 0.849, "step": 49408 }, { "epoch": 0.93, "learning_rate": 6.004690997955726e-08, "loss": 0.7706, "step": 49409 }, { "epoch": 0.93, "learning_rate": 6.001363386055337e-08, "loss": 0.8321, "step": 49410 }, { "epoch": 0.93, "learning_rate": 5.998036685238323e-08, "loss": 0.7989, "step": 49411 }, { "epoch": 0.93, "learning_rate": 5.994710895517175e-08, "loss": 0.9932, "step": 49412 }, { "epoch": 0.93, "learning_rate": 5.991386016904326e-08, "loss": 1.1329, "step": 49413 }, { "epoch": 0.93, "learning_rate": 5.988062049412103e-08, "loss": 0.7829, "step": 49414 }, { "epoch": 0.93, "learning_rate": 5.984738993053019e-08, "loss": 0.9173, "step": 49415 }, { "epoch": 0.93, "learning_rate": 5.981416847839428e-08, "loss": 0.8522, "step": 49416 }, { "epoch": 0.93, "learning_rate": 5.978095613783735e-08, "loss": 0.7899, "step": 49417 }, { "epoch": 0.93, "learning_rate": 5.97477529089835e-08, "loss": 0.9421, "step": 49418 }, { "epoch": 0.93, "learning_rate": 5.971455879195704e-08, "loss": 1.0739, "step": 49419 }, { "epoch": 0.93, "learning_rate": 5.968137378688121e-08, "loss": 0.9713, "step": 49420 }, { "epoch": 0.93, "learning_rate": 5.964819789388037e-08, "loss": 0.8747, "step": 49421 }, { "epoch": 0.93, "learning_rate": 5.96150311130786e-08, "loss": 0.9225, "step": 49422 }, { "epoch": 0.93, "learning_rate": 5.958187344459909e-08, "loss": 0.777, "step": 49423 }, { "epoch": 0.93, "learning_rate": 5.95487248885665e-08, "loss": 0.9529, "step": 49424 }, { "epoch": 0.93, "learning_rate": 5.951558544510405e-08, "loss": 1.2364, "step": 49425 }, { "epoch": 0.93, "learning_rate": 5.948245511433526e-08, "loss": 0.8105, "step": 49426 }, { "epoch": 0.93, "learning_rate": 5.9449333896384186e-08, "loss": 0.8331, "step": 49427 }, { "epoch": 0.93, "learning_rate": 5.9416221791374626e-08, "loss": 0.903, "step": 49428 }, { "epoch": 0.93, "learning_rate": 5.9383118799430094e-08, "loss": 0.7668, "step": 49429 }, { "epoch": 0.93, "learning_rate": 5.93500249206741e-08, "loss": 0.7188, "step": 49430 }, { "epoch": 0.93, "learning_rate": 5.931694015523043e-08, "loss": 1.0164, "step": 49431 }, { "epoch": 0.93, "learning_rate": 5.928386450322204e-08, "loss": 1.0762, "step": 49432 }, { "epoch": 0.93, "learning_rate": 5.925079796477329e-08, "loss": 0.7611, "step": 49433 }, { "epoch": 0.93, "learning_rate": 5.92177405400074e-08, "loss": 0.7675, "step": 49434 }, { "epoch": 0.93, "learning_rate": 5.9184692229047044e-08, "loss": 0.9713, "step": 49435 }, { "epoch": 0.93, "learning_rate": 5.9151653032016586e-08, "loss": 0.8917, "step": 49436 }, { "epoch": 0.93, "learning_rate": 5.9118622949038975e-08, "loss": 1.0709, "step": 49437 }, { "epoch": 0.93, "learning_rate": 5.908560198023744e-08, "loss": 0.9656, "step": 49438 }, { "epoch": 0.93, "learning_rate": 5.90525901257355e-08, "loss": 0.8627, "step": 49439 }, { "epoch": 0.93, "learning_rate": 5.901958738565638e-08, "loss": 0.8508, "step": 49440 }, { "epoch": 0.93, "learning_rate": 5.8986593760123334e-08, "loss": 0.9324, "step": 49441 }, { "epoch": 0.93, "learning_rate": 5.89536092492593e-08, "loss": 0.8531, "step": 49442 }, { "epoch": 0.93, "learning_rate": 5.892063385318808e-08, "loss": 0.9656, "step": 49443 }, { "epoch": 0.93, "learning_rate": 5.888766757203179e-08, "loss": 1.0258, "step": 49444 }, { "epoch": 0.93, "learning_rate": 5.8854710405914785e-08, "loss": 1.0274, "step": 49445 }, { "epoch": 0.93, "learning_rate": 5.88217623549589e-08, "loss": 0.8167, "step": 49446 }, { "epoch": 0.93, "learning_rate": 5.878882341928793e-08, "loss": 0.9811, "step": 49447 }, { "epoch": 0.93, "learning_rate": 5.875589359902456e-08, "loss": 0.9024, "step": 49448 }, { "epoch": 0.93, "learning_rate": 5.872297289429174e-08, "loss": 0.9689, "step": 49449 }, { "epoch": 0.93, "learning_rate": 5.869006130521243e-08, "loss": 0.9102, "step": 49450 }, { "epoch": 0.93, "learning_rate": 5.8657158831909867e-08, "loss": 1.0214, "step": 49451 }, { "epoch": 0.93, "learning_rate": 5.862426547450672e-08, "loss": 0.7346, "step": 49452 }, { "epoch": 0.93, "learning_rate": 5.859138123312513e-08, "loss": 0.7352, "step": 49453 }, { "epoch": 0.93, "learning_rate": 5.855850610788888e-08, "loss": 0.7983, "step": 49454 }, { "epoch": 0.93, "learning_rate": 5.852564009892037e-08, "loss": 0.7889, "step": 49455 }, { "epoch": 0.93, "learning_rate": 5.8492783206342e-08, "loss": 1.0741, "step": 49456 }, { "epoch": 0.93, "learning_rate": 5.8459935430277005e-08, "loss": 0.7843, "step": 49457 }, { "epoch": 0.93, "learning_rate": 5.842709677084751e-08, "loss": 0.7977, "step": 49458 }, { "epoch": 0.93, "learning_rate": 5.8394267228176484e-08, "loss": 0.8893, "step": 49459 }, { "epoch": 0.93, "learning_rate": 5.836144680238659e-08, "loss": 0.7557, "step": 49460 }, { "epoch": 0.93, "learning_rate": 5.832863549359996e-08, "loss": 0.7732, "step": 49461 }, { "epoch": 0.93, "learning_rate": 5.829583330193928e-08, "loss": 1.0831, "step": 49462 }, { "epoch": 0.93, "learning_rate": 5.8263040227527214e-08, "loss": 0.7108, "step": 49463 }, { "epoch": 0.93, "learning_rate": 5.8230256270486176e-08, "loss": 0.8901, "step": 49464 }, { "epoch": 0.93, "learning_rate": 5.819748143093829e-08, "loss": 0.7949, "step": 49465 }, { "epoch": 0.93, "learning_rate": 5.8164715709006225e-08, "loss": 0.6556, "step": 49466 }, { "epoch": 0.93, "learning_rate": 5.81319591048124e-08, "loss": 0.7911, "step": 49467 }, { "epoch": 0.93, "learning_rate": 5.8099211618478643e-08, "loss": 1.1238, "step": 49468 }, { "epoch": 0.93, "learning_rate": 5.806647325012793e-08, "loss": 1.0479, "step": 49469 }, { "epoch": 0.93, "learning_rate": 5.803374399988182e-08, "loss": 0.8847, "step": 49470 }, { "epoch": 0.93, "learning_rate": 5.800102386786299e-08, "loss": 0.983, "step": 49471 }, { "epoch": 0.93, "learning_rate": 5.79683128541933e-08, "loss": 1.0135, "step": 49472 }, { "epoch": 0.93, "learning_rate": 5.7935610958995415e-08, "loss": 0.8393, "step": 49473 }, { "epoch": 0.93, "learning_rate": 5.790291818239063e-08, "loss": 0.8554, "step": 49474 }, { "epoch": 0.93, "learning_rate": 5.787023452450163e-08, "loss": 0.9326, "step": 49475 }, { "epoch": 0.93, "learning_rate": 5.7837559985450816e-08, "loss": 0.8741, "step": 49476 }, { "epoch": 0.93, "learning_rate": 5.780489456535893e-08, "loss": 0.8403, "step": 49477 }, { "epoch": 0.93, "learning_rate": 5.777223826434919e-08, "loss": 0.9488, "step": 49478 }, { "epoch": 0.93, "learning_rate": 5.77395910825429e-08, "loss": 0.8752, "step": 49479 }, { "epoch": 0.93, "learning_rate": 5.7706953020061906e-08, "loss": 0.9216, "step": 49480 }, { "epoch": 0.93, "learning_rate": 5.767432407702833e-08, "loss": 0.9516, "step": 49481 }, { "epoch": 0.93, "learning_rate": 5.7641704253564024e-08, "loss": 1.0175, "step": 49482 }, { "epoch": 0.93, "learning_rate": 5.7609093549790554e-08, "loss": 0.8839, "step": 49483 }, { "epoch": 0.93, "learning_rate": 5.757649196583004e-08, "loss": 0.7084, "step": 49484 }, { "epoch": 0.93, "learning_rate": 5.7543899501804334e-08, "loss": 0.8907, "step": 49485 }, { "epoch": 0.93, "learning_rate": 5.751131615783417e-08, "loss": 0.7336, "step": 49486 }, { "epoch": 0.93, "learning_rate": 5.747874193404224e-08, "loss": 1.1323, "step": 49487 }, { "epoch": 0.93, "learning_rate": 5.744617683054954e-08, "loss": 1.0453, "step": 49488 }, { "epoch": 0.93, "learning_rate": 5.74136208474782e-08, "loss": 0.7134, "step": 49489 }, { "epoch": 0.93, "learning_rate": 5.7381073984949243e-08, "loss": 1.0165, "step": 49490 }, { "epoch": 0.93, "learning_rate": 5.734853624308478e-08, "loss": 0.846, "step": 49491 }, { "epoch": 0.93, "learning_rate": 5.731600762200584e-08, "loss": 0.7678, "step": 49492 }, { "epoch": 0.93, "learning_rate": 5.7283488121833984e-08, "loss": 1.0709, "step": 49493 }, { "epoch": 0.93, "learning_rate": 5.725097774269078e-08, "loss": 0.999, "step": 49494 }, { "epoch": 0.93, "learning_rate": 5.721847648469725e-08, "loss": 0.8579, "step": 49495 }, { "epoch": 0.93, "learning_rate": 5.718598434797523e-08, "loss": 0.986, "step": 49496 }, { "epoch": 0.93, "learning_rate": 5.7153501332646025e-08, "loss": 0.7518, "step": 49497 }, { "epoch": 0.93, "learning_rate": 5.712102743883036e-08, "loss": 0.9033, "step": 49498 }, { "epoch": 0.93, "learning_rate": 5.708856266665036e-08, "loss": 0.8119, "step": 49499 }, { "epoch": 0.93, "learning_rate": 5.7056107016226494e-08, "loss": 1.0449, "step": 49500 }, { "epoch": 0.93, "learning_rate": 5.7023660487680324e-08, "loss": 1.0157, "step": 49501 }, { "epoch": 0.93, "learning_rate": 5.6991223081132587e-08, "loss": 0.8901, "step": 49502 }, { "epoch": 0.93, "learning_rate": 5.695879479670513e-08, "loss": 0.8182, "step": 49503 }, { "epoch": 0.93, "learning_rate": 5.6926375634518416e-08, "loss": 0.8644, "step": 49504 }, { "epoch": 0.93, "learning_rate": 5.689396559469346e-08, "loss": 0.9164, "step": 49505 }, { "epoch": 0.93, "learning_rate": 5.68615646773521e-08, "loss": 0.9965, "step": 49506 }, { "epoch": 0.93, "learning_rate": 5.682917288261425e-08, "loss": 0.8277, "step": 49507 }, { "epoch": 0.93, "learning_rate": 5.679679021060175e-08, "loss": 0.8725, "step": 49508 }, { "epoch": 0.93, "learning_rate": 5.676441666143506e-08, "loss": 0.8309, "step": 49509 }, { "epoch": 0.93, "learning_rate": 5.6732052235234924e-08, "loss": 0.8143, "step": 49510 }, { "epoch": 0.93, "learning_rate": 5.669969693212235e-08, "loss": 0.9576, "step": 49511 }, { "epoch": 0.93, "learning_rate": 5.6667350752218355e-08, "loss": 0.9033, "step": 49512 }, { "epoch": 0.93, "learning_rate": 5.6635013695643395e-08, "loss": 0.9897, "step": 49513 }, { "epoch": 0.93, "learning_rate": 5.6602685762518484e-08, "loss": 0.9145, "step": 49514 }, { "epoch": 0.93, "learning_rate": 5.657036695296464e-08, "loss": 1.124, "step": 49515 }, { "epoch": 0.93, "learning_rate": 5.6538057267101485e-08, "loss": 0.9305, "step": 49516 }, { "epoch": 0.93, "learning_rate": 5.6505756705050596e-08, "loss": 0.6701, "step": 49517 }, { "epoch": 0.93, "learning_rate": 5.6473465266932426e-08, "loss": 1.2026, "step": 49518 }, { "epoch": 0.93, "learning_rate": 5.644118295286688e-08, "loss": 1.2694, "step": 49519 }, { "epoch": 0.93, "learning_rate": 5.6408909762975806e-08, "loss": 0.9354, "step": 49520 }, { "epoch": 0.93, "learning_rate": 5.637664569737827e-08, "loss": 0.8525, "step": 49521 }, { "epoch": 0.93, "learning_rate": 5.6344390756195854e-08, "loss": 0.8738, "step": 49522 }, { "epoch": 0.93, "learning_rate": 5.6312144939548177e-08, "loss": 0.8107, "step": 49523 }, { "epoch": 0.93, "learning_rate": 5.627990824755625e-08, "loss": 0.8103, "step": 49524 }, { "epoch": 0.93, "learning_rate": 5.624768068034026e-08, "loss": 1.0037, "step": 49525 }, { "epoch": 0.93, "learning_rate": 5.621546223802038e-08, "loss": 0.8905, "step": 49526 }, { "epoch": 0.93, "learning_rate": 5.618325292071736e-08, "loss": 0.9694, "step": 49527 }, { "epoch": 0.93, "learning_rate": 5.6151052728550535e-08, "loss": 0.8722, "step": 49528 }, { "epoch": 0.93, "learning_rate": 5.611886166164149e-08, "loss": 0.7637, "step": 49529 }, { "epoch": 0.93, "learning_rate": 5.608667972010928e-08, "loss": 0.8221, "step": 49530 }, { "epoch": 0.93, "learning_rate": 5.605450690407438e-08, "loss": 1.1581, "step": 49531 }, { "epoch": 0.93, "learning_rate": 5.6022343213657236e-08, "loss": 1.0725, "step": 49532 }, { "epoch": 0.93, "learning_rate": 5.599018864897748e-08, "loss": 0.8802, "step": 49533 }, { "epoch": 0.93, "learning_rate": 5.595804321015558e-08, "loss": 0.8392, "step": 49534 }, { "epoch": 0.93, "learning_rate": 5.5925906897311424e-08, "loss": 0.6824, "step": 49535 }, { "epoch": 0.93, "learning_rate": 5.58937797105652e-08, "loss": 0.8576, "step": 49536 }, { "epoch": 0.93, "learning_rate": 5.586166165003626e-08, "loss": 0.957, "step": 49537 }, { "epoch": 0.93, "learning_rate": 5.582955271584506e-08, "loss": 0.9673, "step": 49538 }, { "epoch": 0.93, "learning_rate": 5.5797452908111506e-08, "loss": 0.841, "step": 49539 }, { "epoch": 0.93, "learning_rate": 5.576536222695495e-08, "loss": 0.8517, "step": 49540 }, { "epoch": 0.93, "learning_rate": 5.5733280672496114e-08, "loss": 0.8154, "step": 49541 }, { "epoch": 0.93, "learning_rate": 5.570120824485409e-08, "loss": 0.7449, "step": 49542 }, { "epoch": 0.93, "learning_rate": 5.566914494414877e-08, "loss": 0.6135, "step": 49543 }, { "epoch": 0.93, "learning_rate": 5.563709077049978e-08, "loss": 1.1291, "step": 49544 }, { "epoch": 0.93, "learning_rate": 5.5605045724027026e-08, "loss": 0.9211, "step": 49545 }, { "epoch": 0.93, "learning_rate": 5.557300980485014e-08, "loss": 0.7607, "step": 49546 }, { "epoch": 0.93, "learning_rate": 5.554098301308874e-08, "loss": 0.9321, "step": 49547 }, { "epoch": 0.93, "learning_rate": 5.550896534886247e-08, "loss": 0.8283, "step": 49548 }, { "epoch": 0.93, "learning_rate": 5.547695681229037e-08, "loss": 0.9583, "step": 49549 }, { "epoch": 0.93, "learning_rate": 5.544495740349265e-08, "loss": 1.1755, "step": 49550 }, { "epoch": 0.93, "learning_rate": 5.5412967122588644e-08, "loss": 0.9924, "step": 49551 }, { "epoch": 0.93, "learning_rate": 5.538098596969743e-08, "loss": 0.7224, "step": 49552 }, { "epoch": 0.93, "learning_rate": 5.5349013944938636e-08, "loss": 0.7927, "step": 49553 }, { "epoch": 0.93, "learning_rate": 5.53170510484316e-08, "loss": 0.8871, "step": 49554 }, { "epoch": 0.93, "learning_rate": 5.5285097280295964e-08, "loss": 0.7198, "step": 49555 }, { "epoch": 0.93, "learning_rate": 5.525315264065079e-08, "loss": 1.1555, "step": 49556 }, { "epoch": 0.93, "learning_rate": 5.5221217129615425e-08, "loss": 1.1555, "step": 49557 }, { "epoch": 0.94, "learning_rate": 5.5189290747308667e-08, "loss": 0.7387, "step": 49558 }, { "epoch": 0.94, "learning_rate": 5.515737349385042e-08, "loss": 0.8624, "step": 49559 }, { "epoch": 0.94, "learning_rate": 5.512546536935975e-08, "loss": 0.8922, "step": 49560 }, { "epoch": 0.94, "learning_rate": 5.509356637395546e-08, "loss": 0.9304, "step": 49561 }, { "epoch": 0.94, "learning_rate": 5.50616765077569e-08, "loss": 1.1755, "step": 49562 }, { "epoch": 0.94, "learning_rate": 5.502979577088313e-08, "loss": 0.9855, "step": 49563 }, { "epoch": 0.94, "learning_rate": 5.4997924163452956e-08, "loss": 0.5549, "step": 49564 }, { "epoch": 0.94, "learning_rate": 5.4966061685585715e-08, "loss": 0.9435, "step": 49565 }, { "epoch": 0.94, "learning_rate": 5.493420833740021e-08, "loss": 0.7721, "step": 49566 }, { "epoch": 0.94, "learning_rate": 5.490236411901523e-08, "loss": 0.7839, "step": 49567 }, { "epoch": 0.94, "learning_rate": 5.4870529030549846e-08, "loss": 0.9822, "step": 49568 }, { "epoch": 0.94, "learning_rate": 5.483870307212341e-08, "loss": 0.8806, "step": 49569 }, { "epoch": 0.94, "learning_rate": 5.4806886243853605e-08, "loss": 0.879, "step": 49570 }, { "epoch": 0.94, "learning_rate": 5.477507854586061e-08, "loss": 0.98, "step": 49571 }, { "epoch": 0.94, "learning_rate": 5.474327997826212e-08, "loss": 0.7677, "step": 49572 }, { "epoch": 0.94, "learning_rate": 5.4711490541177195e-08, "loss": 0.7645, "step": 49573 }, { "epoch": 0.94, "learning_rate": 5.4679710234724626e-08, "loss": 0.9429, "step": 49574 }, { "epoch": 0.94, "learning_rate": 5.464793905902321e-08, "loss": 1.0109, "step": 49575 }, { "epoch": 0.94, "learning_rate": 5.4616177014191194e-08, "loss": 0.8097, "step": 49576 }, { "epoch": 0.94, "learning_rate": 5.4584424100347646e-08, "loss": 0.6854, "step": 49577 }, { "epoch": 0.94, "learning_rate": 5.4552680317610796e-08, "loss": 1.0391, "step": 49578 }, { "epoch": 0.94, "learning_rate": 5.452094566609889e-08, "loss": 0.7794, "step": 49579 }, { "epoch": 0.94, "learning_rate": 5.448922014593128e-08, "loss": 0.7968, "step": 49580 }, { "epoch": 0.94, "learning_rate": 5.4457503757225916e-08, "loss": 1.1572, "step": 49581 }, { "epoch": 0.94, "learning_rate": 5.442579650010077e-08, "loss": 0.8759, "step": 49582 }, { "epoch": 0.94, "learning_rate": 5.4394098374675186e-08, "loss": 0.8354, "step": 49583 }, { "epoch": 0.94, "learning_rate": 5.436240938106713e-08, "loss": 0.8422, "step": 49584 }, { "epoch": 0.94, "learning_rate": 5.4330729519394556e-08, "loss": 0.6539, "step": 49585 }, { "epoch": 0.94, "learning_rate": 5.429905878977598e-08, "loss": 0.9041, "step": 49586 }, { "epoch": 0.94, "learning_rate": 5.426739719232993e-08, "loss": 0.8942, "step": 49587 }, { "epoch": 0.94, "learning_rate": 5.423574472717436e-08, "loss": 0.9979, "step": 49588 }, { "epoch": 0.94, "learning_rate": 5.42041013944275e-08, "loss": 0.9847, "step": 49589 }, { "epoch": 0.94, "learning_rate": 5.4172467194207877e-08, "loss": 0.9318, "step": 49590 }, { "epoch": 0.94, "learning_rate": 5.414084212663262e-08, "loss": 0.6312, "step": 49591 }, { "epoch": 0.94, "learning_rate": 5.410922619182107e-08, "loss": 0.8172, "step": 49592 }, { "epoch": 0.94, "learning_rate": 5.4077619389890646e-08, "loss": 0.8956, "step": 49593 }, { "epoch": 0.94, "learning_rate": 5.404602172095902e-08, "loss": 1.0103, "step": 49594 }, { "epoch": 0.94, "learning_rate": 5.401443318514471e-08, "loss": 0.807, "step": 49595 }, { "epoch": 0.94, "learning_rate": 5.3982853782565406e-08, "loss": 0.9219, "step": 49596 }, { "epoch": 0.94, "learning_rate": 5.3951283513339333e-08, "loss": 0.958, "step": 49597 }, { "epoch": 0.94, "learning_rate": 5.391972237758419e-08, "loss": 0.7598, "step": 49598 }, { "epoch": 0.94, "learning_rate": 5.388817037541793e-08, "loss": 0.9926, "step": 49599 }, { "epoch": 0.94, "learning_rate": 5.385662750695769e-08, "loss": 1.3508, "step": 49600 }, { "epoch": 0.94, "learning_rate": 5.382509377232198e-08, "loss": 1.0701, "step": 49601 }, { "epoch": 0.94, "learning_rate": 5.379356917162876e-08, "loss": 0.9799, "step": 49602 }, { "epoch": 0.94, "learning_rate": 5.3762053704994875e-08, "loss": 0.8759, "step": 49603 }, { "epoch": 0.94, "learning_rate": 5.373054737253885e-08, "loss": 0.8116, "step": 49604 }, { "epoch": 0.94, "learning_rate": 5.369905017437782e-08, "loss": 1.0319, "step": 49605 }, { "epoch": 0.94, "learning_rate": 5.3667562110629736e-08, "loss": 0.9985, "step": 49606 }, { "epoch": 0.94, "learning_rate": 5.363608318141173e-08, "loss": 1.0058, "step": 49607 }, { "epoch": 0.94, "learning_rate": 5.360461338684148e-08, "loss": 0.747, "step": 49608 }, { "epoch": 0.94, "learning_rate": 5.357315272703667e-08, "loss": 1.0623, "step": 49609 }, { "epoch": 0.94, "learning_rate": 5.354170120211472e-08, "loss": 0.8566, "step": 49610 }, { "epoch": 0.94, "learning_rate": 5.3510258812193295e-08, "loss": 0.8611, "step": 49611 }, { "epoch": 0.94, "learning_rate": 5.3478825557389256e-08, "loss": 0.9808, "step": 49612 }, { "epoch": 0.94, "learning_rate": 5.3447401437820565e-08, "loss": 1.013, "step": 49613 }, { "epoch": 0.94, "learning_rate": 5.341598645360407e-08, "loss": 0.9245, "step": 49614 }, { "epoch": 0.94, "learning_rate": 5.3384580604857185e-08, "loss": 0.899, "step": 49615 }, { "epoch": 0.94, "learning_rate": 5.33531838916973e-08, "loss": 0.8895, "step": 49616 }, { "epoch": 0.94, "learning_rate": 5.332179631424156e-08, "loss": 0.6823, "step": 49617 }, { "epoch": 0.94, "learning_rate": 5.329041787260764e-08, "loss": 0.7555, "step": 49618 }, { "epoch": 0.94, "learning_rate": 5.325904856691155e-08, "loss": 1.0743, "step": 49619 }, { "epoch": 0.94, "learning_rate": 5.3227688397271825e-08, "loss": 0.9423, "step": 49620 }, { "epoch": 0.94, "learning_rate": 5.3196337363804476e-08, "loss": 0.7837, "step": 49621 }, { "epoch": 0.94, "learning_rate": 5.31649954666269e-08, "loss": 0.784, "step": 49622 }, { "epoch": 0.94, "learning_rate": 5.313366270585679e-08, "loss": 0.7154, "step": 49623 }, { "epoch": 0.94, "learning_rate": 5.310233908161017e-08, "loss": 0.8859, "step": 49624 }, { "epoch": 0.94, "learning_rate": 5.307102459400415e-08, "loss": 0.9312, "step": 49625 }, { "epoch": 0.94, "learning_rate": 5.303971924315615e-08, "loss": 1.0187, "step": 49626 }, { "epoch": 0.94, "learning_rate": 5.300842302918302e-08, "loss": 0.9714, "step": 49627 }, { "epoch": 0.94, "learning_rate": 5.297713595220105e-08, "loss": 0.7949, "step": 49628 }, { "epoch": 0.94, "learning_rate": 5.2945858012327655e-08, "loss": 0.9556, "step": 49629 }, { "epoch": 0.94, "learning_rate": 5.2914589209679677e-08, "loss": 0.8525, "step": 49630 }, { "epoch": 0.94, "learning_rate": 5.288332954437286e-08, "loss": 0.8149, "step": 49631 }, { "epoch": 0.94, "learning_rate": 5.2852079016525174e-08, "loss": 0.9865, "step": 49632 }, { "epoch": 0.94, "learning_rate": 5.2820837626252894e-08, "loss": 0.8594, "step": 49633 }, { "epoch": 0.94, "learning_rate": 5.278960537367234e-08, "loss": 0.9117, "step": 49634 }, { "epoch": 0.94, "learning_rate": 5.275838225890034e-08, "loss": 0.7825, "step": 49635 }, { "epoch": 0.94, "learning_rate": 5.272716828205349e-08, "loss": 0.7784, "step": 49636 }, { "epoch": 0.94, "learning_rate": 5.2695963443248347e-08, "loss": 0.9905, "step": 49637 }, { "epoch": 0.94, "learning_rate": 5.2664767742601485e-08, "loss": 1.0506, "step": 49638 }, { "epoch": 0.94, "learning_rate": 5.263358118022949e-08, "loss": 0.8897, "step": 49639 }, { "epoch": 0.94, "learning_rate": 5.260240375624837e-08, "loss": 0.9671, "step": 49640 }, { "epoch": 0.94, "learning_rate": 5.257123547077525e-08, "loss": 0.8585, "step": 49641 }, { "epoch": 0.94, "learning_rate": 5.2540076323925884e-08, "loss": 0.9205, "step": 49642 }, { "epoch": 0.94, "learning_rate": 5.250892631581655e-08, "loss": 0.9604, "step": 49643 }, { "epoch": 0.94, "learning_rate": 5.24777854465644e-08, "loss": 0.8346, "step": 49644 }, { "epoch": 0.94, "learning_rate": 5.244665371628488e-08, "loss": 0.8166, "step": 49645 }, { "epoch": 0.94, "learning_rate": 5.241553112509429e-08, "loss": 0.7978, "step": 49646 }, { "epoch": 0.94, "learning_rate": 5.23844176731092e-08, "loss": 0.9203, "step": 49647 }, { "epoch": 0.94, "learning_rate": 5.2353313360445914e-08, "loss": 0.9025, "step": 49648 }, { "epoch": 0.94, "learning_rate": 5.2322218187219885e-08, "loss": 1.3301, "step": 49649 }, { "epoch": 0.94, "learning_rate": 5.229113215354797e-08, "loss": 1.1508, "step": 49650 }, { "epoch": 0.94, "learning_rate": 5.226005525954592e-08, "loss": 0.9887, "step": 49651 }, { "epoch": 0.94, "learning_rate": 5.222898750532946e-08, "loss": 1.0275, "step": 49652 }, { "epoch": 0.94, "learning_rate": 5.2197928891015436e-08, "loss": 0.813, "step": 49653 }, { "epoch": 0.94, "learning_rate": 5.2166879416718774e-08, "loss": 0.9363, "step": 49654 }, { "epoch": 0.94, "learning_rate": 5.2135839082556314e-08, "loss": 0.8986, "step": 49655 }, { "epoch": 0.94, "learning_rate": 5.210480788864325e-08, "loss": 1.0326, "step": 49656 }, { "epoch": 0.94, "learning_rate": 5.207378583509587e-08, "loss": 1.1214, "step": 49657 }, { "epoch": 0.94, "learning_rate": 5.2042772922030196e-08, "loss": 0.7873, "step": 49658 }, { "epoch": 0.94, "learning_rate": 5.201176914956141e-08, "loss": 0.873, "step": 49659 }, { "epoch": 0.94, "learning_rate": 5.198077451780581e-08, "loss": 0.715, "step": 49660 }, { "epoch": 0.94, "learning_rate": 5.194978902687886e-08, "loss": 0.9351, "step": 49661 }, { "epoch": 0.94, "learning_rate": 5.191881267689658e-08, "loss": 1.0291, "step": 49662 }, { "epoch": 0.94, "learning_rate": 5.188784546797415e-08, "loss": 1.0902, "step": 49663 }, { "epoch": 0.94, "learning_rate": 5.185688740022704e-08, "loss": 0.8962, "step": 49664 }, { "epoch": 0.94, "learning_rate": 5.182593847377182e-08, "loss": 0.9105, "step": 49665 }, { "epoch": 0.94, "learning_rate": 5.17949986887234e-08, "loss": 0.7364, "step": 49666 }, { "epoch": 0.94, "learning_rate": 5.1764068045197236e-08, "loss": 0.8745, "step": 49667 }, { "epoch": 0.94, "learning_rate": 5.173314654330908e-08, "loss": 0.86, "step": 49668 }, { "epoch": 0.94, "learning_rate": 5.170223418317438e-08, "loss": 0.9443, "step": 49669 }, { "epoch": 0.94, "learning_rate": 5.167133096490834e-08, "loss": 0.7822, "step": 49670 }, { "epoch": 0.94, "learning_rate": 5.164043688862641e-08, "loss": 0.8879, "step": 49671 }, { "epoch": 0.94, "learning_rate": 5.160955195444434e-08, "loss": 0.7427, "step": 49672 }, { "epoch": 0.94, "learning_rate": 5.1578676162476746e-08, "loss": 0.867, "step": 49673 }, { "epoch": 0.94, "learning_rate": 5.1547809512839666e-08, "loss": 0.8397, "step": 49674 }, { "epoch": 0.94, "learning_rate": 5.151695200564771e-08, "loss": 1.1152, "step": 49675 }, { "epoch": 0.94, "learning_rate": 5.148610364101664e-08, "loss": 1.0066, "step": 49676 }, { "epoch": 0.94, "learning_rate": 5.145526441906107e-08, "loss": 0.9705, "step": 49677 }, { "epoch": 0.94, "learning_rate": 5.142443433989674e-08, "loss": 0.9673, "step": 49678 }, { "epoch": 0.94, "learning_rate": 5.13936134036383e-08, "loss": 0.7819, "step": 49679 }, { "epoch": 0.94, "learning_rate": 5.1362801610400914e-08, "loss": 0.9081, "step": 49680 }, { "epoch": 0.94, "learning_rate": 5.1331998960300336e-08, "loss": 0.9948, "step": 49681 }, { "epoch": 0.94, "learning_rate": 5.130120545345035e-08, "loss": 0.7587, "step": 49682 }, { "epoch": 0.94, "learning_rate": 5.1270421089966996e-08, "loss": 0.6666, "step": 49683 }, { "epoch": 0.94, "learning_rate": 5.123964586996461e-08, "loss": 0.8827, "step": 49684 }, { "epoch": 0.94, "learning_rate": 5.12088797935581e-08, "loss": 0.7411, "step": 49685 }, { "epoch": 0.94, "learning_rate": 5.117812286086293e-08, "loss": 0.7808, "step": 49686 }, { "epoch": 0.94, "learning_rate": 5.1147375071993465e-08, "loss": 1.0941, "step": 49687 }, { "epoch": 0.94, "learning_rate": 5.1116636427064605e-08, "loss": 1.0048, "step": 49688 }, { "epoch": 0.94, "learning_rate": 5.1085906926191255e-08, "loss": 0.6497, "step": 49689 }, { "epoch": 0.94, "learning_rate": 5.105518656948777e-08, "loss": 0.859, "step": 49690 }, { "epoch": 0.94, "learning_rate": 5.1024475357069336e-08, "loss": 1.0059, "step": 49691 }, { "epoch": 0.94, "learning_rate": 5.099377328905031e-08, "loss": 0.9109, "step": 49692 }, { "epoch": 0.94, "learning_rate": 5.0963080365545595e-08, "loss": 0.8598, "step": 49693 }, { "epoch": 0.94, "learning_rate": 5.093239658666954e-08, "loss": 0.9973, "step": 49694 }, { "epoch": 0.94, "learning_rate": 5.0901721952537064e-08, "loss": 0.955, "step": 49695 }, { "epoch": 0.94, "learning_rate": 5.087105646326196e-08, "loss": 0.929, "step": 49696 }, { "epoch": 0.94, "learning_rate": 5.084040011895969e-08, "loss": 0.9716, "step": 49697 }, { "epoch": 0.94, "learning_rate": 5.0809752919744046e-08, "loss": 0.8979, "step": 49698 }, { "epoch": 0.94, "learning_rate": 5.0779114865729675e-08, "loss": 1.1638, "step": 49699 }, { "epoch": 0.94, "learning_rate": 5.074848595703119e-08, "loss": 1.0884, "step": 49700 }, { "epoch": 0.94, "learning_rate": 5.07178661937624e-08, "loss": 0.9807, "step": 49701 }, { "epoch": 0.94, "learning_rate": 5.068725557603849e-08, "loss": 0.9861, "step": 49702 }, { "epoch": 0.94, "learning_rate": 5.065665410397297e-08, "loss": 0.9043, "step": 49703 }, { "epoch": 0.94, "learning_rate": 5.062606177768048e-08, "loss": 0.6352, "step": 49704 }, { "epoch": 0.94, "learning_rate": 5.0595478597275374e-08, "loss": 0.8466, "step": 49705 }, { "epoch": 0.94, "learning_rate": 5.056490456287117e-08, "loss": 1.0754, "step": 49706 }, { "epoch": 0.94, "learning_rate": 5.053433967458276e-08, "loss": 0.7951, "step": 49707 }, { "epoch": 0.94, "learning_rate": 5.0503783932524254e-08, "loss": 0.8714, "step": 49708 }, { "epoch": 0.94, "learning_rate": 5.047323733680914e-08, "loss": 0.723, "step": 49709 }, { "epoch": 0.94, "learning_rate": 5.044269988755207e-08, "loss": 0.8217, "step": 49710 }, { "epoch": 0.94, "learning_rate": 5.0412171584866833e-08, "loss": 0.7572, "step": 49711 }, { "epoch": 0.94, "learning_rate": 5.038165242886722e-08, "loss": 1.0825, "step": 49712 }, { "epoch": 0.94, "learning_rate": 5.03511424196676e-08, "loss": 1.0129, "step": 49713 }, { "epoch": 0.94, "learning_rate": 5.032064155738203e-08, "loss": 0.9725, "step": 49714 }, { "epoch": 0.94, "learning_rate": 5.029014984212349e-08, "loss": 0.933, "step": 49715 }, { "epoch": 0.94, "learning_rate": 5.0259667274006884e-08, "loss": 0.9949, "step": 49716 }, { "epoch": 0.94, "learning_rate": 5.0229193853145175e-08, "loss": 0.8018, "step": 49717 }, { "epoch": 0.94, "learning_rate": 5.019872957965272e-08, "loss": 1.0739, "step": 49718 }, { "epoch": 0.94, "learning_rate": 5.016827445364303e-08, "loss": 1.1117, "step": 49719 }, { "epoch": 0.94, "learning_rate": 5.013782847523019e-08, "loss": 0.7568, "step": 49720 }, { "epoch": 0.94, "learning_rate": 5.010739164452716e-08, "loss": 0.7754, "step": 49721 }, { "epoch": 0.94, "learning_rate": 5.0076963961648294e-08, "loss": 0.721, "step": 49722 }, { "epoch": 0.94, "learning_rate": 5.0046545426707116e-08, "loss": 0.9255, "step": 49723 }, { "epoch": 0.94, "learning_rate": 5.001613603981631e-08, "loss": 0.9102, "step": 49724 }, { "epoch": 0.94, "learning_rate": 4.998573580109079e-08, "loss": 1.0686, "step": 49725 }, { "epoch": 0.94, "learning_rate": 4.995534471064323e-08, "loss": 1.045, "step": 49726 }, { "epoch": 0.94, "learning_rate": 4.992496276858716e-08, "loss": 0.8682, "step": 49727 }, { "epoch": 0.94, "learning_rate": 4.989458997503638e-08, "loss": 0.8247, "step": 49728 }, { "epoch": 0.94, "learning_rate": 4.986422633010385e-08, "loss": 0.9261, "step": 49729 }, { "epoch": 0.94, "learning_rate": 4.983387183390337e-08, "loss": 0.8177, "step": 49730 }, { "epoch": 0.94, "learning_rate": 4.98035264865479e-08, "loss": 1.0246, "step": 49731 }, { "epoch": 0.94, "learning_rate": 4.977319028815125e-08, "loss": 0.9653, "step": 49732 }, { "epoch": 0.94, "learning_rate": 4.97428632388261e-08, "loss": 0.921, "step": 49733 }, { "epoch": 0.94, "learning_rate": 4.971254533868597e-08, "loss": 0.6607, "step": 49734 }, { "epoch": 0.94, "learning_rate": 4.9682236587844376e-08, "loss": 0.9557, "step": 49735 }, { "epoch": 0.94, "learning_rate": 4.965193698641374e-08, "loss": 0.7681, "step": 49736 }, { "epoch": 0.94, "learning_rate": 4.962164653450813e-08, "loss": 0.9156, "step": 49737 }, { "epoch": 0.94, "learning_rate": 4.9591365232239676e-08, "loss": 0.8693, "step": 49738 }, { "epoch": 0.94, "learning_rate": 4.9561093079722175e-08, "loss": 0.7834, "step": 49739 }, { "epoch": 0.94, "learning_rate": 4.9530830077068326e-08, "loss": 0.8348, "step": 49740 }, { "epoch": 0.94, "learning_rate": 4.950057622439136e-08, "loss": 0.7043, "step": 49741 }, { "epoch": 0.94, "learning_rate": 4.947033152180397e-08, "loss": 0.8076, "step": 49742 }, { "epoch": 0.94, "learning_rate": 4.94400959694194e-08, "loss": 0.9824, "step": 49743 }, { "epoch": 0.94, "learning_rate": 4.940986956735033e-08, "loss": 1.0659, "step": 49744 }, { "epoch": 0.94, "learning_rate": 4.937965231570946e-08, "loss": 0.7912, "step": 49745 }, { "epoch": 0.94, "learning_rate": 4.934944421461002e-08, "loss": 0.9582, "step": 49746 }, { "epoch": 0.94, "learning_rate": 4.93192452641647e-08, "loss": 0.6771, "step": 49747 }, { "epoch": 0.94, "learning_rate": 4.928905546448592e-08, "loss": 0.7805, "step": 49748 }, { "epoch": 0.94, "learning_rate": 4.925887481568692e-08, "loss": 1.02, "step": 49749 }, { "epoch": 0.94, "learning_rate": 4.92287033178801e-08, "loss": 1.0696, "step": 49750 }, { "epoch": 0.94, "learning_rate": 4.9198540971177876e-08, "loss": 1.0502, "step": 49751 }, { "epoch": 0.94, "learning_rate": 4.916838777569349e-08, "loss": 0.8672, "step": 49752 }, { "epoch": 0.94, "learning_rate": 4.913824373153908e-08, "loss": 0.9595, "step": 49753 }, { "epoch": 0.94, "learning_rate": 4.910810883882705e-08, "loss": 0.7249, "step": 49754 }, { "epoch": 0.94, "learning_rate": 4.9077983097670644e-08, "loss": 0.7734, "step": 49755 }, { "epoch": 0.94, "learning_rate": 4.904786650818172e-08, "loss": 1.1448, "step": 49756 }, { "epoch": 0.94, "learning_rate": 4.901775907047268e-08, "loss": 0.8019, "step": 49757 }, { "epoch": 0.94, "learning_rate": 4.898766078465678e-08, "loss": 0.7261, "step": 49758 }, { "epoch": 0.94, "learning_rate": 4.8957571650845306e-08, "loss": 0.9883, "step": 49759 }, { "epoch": 0.94, "learning_rate": 4.892749166915123e-08, "loss": 0.8745, "step": 49760 }, { "epoch": 0.94, "learning_rate": 4.889742083968668e-08, "loss": 1.012, "step": 49761 }, { "epoch": 0.94, "learning_rate": 4.8867359162564074e-08, "loss": 0.9796, "step": 49762 }, { "epoch": 0.94, "learning_rate": 4.883730663789582e-08, "loss": 1.0562, "step": 49763 }, { "epoch": 0.94, "learning_rate": 4.880726326579349e-08, "loss": 1.1583, "step": 49764 }, { "epoch": 0.94, "learning_rate": 4.8777229046370055e-08, "loss": 0.8347, "step": 49765 }, { "epoch": 0.94, "learning_rate": 4.874720397973709e-08, "loss": 0.7252, "step": 49766 }, { "epoch": 0.94, "learning_rate": 4.871718806600701e-08, "loss": 0.8484, "step": 49767 }, { "epoch": 0.94, "learning_rate": 4.868718130529165e-08, "loss": 1.0473, "step": 49768 }, { "epoch": 0.94, "learning_rate": 4.865718369770317e-08, "loss": 0.8373, "step": 49769 }, { "epoch": 0.94, "learning_rate": 4.8627195243353964e-08, "loss": 0.8255, "step": 49770 }, { "epoch": 0.94, "learning_rate": 4.8597215942355336e-08, "loss": 0.8052, "step": 49771 }, { "epoch": 0.94, "learning_rate": 4.8567245794819695e-08, "loss": 0.9594, "step": 49772 }, { "epoch": 0.94, "learning_rate": 4.853728480085862e-08, "loss": 0.723, "step": 49773 }, { "epoch": 0.94, "learning_rate": 4.8507332960584244e-08, "loss": 0.911, "step": 49774 }, { "epoch": 0.94, "learning_rate": 4.8477390274108137e-08, "loss": 1.0075, "step": 49775 }, { "epoch": 0.94, "learning_rate": 4.844745674154244e-08, "loss": 0.8184, "step": 49776 }, { "epoch": 0.94, "learning_rate": 4.841753236299901e-08, "loss": 0.8546, "step": 49777 }, { "epoch": 0.94, "learning_rate": 4.838761713858914e-08, "loss": 0.7927, "step": 49778 }, { "epoch": 0.94, "learning_rate": 4.8357711068424684e-08, "loss": 0.6588, "step": 49779 }, { "epoch": 0.94, "learning_rate": 4.8327814152617504e-08, "loss": 0.9178, "step": 49780 }, { "epoch": 0.94, "learning_rate": 4.829792639127889e-08, "loss": 1.0082, "step": 49781 }, { "epoch": 0.94, "learning_rate": 4.826804778452099e-08, "loss": 0.8962, "step": 49782 }, { "epoch": 0.94, "learning_rate": 4.823817833245481e-08, "loss": 0.6683, "step": 49783 }, { "epoch": 0.94, "learning_rate": 4.8208318035191935e-08, "loss": 0.9095, "step": 49784 }, { "epoch": 0.94, "learning_rate": 4.817846689284422e-08, "loss": 1.0225, "step": 49785 }, { "epoch": 0.94, "learning_rate": 4.814862490552297e-08, "loss": 0.9138, "step": 49786 }, { "epoch": 0.94, "learning_rate": 4.811879207333947e-08, "loss": 0.9507, "step": 49787 }, { "epoch": 0.94, "learning_rate": 4.808896839640531e-08, "loss": 0.9774, "step": 49788 }, { "epoch": 0.94, "learning_rate": 4.805915387483179e-08, "loss": 0.9915, "step": 49789 }, { "epoch": 0.94, "learning_rate": 4.8029348508729925e-08, "loss": 1.0269, "step": 49790 }, { "epoch": 0.94, "learning_rate": 4.799955229821185e-08, "loss": 0.7816, "step": 49791 }, { "epoch": 0.94, "learning_rate": 4.796976524338776e-08, "loss": 0.9547, "step": 49792 }, { "epoch": 0.94, "learning_rate": 4.79399873443695e-08, "loss": 1.1591, "step": 49793 }, { "epoch": 0.94, "learning_rate": 4.7910218601268376e-08, "loss": 1.1439, "step": 49794 }, { "epoch": 0.94, "learning_rate": 4.7880459014195134e-08, "loss": 0.8527, "step": 49795 }, { "epoch": 0.94, "learning_rate": 4.785070858326107e-08, "loss": 0.9682, "step": 49796 }, { "epoch": 0.94, "learning_rate": 4.7820967308577214e-08, "loss": 0.849, "step": 49797 }, { "epoch": 0.94, "learning_rate": 4.7791235190254856e-08, "loss": 0.7293, "step": 49798 }, { "epoch": 0.94, "learning_rate": 4.776151222840447e-08, "loss": 0.9695, "step": 49799 }, { "epoch": 0.94, "learning_rate": 4.773179842313791e-08, "loss": 1.0486, "step": 49800 }, { "epoch": 0.94, "learning_rate": 4.770209377456536e-08, "loss": 0.9738, "step": 49801 }, { "epoch": 0.94, "learning_rate": 4.767239828279813e-08, "loss": 0.7094, "step": 49802 }, { "epoch": 0.94, "learning_rate": 4.7642711947946675e-08, "loss": 0.975, "step": 49803 }, { "epoch": 0.94, "learning_rate": 4.761303477012258e-08, "loss": 0.8964, "step": 49804 }, { "epoch": 0.94, "learning_rate": 4.7583366749435754e-08, "loss": 0.7686, "step": 49805 }, { "epoch": 0.94, "learning_rate": 4.755370788599778e-08, "loss": 0.9102, "step": 49806 }, { "epoch": 0.94, "learning_rate": 4.7524058179919117e-08, "loss": 0.9333, "step": 49807 }, { "epoch": 0.94, "learning_rate": 4.7494417631309966e-08, "loss": 0.9016, "step": 49808 }, { "epoch": 0.94, "learning_rate": 4.746478624028217e-08, "loss": 0.8789, "step": 49809 }, { "epoch": 0.94, "learning_rate": 4.743516400694509e-08, "loss": 0.6998, "step": 49810 }, { "epoch": 0.94, "learning_rate": 4.7405550931410025e-08, "loss": 0.9727, "step": 49811 }, { "epoch": 0.94, "learning_rate": 4.7375947013787724e-08, "loss": 0.9688, "step": 49812 }, { "epoch": 0.94, "learning_rate": 4.73463522541881e-08, "loss": 1.0855, "step": 49813 }, { "epoch": 0.94, "learning_rate": 4.731676665272217e-08, "loss": 1.0057, "step": 49814 }, { "epoch": 0.94, "learning_rate": 4.728719020950012e-08, "loss": 0.8282, "step": 49815 }, { "epoch": 0.94, "learning_rate": 4.725762292463243e-08, "loss": 0.9036, "step": 49816 }, { "epoch": 0.94, "learning_rate": 4.722806479822983e-08, "loss": 0.7435, "step": 49817 }, { "epoch": 0.94, "learning_rate": 4.719851583040225e-08, "loss": 0.8956, "step": 49818 }, { "epoch": 0.94, "learning_rate": 4.716897602126042e-08, "loss": 1.0932, "step": 49819 }, { "epoch": 0.94, "learning_rate": 4.713944537091397e-08, "loss": 0.922, "step": 49820 }, { "epoch": 0.94, "learning_rate": 4.710992387947422e-08, "loss": 0.8903, "step": 49821 }, { "epoch": 0.94, "learning_rate": 4.708041154705051e-08, "loss": 0.6458, "step": 49822 }, { "epoch": 0.94, "learning_rate": 4.7050908373753314e-08, "loss": 0.8564, "step": 49823 }, { "epoch": 0.94, "learning_rate": 4.702141435969282e-08, "loss": 1.0126, "step": 49824 }, { "epoch": 0.94, "learning_rate": 4.6991929504979214e-08, "loss": 0.7687, "step": 49825 }, { "epoch": 0.94, "learning_rate": 4.696245380972242e-08, "loss": 0.866, "step": 49826 }, { "epoch": 0.94, "learning_rate": 4.6932987274032615e-08, "loss": 0.845, "step": 49827 }, { "epoch": 0.94, "learning_rate": 4.6903529898019996e-08, "loss": 1.0484, "step": 49828 }, { "epoch": 0.94, "learning_rate": 4.687408168179419e-08, "loss": 0.8099, "step": 49829 }, { "epoch": 0.94, "learning_rate": 4.684464262546568e-08, "loss": 1.0294, "step": 49830 }, { "epoch": 0.94, "learning_rate": 4.6815212729143524e-08, "loss": 1.1529, "step": 49831 }, { "epoch": 0.94, "learning_rate": 4.67857919929382e-08, "loss": 0.9396, "step": 49832 }, { "epoch": 0.94, "learning_rate": 4.675638041696018e-08, "loss": 0.7184, "step": 49833 }, { "epoch": 0.94, "learning_rate": 4.672697800131798e-08, "loss": 0.8398, "step": 49834 }, { "epoch": 0.94, "learning_rate": 4.669758474612235e-08, "loss": 0.7795, "step": 49835 }, { "epoch": 0.94, "learning_rate": 4.666820065148264e-08, "loss": 1.0252, "step": 49836 }, { "epoch": 0.94, "learning_rate": 4.663882571750849e-08, "loss": 1.1072, "step": 49837 }, { "epoch": 0.94, "learning_rate": 4.660945994430982e-08, "loss": 0.9807, "step": 49838 }, { "epoch": 0.94, "learning_rate": 4.658010333199625e-08, "loss": 0.9883, "step": 49839 }, { "epoch": 0.94, "learning_rate": 4.655075588067742e-08, "loss": 0.8807, "step": 49840 }, { "epoch": 0.94, "learning_rate": 4.652141759046269e-08, "loss": 0.893, "step": 49841 }, { "epoch": 0.94, "learning_rate": 4.6492088461461973e-08, "loss": 0.7622, "step": 49842 }, { "epoch": 0.94, "learning_rate": 4.646276849378434e-08, "loss": 0.9921, "step": 49843 }, { "epoch": 0.94, "learning_rate": 4.643345768753971e-08, "loss": 0.9777, "step": 49844 }, { "epoch": 0.94, "learning_rate": 4.6404156042837156e-08, "loss": 0.9341, "step": 49845 }, { "epoch": 0.94, "learning_rate": 4.637486355978632e-08, "loss": 0.9373, "step": 49846 }, { "epoch": 0.94, "learning_rate": 4.6345580238496554e-08, "loss": 0.9568, "step": 49847 }, { "epoch": 0.94, "learning_rate": 4.6316306079076945e-08, "loss": 0.7162, "step": 49848 }, { "epoch": 0.94, "learning_rate": 4.62870410816374e-08, "loss": 0.9336, "step": 49849 }, { "epoch": 0.94, "learning_rate": 4.625778524628671e-08, "loss": 1.2227, "step": 49850 }, { "epoch": 0.94, "learning_rate": 4.622853857313397e-08, "loss": 0.8174, "step": 49851 }, { "epoch": 0.94, "learning_rate": 4.6199301062288813e-08, "loss": 0.8482, "step": 49852 }, { "epoch": 0.94, "learning_rate": 4.617007271386004e-08, "loss": 0.942, "step": 49853 }, { "epoch": 0.94, "learning_rate": 4.6140853527957276e-08, "loss": 0.754, "step": 49854 }, { "epoch": 0.94, "learning_rate": 4.611164350468905e-08, "loss": 0.7774, "step": 49855 }, { "epoch": 0.94, "learning_rate": 4.608244264416501e-08, "loss": 1.099, "step": 49856 }, { "epoch": 0.94, "learning_rate": 4.605325094649338e-08, "loss": 0.8546, "step": 49857 }, { "epoch": 0.94, "learning_rate": 4.6024068411784086e-08, "loss": 0.8187, "step": 49858 }, { "epoch": 0.94, "learning_rate": 4.5994895040145926e-08, "loss": 1.0338, "step": 49859 }, { "epoch": 0.94, "learning_rate": 4.596573083168687e-08, "loss": 0.7253, "step": 49860 }, { "epoch": 0.94, "learning_rate": 4.593657578651711e-08, "loss": 0.9131, "step": 49861 }, { "epoch": 0.94, "learning_rate": 4.590742990474489e-08, "loss": 0.996, "step": 49862 }, { "epoch": 0.94, "learning_rate": 4.587829318647874e-08, "loss": 1.0074, "step": 49863 }, { "epoch": 0.94, "learning_rate": 4.5849165631828006e-08, "loss": 0.9177, "step": 49864 }, { "epoch": 0.94, "learning_rate": 4.582004724090122e-08, "loss": 0.7957, "step": 49865 }, { "epoch": 0.94, "learning_rate": 4.579093801380718e-08, "loss": 0.7574, "step": 49866 }, { "epoch": 0.94, "learning_rate": 4.576183795065442e-08, "loss": 0.6436, "step": 49867 }, { "epoch": 0.94, "learning_rate": 4.5732747051552005e-08, "loss": 0.9954, "step": 49868 }, { "epoch": 0.94, "learning_rate": 4.570366531660791e-08, "loss": 1.0272, "step": 49869 }, { "epoch": 0.94, "learning_rate": 4.5674592745931226e-08, "loss": 1.134, "step": 49870 }, { "epoch": 0.94, "learning_rate": 4.5645529339630456e-08, "loss": 0.5735, "step": 49871 }, { "epoch": 0.94, "learning_rate": 4.561647509781386e-08, "loss": 0.8561, "step": 49872 }, { "epoch": 0.94, "learning_rate": 4.558743002059024e-08, "loss": 0.7822, "step": 49873 }, { "epoch": 0.94, "learning_rate": 4.5558394108067564e-08, "loss": 0.8628, "step": 49874 }, { "epoch": 0.94, "learning_rate": 4.5529367360354906e-08, "loss": 0.982, "step": 49875 }, { "epoch": 0.94, "learning_rate": 4.550034977756024e-08, "loss": 0.9286, "step": 49876 }, { "epoch": 0.94, "learning_rate": 4.547134135979236e-08, "loss": 0.9785, "step": 49877 }, { "epoch": 0.94, "learning_rate": 4.5442342107158423e-08, "loss": 0.9319, "step": 49878 }, { "epoch": 0.94, "learning_rate": 4.541335201976804e-08, "loss": 0.7565, "step": 49879 }, { "epoch": 0.94, "learning_rate": 4.53843710977292e-08, "loss": 0.8639, "step": 49880 }, { "epoch": 0.94, "learning_rate": 4.53553993411493e-08, "loss": 1.0528, "step": 49881 }, { "epoch": 0.94, "learning_rate": 4.5326436750137426e-08, "loss": 1.0692, "step": 49882 }, { "epoch": 0.94, "learning_rate": 4.529748332480127e-08, "loss": 0.7934, "step": 49883 }, { "epoch": 0.94, "learning_rate": 4.526853906524909e-08, "loss": 0.8723, "step": 49884 }, { "epoch": 0.94, "learning_rate": 4.5239603971589105e-08, "loss": 0.9244, "step": 49885 }, { "epoch": 0.94, "learning_rate": 4.521067804392876e-08, "loss": 0.8178, "step": 49886 }, { "epoch": 0.94, "learning_rate": 4.5181761282376837e-08, "loss": 0.9139, "step": 49887 }, { "epoch": 0.94, "learning_rate": 4.5152853687040755e-08, "loss": 0.933, "step": 49888 }, { "epoch": 0.94, "learning_rate": 4.5123955258028765e-08, "loss": 1.0305, "step": 49889 }, { "epoch": 0.94, "learning_rate": 4.509506599544855e-08, "loss": 0.959, "step": 49890 }, { "epoch": 0.94, "learning_rate": 4.506618589940809e-08, "loss": 0.7279, "step": 49891 }, { "epoch": 0.94, "learning_rate": 4.5037314970015344e-08, "loss": 1.0198, "step": 49892 }, { "epoch": 0.94, "learning_rate": 4.500845320737801e-08, "loss": 0.9948, "step": 49893 }, { "epoch": 0.94, "learning_rate": 4.49796006116035e-08, "loss": 1.1868, "step": 49894 }, { "epoch": 0.94, "learning_rate": 4.495075718280034e-08, "loss": 0.899, "step": 49895 }, { "epoch": 0.94, "learning_rate": 4.492192292107539e-08, "loss": 0.7331, "step": 49896 }, { "epoch": 0.94, "learning_rate": 4.489309782653689e-08, "loss": 0.838, "step": 49897 }, { "epoch": 0.94, "learning_rate": 4.486428189929254e-08, "loss": 0.8363, "step": 49898 }, { "epoch": 0.94, "learning_rate": 4.483547513944919e-08, "loss": 0.8833, "step": 49899 }, { "epoch": 0.94, "learning_rate": 4.4806677547115096e-08, "loss": 1.0661, "step": 49900 }, { "epoch": 0.94, "learning_rate": 4.477788912239794e-08, "loss": 0.8912, "step": 49901 }, { "epoch": 0.94, "learning_rate": 4.4749109865404315e-08, "loss": 0.7215, "step": 49902 }, { "epoch": 0.94, "learning_rate": 4.472033977624246e-08, "loss": 0.933, "step": 49903 }, { "epoch": 0.94, "learning_rate": 4.469157885501979e-08, "loss": 0.7117, "step": 49904 }, { "epoch": 0.94, "learning_rate": 4.466282710184317e-08, "loss": 1.012, "step": 49905 }, { "epoch": 0.94, "learning_rate": 4.463408451682028e-08, "loss": 1.0399, "step": 49906 }, { "epoch": 0.94, "learning_rate": 4.460535110005854e-08, "loss": 1.0813, "step": 49907 }, { "epoch": 0.94, "learning_rate": 4.457662685166508e-08, "loss": 0.7515, "step": 49908 }, { "epoch": 0.94, "learning_rate": 4.454791177174733e-08, "loss": 0.7921, "step": 49909 }, { "epoch": 0.94, "learning_rate": 4.45192058604127e-08, "loss": 0.7644, "step": 49910 }, { "epoch": 0.94, "learning_rate": 4.449050911776748e-08, "loss": 0.7605, "step": 49911 }, { "epoch": 0.94, "learning_rate": 4.446182154391965e-08, "loss": 0.9279, "step": 49912 }, { "epoch": 0.94, "learning_rate": 4.4433143138976065e-08, "loss": 0.7942, "step": 49913 }, { "epoch": 0.94, "learning_rate": 4.440447390304387e-08, "loss": 0.8631, "step": 49914 }, { "epoch": 0.94, "learning_rate": 4.4375813836229905e-08, "loss": 1.0567, "step": 49915 }, { "epoch": 0.94, "learning_rate": 4.434716293864161e-08, "loss": 0.7806, "step": 49916 }, { "epoch": 0.94, "learning_rate": 4.4318521210385545e-08, "loss": 0.9359, "step": 49917 }, { "epoch": 0.94, "learning_rate": 4.428988865156886e-08, "loss": 0.8637, "step": 49918 }, { "epoch": 0.94, "learning_rate": 4.426126526229868e-08, "loss": 0.9773, "step": 49919 }, { "epoch": 0.94, "learning_rate": 4.4232651042681316e-08, "loss": 1.0369, "step": 49920 }, { "epoch": 0.94, "learning_rate": 4.420404599282391e-08, "loss": 0.9872, "step": 49921 }, { "epoch": 0.94, "learning_rate": 4.4175450112833585e-08, "loss": 0.9755, "step": 49922 }, { "epoch": 0.94, "learning_rate": 4.4146863402816654e-08, "loss": 0.8722, "step": 49923 }, { "epoch": 0.94, "learning_rate": 4.411828586288025e-08, "loss": 0.9412, "step": 49924 }, { "epoch": 0.94, "learning_rate": 4.4089717493130676e-08, "loss": 1.016, "step": 49925 }, { "epoch": 0.94, "learning_rate": 4.40611582936748e-08, "loss": 0.9392, "step": 49926 }, { "epoch": 0.94, "learning_rate": 4.403260826461919e-08, "loss": 0.6936, "step": 49927 }, { "epoch": 0.94, "learning_rate": 4.400406740607044e-08, "loss": 0.7517, "step": 49928 }, { "epoch": 0.94, "learning_rate": 4.39755357181354e-08, "loss": 0.8074, "step": 49929 }, { "epoch": 0.94, "learning_rate": 4.3947013200920375e-08, "loss": 0.876, "step": 49930 }, { "epoch": 0.94, "learning_rate": 4.3918499854532226e-08, "loss": 1.1744, "step": 49931 }, { "epoch": 0.94, "learning_rate": 4.3889995679076425e-08, "loss": 0.7469, "step": 49932 }, { "epoch": 0.94, "learning_rate": 4.386150067466066e-08, "loss": 0.8913, "step": 49933 }, { "epoch": 0.94, "learning_rate": 4.383301484139041e-08, "loss": 1.0172, "step": 49934 }, { "epoch": 0.94, "learning_rate": 4.380453817937253e-08, "loss": 0.8855, "step": 49935 }, { "epoch": 0.94, "learning_rate": 4.3776070688713037e-08, "loss": 0.9971, "step": 49936 }, { "epoch": 0.94, "learning_rate": 4.3747612369518525e-08, "loss": 0.9854, "step": 49937 }, { "epoch": 0.94, "learning_rate": 4.371916322189501e-08, "loss": 0.8099, "step": 49938 }, { "epoch": 0.94, "learning_rate": 4.3690723245948806e-08, "loss": 0.7571, "step": 49939 }, { "epoch": 0.94, "learning_rate": 4.366229244178649e-08, "loss": 0.8651, "step": 49940 }, { "epoch": 0.94, "learning_rate": 4.3633870809513256e-08, "loss": 0.9426, "step": 49941 }, { "epoch": 0.94, "learning_rate": 4.360545834923624e-08, "loss": 0.972, "step": 49942 }, { "epoch": 0.94, "learning_rate": 4.357705506106119e-08, "loss": 0.9545, "step": 49943 }, { "epoch": 0.94, "learning_rate": 4.354866094509358e-08, "loss": 1.1301, "step": 49944 }, { "epoch": 0.94, "learning_rate": 4.352027600144054e-08, "loss": 0.7495, "step": 49945 }, { "epoch": 0.94, "learning_rate": 4.3491900230207274e-08, "loss": 0.6635, "step": 49946 }, { "epoch": 0.94, "learning_rate": 4.346353363150008e-08, "loss": 0.6903, "step": 49947 }, { "epoch": 0.94, "learning_rate": 4.3435176205424424e-08, "loss": 0.8483, "step": 49948 }, { "epoch": 0.94, "learning_rate": 4.340682795208662e-08, "loss": 0.8292, "step": 49949 }, { "epoch": 0.94, "learning_rate": 4.3378488871592406e-08, "loss": 0.9967, "step": 49950 }, { "epoch": 0.94, "learning_rate": 4.3350158964047536e-08, "loss": 0.9825, "step": 49951 }, { "epoch": 0.94, "learning_rate": 4.332183822955832e-08, "loss": 0.9081, "step": 49952 }, { "epoch": 0.94, "learning_rate": 4.329352666822939e-08, "loss": 0.8183, "step": 49953 }, { "epoch": 0.94, "learning_rate": 4.3265224280167605e-08, "loss": 0.8685, "step": 49954 }, { "epoch": 0.94, "learning_rate": 4.3236931065477883e-08, "loss": 1.0031, "step": 49955 }, { "epoch": 0.94, "learning_rate": 4.320864702426569e-08, "loss": 1.2269, "step": 49956 }, { "epoch": 0.94, "learning_rate": 4.31803721566379e-08, "loss": 0.8718, "step": 49957 }, { "epoch": 0.94, "learning_rate": 4.315210646269885e-08, "loss": 0.7066, "step": 49958 }, { "epoch": 0.94, "learning_rate": 4.3123849942554584e-08, "loss": 0.7119, "step": 49959 }, { "epoch": 0.94, "learning_rate": 4.309560259631057e-08, "loss": 0.8433, "step": 49960 }, { "epoch": 0.94, "learning_rate": 4.3067364424072e-08, "loss": 0.9188, "step": 49961 }, { "epoch": 0.94, "learning_rate": 4.30391354259449e-08, "loss": 0.8814, "step": 49962 }, { "epoch": 0.94, "learning_rate": 4.301091560203419e-08, "loss": 1.1035, "step": 49963 }, { "epoch": 0.94, "learning_rate": 4.298270495244561e-08, "loss": 1.0383, "step": 49964 }, { "epoch": 0.94, "learning_rate": 4.29545034772838e-08, "loss": 0.6475, "step": 49965 }, { "epoch": 0.94, "learning_rate": 4.292631117665508e-08, "loss": 1.023, "step": 49966 }, { "epoch": 0.94, "learning_rate": 4.289812805066379e-08, "loss": 0.7682, "step": 49967 }, { "epoch": 0.94, "learning_rate": 4.286995409941569e-08, "loss": 1.1307, "step": 49968 }, { "epoch": 0.94, "learning_rate": 4.284178932301569e-08, "loss": 0.9938, "step": 49969 }, { "epoch": 0.94, "learning_rate": 4.281363372156927e-08, "loss": 0.9202, "step": 49970 }, { "epoch": 0.94, "learning_rate": 4.2785487295181336e-08, "loss": 0.8857, "step": 49971 }, { "epoch": 0.94, "learning_rate": 4.275735004395709e-08, "loss": 0.9057, "step": 49972 }, { "epoch": 0.94, "learning_rate": 4.272922196800172e-08, "loss": 0.8947, "step": 49973 }, { "epoch": 0.94, "learning_rate": 4.270110306741959e-08, "loss": 0.8515, "step": 49974 }, { "epoch": 0.94, "learning_rate": 4.267299334231673e-08, "loss": 1.1373, "step": 49975 }, { "epoch": 0.94, "learning_rate": 4.264489279279749e-08, "loss": 0.847, "step": 49976 }, { "epoch": 0.94, "learning_rate": 4.2616801418966514e-08, "loss": 0.5417, "step": 49977 }, { "epoch": 0.94, "learning_rate": 4.258871922092955e-08, "loss": 0.9189, "step": 49978 }, { "epoch": 0.94, "learning_rate": 4.256064619879069e-08, "loss": 0.8618, "step": 49979 }, { "epoch": 0.94, "learning_rate": 4.2532582352655114e-08, "loss": 0.8596, "step": 49980 }, { "epoch": 0.94, "learning_rate": 4.250452768262747e-08, "loss": 1.0148, "step": 49981 }, { "epoch": 0.94, "learning_rate": 4.2476482188812396e-08, "loss": 0.8097, "step": 49982 }, { "epoch": 0.94, "learning_rate": 4.244844587131508e-08, "loss": 0.8892, "step": 49983 }, { "epoch": 0.94, "learning_rate": 4.242041873023961e-08, "loss": 0.8211, "step": 49984 }, { "epoch": 0.94, "learning_rate": 4.2392400765691455e-08, "loss": 1.0179, "step": 49985 }, { "epoch": 0.94, "learning_rate": 4.236439197777415e-08, "loss": 0.7036, "step": 49986 }, { "epoch": 0.94, "learning_rate": 4.2336392366593426e-08, "loss": 1.1497, "step": 49987 }, { "epoch": 0.94, "learning_rate": 4.230840193225283e-08, "loss": 0.9571, "step": 49988 }, { "epoch": 0.94, "learning_rate": 4.228042067485727e-08, "loss": 0.7419, "step": 49989 }, { "epoch": 0.94, "learning_rate": 4.2252448594511386e-08, "loss": 0.711, "step": 49990 }, { "epoch": 0.94, "learning_rate": 4.222448569131954e-08, "loss": 0.8623, "step": 49991 }, { "epoch": 0.94, "learning_rate": 4.219653196538609e-08, "loss": 0.7916, "step": 49992 }, { "epoch": 0.94, "learning_rate": 4.21685874168154e-08, "loss": 0.9553, "step": 49993 }, { "epoch": 0.94, "learning_rate": 4.2140652045712107e-08, "loss": 0.9216, "step": 49994 }, { "epoch": 0.94, "learning_rate": 4.211272585218001e-08, "loss": 0.8823, "step": 49995 }, { "epoch": 0.94, "learning_rate": 4.2084808836323765e-08, "loss": 0.9968, "step": 49996 }, { "epoch": 0.94, "learning_rate": 4.205690099824744e-08, "loss": 0.8984, "step": 49997 }, { "epoch": 0.94, "learning_rate": 4.2029002338054846e-08, "loss": 0.8587, "step": 49998 }, { "epoch": 0.94, "learning_rate": 4.200111285585118e-08, "loss": 0.8845, "step": 49999 }, { "epoch": 0.94, "learning_rate": 4.197323255173968e-08, "loss": 1.0015, "step": 50000 }, { "epoch": 0.94, "learning_rate": 4.1945361425825004e-08, "loss": 0.9788, "step": 50001 }, { "epoch": 0.94, "learning_rate": 4.191749947821094e-08, "loss": 0.8453, "step": 50002 }, { "epoch": 0.94, "learning_rate": 4.188964670900131e-08, "loss": 1.023, "step": 50003 }, { "epoch": 0.94, "learning_rate": 4.186180311830046e-08, "loss": 0.6782, "step": 50004 }, { "epoch": 0.94, "learning_rate": 4.183396870621248e-08, "loss": 1.3036, "step": 50005 }, { "epoch": 0.94, "learning_rate": 4.1806143472841174e-08, "loss": 1.1397, "step": 50006 }, { "epoch": 0.94, "learning_rate": 4.17783274182898e-08, "loss": 0.7448, "step": 50007 }, { "epoch": 0.94, "learning_rate": 4.1750520542663265e-08, "loss": 0.9727, "step": 50008 }, { "epoch": 0.94, "learning_rate": 4.172272284606482e-08, "loss": 0.644, "step": 50009 }, { "epoch": 0.94, "learning_rate": 4.169493432859828e-08, "loss": 0.8132, "step": 50010 }, { "epoch": 0.94, "learning_rate": 4.166715499036744e-08, "loss": 0.6604, "step": 50011 }, { "epoch": 0.94, "learning_rate": 4.163938483147612e-08, "loss": 1.0932, "step": 50012 }, { "epoch": 0.94, "learning_rate": 4.1611623852028104e-08, "loss": 1.0941, "step": 50013 }, { "epoch": 0.94, "learning_rate": 4.158387205212666e-08, "loss": 0.8791, "step": 50014 }, { "epoch": 0.94, "learning_rate": 4.155612943187615e-08, "loss": 0.7697, "step": 50015 }, { "epoch": 0.94, "learning_rate": 4.152839599137898e-08, "loss": 0.8986, "step": 50016 }, { "epoch": 0.94, "learning_rate": 4.1500671730740075e-08, "loss": 1.1223, "step": 50017 }, { "epoch": 0.94, "learning_rate": 4.1472956650061844e-08, "loss": 1.1659, "step": 50018 }, { "epoch": 0.94, "learning_rate": 4.1445250749448106e-08, "loss": 0.9447, "step": 50019 }, { "epoch": 0.94, "learning_rate": 4.141755402900266e-08, "loss": 0.8219, "step": 50020 }, { "epoch": 0.94, "learning_rate": 4.1389866488828755e-08, "loss": 0.8031, "step": 50021 }, { "epoch": 0.94, "learning_rate": 4.1362188129029644e-08, "loss": 0.7687, "step": 50022 }, { "epoch": 0.94, "learning_rate": 4.133451894970858e-08, "loss": 0.9067, "step": 50023 }, { "epoch": 0.94, "learning_rate": 4.1306858950969086e-08, "loss": 0.9833, "step": 50024 }, { "epoch": 0.94, "learning_rate": 4.1279208132914414e-08, "loss": 1.0753, "step": 50025 }, { "epoch": 0.94, "learning_rate": 4.12515664956481e-08, "loss": 0.7974, "step": 50026 }, { "epoch": 0.94, "learning_rate": 4.1223934039272826e-08, "loss": 0.715, "step": 50027 }, { "epoch": 0.94, "learning_rate": 4.119631076389185e-08, "loss": 1.0245, "step": 50028 }, { "epoch": 0.94, "learning_rate": 4.1168696669608707e-08, "loss": 0.8636, "step": 50029 }, { "epoch": 0.94, "learning_rate": 4.1141091756526084e-08, "loss": 0.786, "step": 50030 }, { "epoch": 0.94, "learning_rate": 4.111349602474724e-08, "loss": 1.1708, "step": 50031 }, { "epoch": 0.94, "learning_rate": 4.1085909474375127e-08, "loss": 0.8825, "step": 50032 }, { "epoch": 0.94, "learning_rate": 4.1058332105513024e-08, "loss": 0.7548, "step": 50033 }, { "epoch": 0.94, "learning_rate": 4.1030763918263606e-08, "loss": 0.7984, "step": 50034 }, { "epoch": 0.94, "learning_rate": 4.100320491273013e-08, "loss": 0.9095, "step": 50035 }, { "epoch": 0.94, "learning_rate": 4.0975655089015296e-08, "loss": 0.8948, "step": 50036 }, { "epoch": 0.94, "learning_rate": 4.094811444722152e-08, "loss": 1.0509, "step": 50037 }, { "epoch": 0.94, "learning_rate": 4.0920582987452606e-08, "loss": 0.7624, "step": 50038 }, { "epoch": 0.94, "learning_rate": 4.0893060709810414e-08, "loss": 0.9202, "step": 50039 }, { "epoch": 0.94, "learning_rate": 4.08655476143982e-08, "loss": 0.7444, "step": 50040 }, { "epoch": 0.94, "learning_rate": 4.083804370131894e-08, "loss": 0.972, "step": 50041 }, { "epoch": 0.94, "learning_rate": 4.0810548970674766e-08, "loss": 0.938, "step": 50042 }, { "epoch": 0.94, "learning_rate": 4.0783063422568656e-08, "loss": 1.0955, "step": 50043 }, { "epoch": 0.94, "learning_rate": 4.075558705710331e-08, "loss": 1.1277, "step": 50044 }, { "epoch": 0.94, "learning_rate": 4.0728119874381134e-08, "loss": 0.9117, "step": 50045 }, { "epoch": 0.94, "learning_rate": 4.070066187450456e-08, "loss": 0.8875, "step": 50046 }, { "epoch": 0.94, "learning_rate": 4.067321305757654e-08, "loss": 0.7845, "step": 50047 }, { "epoch": 0.94, "learning_rate": 4.064577342369952e-08, "loss": 0.9329, "step": 50048 }, { "epoch": 0.94, "learning_rate": 4.061834297297534e-08, "loss": 0.8147, "step": 50049 }, { "epoch": 0.94, "learning_rate": 4.059092170550699e-08, "loss": 1.2507, "step": 50050 }, { "epoch": 0.94, "learning_rate": 4.056350962139688e-08, "loss": 0.7355, "step": 50051 }, { "epoch": 0.94, "learning_rate": 4.053610672074715e-08, "loss": 0.8123, "step": 50052 }, { "epoch": 0.94, "learning_rate": 4.0508713003660215e-08, "loss": 0.7959, "step": 50053 }, { "epoch": 0.94, "learning_rate": 4.0481328470238224e-08, "loss": 0.6823, "step": 50054 }, { "epoch": 0.94, "learning_rate": 4.045395312058359e-08, "loss": 0.8719, "step": 50055 }, { "epoch": 0.94, "learning_rate": 4.042658695479845e-08, "loss": 1.1043, "step": 50056 }, { "epoch": 0.94, "learning_rate": 4.039922997298523e-08, "loss": 0.9194, "step": 50057 }, { "epoch": 0.94, "learning_rate": 4.037188217524551e-08, "loss": 0.8564, "step": 50058 }, { "epoch": 0.94, "learning_rate": 4.034454356168227e-08, "loss": 0.7601, "step": 50059 }, { "epoch": 0.94, "learning_rate": 4.031721413239653e-08, "loss": 0.724, "step": 50060 }, { "epoch": 0.94, "learning_rate": 4.0289893887490994e-08, "loss": 0.6938, "step": 50061 }, { "epoch": 0.94, "learning_rate": 4.0262582827068077e-08, "loss": 0.8838, "step": 50062 }, { "epoch": 0.94, "learning_rate": 4.0235280951228805e-08, "loss": 0.9626, "step": 50063 }, { "epoch": 0.94, "learning_rate": 4.0207988260075605e-08, "loss": 0.9161, "step": 50064 }, { "epoch": 0.94, "learning_rate": 4.018070475371061e-08, "loss": 1.0768, "step": 50065 }, { "epoch": 0.94, "learning_rate": 4.015343043223513e-08, "loss": 0.716, "step": 50066 }, { "epoch": 0.94, "learning_rate": 4.0126165295751587e-08, "loss": 0.8055, "step": 50067 }, { "epoch": 0.94, "learning_rate": 4.009890934436128e-08, "loss": 1.0335, "step": 50068 }, { "epoch": 0.94, "learning_rate": 4.007166257816664e-08, "loss": 0.9983, "step": 50069 }, { "epoch": 0.94, "learning_rate": 4.00444249972684e-08, "loss": 0.8399, "step": 50070 }, { "epoch": 0.94, "learning_rate": 4.001719660176928e-08, "loss": 0.8765, "step": 50071 }, { "epoch": 0.94, "learning_rate": 3.998997739177029e-08, "loss": 0.9994, "step": 50072 }, { "epoch": 0.94, "learning_rate": 3.996276736737359e-08, "loss": 0.9014, "step": 50073 }, { "epoch": 0.94, "learning_rate": 3.9935566528680195e-08, "loss": 0.8519, "step": 50074 }, { "epoch": 0.94, "learning_rate": 3.990837487579197e-08, "loss": 0.9966, "step": 50075 }, { "epoch": 0.94, "learning_rate": 3.98811924088105e-08, "loss": 0.9626, "step": 50076 }, { "epoch": 0.94, "learning_rate": 3.985401912783737e-08, "loss": 0.9718, "step": 50077 }, { "epoch": 0.94, "learning_rate": 3.98268550329739e-08, "loss": 0.9143, "step": 50078 }, { "epoch": 0.94, "learning_rate": 3.9799700124321384e-08, "loss": 0.9211, "step": 50079 }, { "epoch": 0.94, "learning_rate": 3.9772554401981414e-08, "loss": 0.736, "step": 50080 }, { "epoch": 0.94, "learning_rate": 3.974541786605529e-08, "loss": 1.2123, "step": 50081 }, { "epoch": 0.94, "learning_rate": 3.971829051664433e-08, "loss": 1.0312, "step": 50082 }, { "epoch": 0.94, "learning_rate": 3.9691172353849837e-08, "loss": 0.7873, "step": 50083 }, { "epoch": 0.94, "learning_rate": 3.966406337777312e-08, "loss": 1.0558, "step": 50084 }, { "epoch": 0.94, "learning_rate": 3.9636963588515485e-08, "loss": 0.6855, "step": 50085 }, { "epoch": 0.94, "learning_rate": 3.960987298617769e-08, "loss": 0.9945, "step": 50086 }, { "epoch": 0.94, "learning_rate": 3.958279157086131e-08, "loss": 0.8717, "step": 50087 }, { "epoch": 0.95, "learning_rate": 3.9555719342667384e-08, "loss": 1.2772, "step": 50088 }, { "epoch": 0.95, "learning_rate": 3.952865630169694e-08, "loss": 0.8757, "step": 50089 }, { "epoch": 0.95, "learning_rate": 3.950160244805129e-08, "loss": 0.8936, "step": 50090 }, { "epoch": 0.95, "learning_rate": 3.94745577818309e-08, "loss": 0.6605, "step": 50091 }, { "epoch": 0.95, "learning_rate": 3.944752230313709e-08, "loss": 0.7922, "step": 50092 }, { "epoch": 0.95, "learning_rate": 3.942049601207087e-08, "loss": 0.8132, "step": 50093 }, { "epoch": 0.95, "learning_rate": 3.939347890873302e-08, "loss": 0.8997, "step": 50094 }, { "epoch": 0.95, "learning_rate": 3.936647099322455e-08, "loss": 1.0986, "step": 50095 }, { "epoch": 0.95, "learning_rate": 3.933947226564622e-08, "loss": 0.7084, "step": 50096 }, { "epoch": 0.95, "learning_rate": 3.9312482726098774e-08, "loss": 0.8137, "step": 50097 }, { "epoch": 0.95, "learning_rate": 3.9285502374682985e-08, "loss": 0.8125, "step": 50098 }, { "epoch": 0.95, "learning_rate": 3.925853121150014e-08, "loss": 0.9194, "step": 50099 }, { "epoch": 0.95, "learning_rate": 3.923156923665017e-08, "loss": 1.137, "step": 50100 }, { "epoch": 0.95, "learning_rate": 3.92046164502341e-08, "loss": 0.9722, "step": 50101 }, { "epoch": 0.95, "learning_rate": 3.917767285235241e-08, "loss": 0.7198, "step": 50102 }, { "epoch": 0.95, "learning_rate": 3.915073844310585e-08, "loss": 0.9313, "step": 50103 }, { "epoch": 0.95, "learning_rate": 3.912381322259517e-08, "loss": 0.7837, "step": 50104 }, { "epoch": 0.95, "learning_rate": 3.909689719092058e-08, "loss": 0.7776, "step": 50105 }, { "epoch": 0.95, "learning_rate": 3.906999034818282e-08, "loss": 0.8918, "step": 50106 }, { "epoch": 0.95, "learning_rate": 3.9043092694482086e-08, "loss": 0.8838, "step": 50107 }, { "epoch": 0.95, "learning_rate": 3.901620422991914e-08, "loss": 0.8699, "step": 50108 }, { "epoch": 0.95, "learning_rate": 3.8989324954594455e-08, "loss": 0.8371, "step": 50109 }, { "epoch": 0.95, "learning_rate": 3.896245486860767e-08, "loss": 1.0117, "step": 50110 }, { "epoch": 0.95, "learning_rate": 3.893559397206009e-08, "loss": 0.8926, "step": 50111 }, { "epoch": 0.95, "learning_rate": 3.890874226505137e-08, "loss": 0.9997, "step": 50112 }, { "epoch": 0.95, "learning_rate": 3.8881899747681695e-08, "loss": 0.9793, "step": 50113 }, { "epoch": 0.95, "learning_rate": 3.8855066420051825e-08, "loss": 0.8378, "step": 50114 }, { "epoch": 0.95, "learning_rate": 3.882824228226167e-08, "loss": 1.0089, "step": 50115 }, { "epoch": 0.95, "learning_rate": 3.880142733441117e-08, "loss": 0.8763, "step": 50116 }, { "epoch": 0.95, "learning_rate": 3.877462157660106e-08, "loss": 0.8379, "step": 50117 }, { "epoch": 0.95, "learning_rate": 3.874782500893098e-08, "loss": 1.1492, "step": 50118 }, { "epoch": 0.95, "learning_rate": 3.872103763150059e-08, "loss": 0.9648, "step": 50119 }, { "epoch": 0.95, "learning_rate": 3.8694259444410906e-08, "loss": 0.7997, "step": 50120 }, { "epoch": 0.95, "learning_rate": 3.8667490447761305e-08, "loss": 0.832, "step": 50121 }, { "epoch": 0.95, "learning_rate": 3.864073064165169e-08, "loss": 0.9491, "step": 50122 }, { "epoch": 0.95, "learning_rate": 3.8613980026182e-08, "loss": 1.0253, "step": 50123 }, { "epoch": 0.95, "learning_rate": 3.8587238601452417e-08, "loss": 0.9965, "step": 50124 }, { "epoch": 0.95, "learning_rate": 3.856050636756259e-08, "loss": 1.2424, "step": 50125 }, { "epoch": 0.95, "learning_rate": 3.853378332461244e-08, "loss": 0.971, "step": 50126 }, { "epoch": 0.95, "learning_rate": 3.8507069472701606e-08, "loss": 0.798, "step": 50127 }, { "epoch": 0.95, "learning_rate": 3.848036481192974e-08, "loss": 1.0585, "step": 50128 }, { "epoch": 0.95, "learning_rate": 3.845366934239703e-08, "loss": 0.9263, "step": 50129 }, { "epoch": 0.95, "learning_rate": 3.8426983064202836e-08, "loss": 0.8672, "step": 50130 }, { "epoch": 0.95, "learning_rate": 3.8400305977446263e-08, "loss": 1.2067, "step": 50131 }, { "epoch": 0.95, "learning_rate": 3.8373638082228047e-08, "loss": 0.9832, "step": 50132 }, { "epoch": 0.95, "learning_rate": 3.834697937864729e-08, "loss": 0.9027, "step": 50133 }, { "epoch": 0.95, "learning_rate": 3.8320329866803064e-08, "loss": 0.7044, "step": 50134 }, { "epoch": 0.95, "learning_rate": 3.82936895467953e-08, "loss": 0.9433, "step": 50135 }, { "epoch": 0.95, "learning_rate": 3.826705841872336e-08, "loss": 0.8229, "step": 50136 }, { "epoch": 0.95, "learning_rate": 3.8240436482686884e-08, "loss": 1.21, "step": 50137 }, { "epoch": 0.95, "learning_rate": 3.821382373878524e-08, "loss": 1.0905, "step": 50138 }, { "epoch": 0.95, "learning_rate": 3.818722018711779e-08, "loss": 0.8781, "step": 50139 }, { "epoch": 0.95, "learning_rate": 3.8160625827783346e-08, "loss": 0.8716, "step": 50140 }, { "epoch": 0.95, "learning_rate": 3.8134040660881835e-08, "loss": 0.888, "step": 50141 }, { "epoch": 0.95, "learning_rate": 3.810746468651233e-08, "loss": 0.6698, "step": 50142 }, { "epoch": 0.95, "learning_rate": 3.80808979047742e-08, "loss": 1.0292, "step": 50143 }, { "epoch": 0.95, "learning_rate": 3.8054340315766266e-08, "loss": 1.0337, "step": 50144 }, { "epoch": 0.95, "learning_rate": 3.8027791919588166e-08, "loss": 1.0685, "step": 50145 }, { "epoch": 0.95, "learning_rate": 3.80012527163387e-08, "loss": 0.9274, "step": 50146 }, { "epoch": 0.95, "learning_rate": 3.797472270611724e-08, "loss": 0.9633, "step": 50147 }, { "epoch": 0.95, "learning_rate": 3.79482018890226e-08, "loss": 0.938, "step": 50148 }, { "epoch": 0.95, "learning_rate": 3.792169026515358e-08, "loss": 0.887, "step": 50149 }, { "epoch": 0.95, "learning_rate": 3.7895187834609826e-08, "loss": 1.056, "step": 50150 }, { "epoch": 0.95, "learning_rate": 3.7868694597489876e-08, "loss": 0.9174, "step": 50151 }, { "epoch": 0.95, "learning_rate": 3.7842210553892536e-08, "loss": 0.8864, "step": 50152 }, { "epoch": 0.95, "learning_rate": 3.7815735703917166e-08, "loss": 0.8037, "step": 50153 }, { "epoch": 0.95, "learning_rate": 3.778927004766231e-08, "loss": 0.8075, "step": 50154 }, { "epoch": 0.95, "learning_rate": 3.7762813585226765e-08, "loss": 0.8751, "step": 50155 }, { "epoch": 0.95, "learning_rate": 3.773636631670935e-08, "loss": 0.6883, "step": 50156 }, { "epoch": 0.95, "learning_rate": 3.770992824220887e-08, "loss": 0.9889, "step": 50157 }, { "epoch": 0.95, "learning_rate": 3.768349936182386e-08, "loss": 0.7463, "step": 50158 }, { "epoch": 0.95, "learning_rate": 3.7657079675653406e-08, "loss": 0.9302, "step": 50159 }, { "epoch": 0.95, "learning_rate": 3.763066918379604e-08, "loss": 0.9594, "step": 50160 }, { "epoch": 0.95, "learning_rate": 3.760426788634974e-08, "loss": 0.7781, "step": 50161 }, { "epoch": 0.95, "learning_rate": 3.757787578341415e-08, "loss": 0.8574, "step": 50162 }, { "epoch": 0.95, "learning_rate": 3.755149287508697e-08, "loss": 0.9498, "step": 50163 }, { "epoch": 0.95, "learning_rate": 3.752511916146701e-08, "loss": 0.8858, "step": 50164 }, { "epoch": 0.95, "learning_rate": 3.749875464265307e-08, "loss": 1.069, "step": 50165 }, { "epoch": 0.95, "learning_rate": 3.747239931874286e-08, "loss": 0.795, "step": 50166 }, { "epoch": 0.95, "learning_rate": 3.7446053189835466e-08, "loss": 0.8232, "step": 50167 }, { "epoch": 0.95, "learning_rate": 3.741971625602886e-08, "loss": 1.0538, "step": 50168 }, { "epoch": 0.95, "learning_rate": 3.7393388517421856e-08, "loss": 0.9681, "step": 50169 }, { "epoch": 0.95, "learning_rate": 3.736706997411188e-08, "loss": 0.7216, "step": 50170 }, { "epoch": 0.95, "learning_rate": 3.734076062619801e-08, "loss": 0.7478, "step": 50171 }, { "epoch": 0.95, "learning_rate": 3.7314460473778516e-08, "loss": 0.7851, "step": 50172 }, { "epoch": 0.95, "learning_rate": 3.72881695169508e-08, "loss": 0.7217, "step": 50173 }, { "epoch": 0.95, "learning_rate": 3.7261887755813964e-08, "loss": 0.7807, "step": 50174 }, { "epoch": 0.95, "learning_rate": 3.7235615190465704e-08, "loss": 0.9995, "step": 50175 }, { "epoch": 0.95, "learning_rate": 3.720935182100399e-08, "loss": 0.9756, "step": 50176 }, { "epoch": 0.95, "learning_rate": 3.7183097647527086e-08, "loss": 1.0934, "step": 50177 }, { "epoch": 0.95, "learning_rate": 3.715685267013297e-08, "loss": 0.8925, "step": 50178 }, { "epoch": 0.95, "learning_rate": 3.7130616888919613e-08, "loss": 0.7509, "step": 50179 }, { "epoch": 0.95, "learning_rate": 3.7104390303984995e-08, "loss": 0.9489, "step": 50180 }, { "epoch": 0.95, "learning_rate": 3.707817291542737e-08, "loss": 1.1895, "step": 50181 }, { "epoch": 0.95, "learning_rate": 3.705196472334388e-08, "loss": 0.9794, "step": 50182 }, { "epoch": 0.95, "learning_rate": 3.702576572783334e-08, "loss": 0.8235, "step": 50183 }, { "epoch": 0.95, "learning_rate": 3.6999575928992895e-08, "loss": 0.8363, "step": 50184 }, { "epoch": 0.95, "learning_rate": 3.6973395326920234e-08, "loss": 0.8369, "step": 50185 }, { "epoch": 0.95, "learning_rate": 3.694722392171363e-08, "loss": 0.8687, "step": 50186 }, { "epoch": 0.95, "learning_rate": 3.692106171347048e-08, "loss": 0.8885, "step": 50187 }, { "epoch": 0.95, "learning_rate": 3.689490870228879e-08, "loss": 0.7472, "step": 50188 }, { "epoch": 0.95, "learning_rate": 3.6868764888265686e-08, "loss": 0.8369, "step": 50189 }, { "epoch": 0.95, "learning_rate": 3.6842630271499427e-08, "loss": 0.8322, "step": 50190 }, { "epoch": 0.95, "learning_rate": 3.6816504852086874e-08, "loss": 0.9297, "step": 50191 }, { "epoch": 0.95, "learning_rate": 3.67903886301263e-08, "loss": 0.8953, "step": 50192 }, { "epoch": 0.95, "learning_rate": 3.6764281605714827e-08, "loss": 1.0908, "step": 50193 }, { "epoch": 0.95, "learning_rate": 3.673818377894961e-08, "loss": 0.9677, "step": 50194 }, { "epoch": 0.95, "learning_rate": 3.6712095149929185e-08, "loss": 0.8991, "step": 50195 }, { "epoch": 0.95, "learning_rate": 3.668601571874986e-08, "loss": 0.8682, "step": 50196 }, { "epoch": 0.95, "learning_rate": 3.665994548550933e-08, "loss": 0.9145, "step": 50197 }, { "epoch": 0.95, "learning_rate": 3.66338844503053e-08, "loss": 0.6026, "step": 50198 }, { "epoch": 0.95, "learning_rate": 3.660783261323464e-08, "loss": 0.8504, "step": 50199 }, { "epoch": 0.95, "learning_rate": 3.6581789974394765e-08, "loss": 1.2319, "step": 50200 }, { "epoch": 0.95, "learning_rate": 3.65557565338831e-08, "loss": 0.9031, "step": 50201 }, { "epoch": 0.95, "learning_rate": 3.652973229179679e-08, "loss": 0.7455, "step": 50202 }, { "epoch": 0.95, "learning_rate": 3.650371724823243e-08, "loss": 1.0656, "step": 50203 }, { "epoch": 0.95, "learning_rate": 3.647771140328826e-08, "loss": 0.8734, "step": 50204 }, { "epoch": 0.95, "learning_rate": 3.645171475706061e-08, "loss": 0.5931, "step": 50205 }, { "epoch": 0.95, "learning_rate": 3.6425727309646606e-08, "loss": 1.0041, "step": 50206 }, { "epoch": 0.95, "learning_rate": 3.639974906114341e-08, "loss": 0.8459, "step": 50207 }, { "epoch": 0.95, "learning_rate": 3.6373780011647876e-08, "loss": 0.7437, "step": 50208 }, { "epoch": 0.95, "learning_rate": 3.634782016125743e-08, "loss": 0.9099, "step": 50209 }, { "epoch": 0.95, "learning_rate": 3.6321869510068385e-08, "loss": 0.6026, "step": 50210 }, { "epoch": 0.95, "learning_rate": 3.6295928058178445e-08, "loss": 1.0113, "step": 50211 }, { "epoch": 0.95, "learning_rate": 3.6269995805683355e-08, "loss": 1.0893, "step": 50212 }, { "epoch": 0.95, "learning_rate": 3.624407275268083e-08, "loss": 0.7822, "step": 50213 }, { "epoch": 0.95, "learning_rate": 3.621815889926744e-08, "loss": 0.8128, "step": 50214 }, { "epoch": 0.95, "learning_rate": 3.6192254245539796e-08, "loss": 0.9553, "step": 50215 }, { "epoch": 0.95, "learning_rate": 3.616635879159503e-08, "loss": 0.7716, "step": 50216 }, { "epoch": 0.95, "learning_rate": 3.614047253752917e-08, "loss": 0.8359, "step": 50217 }, { "epoch": 0.95, "learning_rate": 3.611459548343937e-08, "loss": 1.0029, "step": 50218 }, { "epoch": 0.95, "learning_rate": 3.6088727629422224e-08, "loss": 0.9993, "step": 50219 }, { "epoch": 0.95, "learning_rate": 3.6062868975574036e-08, "loss": 1.0283, "step": 50220 }, { "epoch": 0.95, "learning_rate": 3.603701952199168e-08, "loss": 0.8997, "step": 50221 }, { "epoch": 0.95, "learning_rate": 3.6011179268771454e-08, "loss": 0.8304, "step": 50222 }, { "epoch": 0.95, "learning_rate": 3.598534821601024e-08, "loss": 0.7784, "step": 50223 }, { "epoch": 0.95, "learning_rate": 3.595952636380379e-08, "loss": 1.1149, "step": 50224 }, { "epoch": 0.95, "learning_rate": 3.593371371224924e-08, "loss": 1.1215, "step": 50225 }, { "epoch": 0.95, "learning_rate": 3.590791026144236e-08, "loss": 0.9237, "step": 50226 }, { "epoch": 0.95, "learning_rate": 3.5882116011480004e-08, "loss": 1.027, "step": 50227 }, { "epoch": 0.95, "learning_rate": 3.585633096245794e-08, "loss": 0.9795, "step": 50228 }, { "epoch": 0.95, "learning_rate": 3.5830555114473034e-08, "loss": 0.7332, "step": 50229 }, { "epoch": 0.95, "learning_rate": 3.580478846762131e-08, "loss": 0.8667, "step": 50230 }, { "epoch": 0.95, "learning_rate": 3.5779031021999086e-08, "loss": 1.1628, "step": 50231 }, { "epoch": 0.95, "learning_rate": 3.57532827777024e-08, "loss": 0.992, "step": 50232 }, { "epoch": 0.95, "learning_rate": 3.5727543734827006e-08, "loss": 0.7574, "step": 50233 }, { "epoch": 0.95, "learning_rate": 3.570181389346949e-08, "loss": 0.8001, "step": 50234 }, { "epoch": 0.95, "learning_rate": 3.567609325372617e-08, "loss": 0.8636, "step": 50235 }, { "epoch": 0.95, "learning_rate": 3.565038181569253e-08, "loss": 0.8219, "step": 50236 }, { "epoch": 0.95, "learning_rate": 3.562467957946486e-08, "loss": 0.9949, "step": 50237 }, { "epoch": 0.95, "learning_rate": 3.559898654513921e-08, "loss": 0.9334, "step": 50238 }, { "epoch": 0.95, "learning_rate": 3.557330271281134e-08, "loss": 0.6861, "step": 50239 }, { "epoch": 0.95, "learning_rate": 3.5547628082577e-08, "loss": 0.9455, "step": 50240 }, { "epoch": 0.95, "learning_rate": 3.552196265453223e-08, "loss": 0.8762, "step": 50241 }, { "epoch": 0.95, "learning_rate": 3.5496306428773055e-08, "loss": 0.7734, "step": 50242 }, { "epoch": 0.95, "learning_rate": 3.547065940539524e-08, "loss": 0.9693, "step": 50243 }, { "epoch": 0.95, "learning_rate": 3.544502158449425e-08, "loss": 1.0308, "step": 50244 }, { "epoch": 0.95, "learning_rate": 3.541939296616587e-08, "loss": 0.8961, "step": 50245 }, { "epoch": 0.95, "learning_rate": 3.5393773550506104e-08, "loss": 0.8657, "step": 50246 }, { "epoch": 0.95, "learning_rate": 3.536816333761045e-08, "loss": 0.9253, "step": 50247 }, { "epoch": 0.95, "learning_rate": 3.534256232757438e-08, "loss": 0.6383, "step": 50248 }, { "epoch": 0.95, "learning_rate": 3.5316970520493655e-08, "loss": 1.1205, "step": 50249 }, { "epoch": 0.95, "learning_rate": 3.529138791646375e-08, "loss": 1.1596, "step": 50250 }, { "epoch": 0.95, "learning_rate": 3.526581451558014e-08, "loss": 0.924, "step": 50251 }, { "epoch": 0.95, "learning_rate": 3.52402503179386e-08, "loss": 0.8908, "step": 50252 }, { "epoch": 0.95, "learning_rate": 3.521469532363459e-08, "loss": 1.0178, "step": 50253 }, { "epoch": 0.95, "learning_rate": 3.5189149532762756e-08, "loss": 1.0115, "step": 50254 }, { "epoch": 0.95, "learning_rate": 3.516361294541942e-08, "loss": 0.7885, "step": 50255 }, { "epoch": 0.95, "learning_rate": 3.5138085561699785e-08, "loss": 1.0778, "step": 50256 }, { "epoch": 0.95, "learning_rate": 3.511256738169849e-08, "loss": 1.165, "step": 50257 }, { "epoch": 0.95, "learning_rate": 3.508705840551158e-08, "loss": 0.7291, "step": 50258 }, { "epoch": 0.95, "learning_rate": 3.506155863323396e-08, "loss": 0.7702, "step": 50259 }, { "epoch": 0.95, "learning_rate": 3.503606806496085e-08, "loss": 0.803, "step": 50260 }, { "epoch": 0.95, "learning_rate": 3.5010586700787443e-08, "loss": 0.8501, "step": 50261 }, { "epoch": 0.95, "learning_rate": 3.498511454080922e-08, "loss": 1.0162, "step": 50262 }, { "epoch": 0.95, "learning_rate": 3.4959651585120826e-08, "loss": 0.8257, "step": 50263 }, { "epoch": 0.95, "learning_rate": 3.493419783381746e-08, "loss": 0.8784, "step": 50264 }, { "epoch": 0.95, "learning_rate": 3.490875328699433e-08, "loss": 0.8898, "step": 50265 }, { "epoch": 0.95, "learning_rate": 3.4883317944746086e-08, "loss": 0.6733, "step": 50266 }, { "epoch": 0.95, "learning_rate": 3.48578918071682e-08, "loss": 0.9097, "step": 50267 }, { "epoch": 0.95, "learning_rate": 3.4832474874355315e-08, "loss": 1.1782, "step": 50268 }, { "epoch": 0.95, "learning_rate": 3.480706714640236e-08, "loss": 0.8058, "step": 50269 }, { "epoch": 0.95, "learning_rate": 3.4781668623404265e-08, "loss": 0.967, "step": 50270 }, { "epoch": 0.95, "learning_rate": 3.475627930545566e-08, "loss": 0.8648, "step": 50271 }, { "epoch": 0.95, "learning_rate": 3.473089919265177e-08, "loss": 0.9337, "step": 50272 }, { "epoch": 0.95, "learning_rate": 3.470552828508694e-08, "loss": 0.7779, "step": 50273 }, { "epoch": 0.95, "learning_rate": 3.468016658285611e-08, "loss": 0.9434, "step": 50274 }, { "epoch": 0.95, "learning_rate": 3.4654814086053924e-08, "loss": 1.0046, "step": 50275 }, { "epoch": 0.95, "learning_rate": 3.462947079477502e-08, "loss": 0.8832, "step": 50276 }, { "epoch": 0.95, "learning_rate": 3.460413670911433e-08, "loss": 1.082, "step": 50277 }, { "epoch": 0.95, "learning_rate": 3.457881182916595e-08, "loss": 0.8786, "step": 50278 }, { "epoch": 0.95, "learning_rate": 3.4553496155025066e-08, "loss": 0.6138, "step": 50279 }, { "epoch": 0.95, "learning_rate": 3.4528189686785504e-08, "loss": 1.1121, "step": 50280 }, { "epoch": 0.95, "learning_rate": 3.450289242454219e-08, "loss": 1.0773, "step": 50281 }, { "epoch": 0.95, "learning_rate": 3.4477604368389484e-08, "loss": 0.9127, "step": 50282 }, { "epoch": 0.95, "learning_rate": 3.445232551842176e-08, "loss": 0.9085, "step": 50283 }, { "epoch": 0.95, "learning_rate": 3.442705587473338e-08, "loss": 0.9833, "step": 50284 }, { "epoch": 0.95, "learning_rate": 3.440179543741873e-08, "loss": 0.7849, "step": 50285 }, { "epoch": 0.95, "learning_rate": 3.437654420657271e-08, "loss": 0.6403, "step": 50286 }, { "epoch": 0.95, "learning_rate": 3.4351302182288324e-08, "loss": 0.9796, "step": 50287 }, { "epoch": 0.95, "learning_rate": 3.432606936466104e-08, "loss": 1.0831, "step": 50288 }, { "epoch": 0.95, "learning_rate": 3.4300845753784676e-08, "loss": 0.8933, "step": 50289 }, { "epoch": 0.95, "learning_rate": 3.427563134975303e-08, "loss": 0.791, "step": 50290 }, { "epoch": 0.95, "learning_rate": 3.425042615266078e-08, "loss": 1.0077, "step": 50291 }, { "epoch": 0.95, "learning_rate": 3.422523016260171e-08, "loss": 0.8003, "step": 50292 }, { "epoch": 0.95, "learning_rate": 3.42000433796702e-08, "loss": 0.8752, "step": 50293 }, { "epoch": 0.95, "learning_rate": 3.4174865803960065e-08, "loss": 0.7437, "step": 50294 }, { "epoch": 0.95, "learning_rate": 3.4149697435565396e-08, "loss": 0.905, "step": 50295 }, { "epoch": 0.95, "learning_rate": 3.412453827458001e-08, "loss": 0.8049, "step": 50296 }, { "epoch": 0.95, "learning_rate": 3.409938832109799e-08, "loss": 0.9223, "step": 50297 }, { "epoch": 0.95, "learning_rate": 3.4074247575213716e-08, "loss": 0.7119, "step": 50298 }, { "epoch": 0.95, "learning_rate": 3.404911603701988e-08, "loss": 0.8023, "step": 50299 }, { "epoch": 0.95, "learning_rate": 3.402399370661169e-08, "loss": 1.1094, "step": 50300 }, { "epoch": 0.95, "learning_rate": 3.399888058408185e-08, "loss": 0.731, "step": 50301 }, { "epoch": 0.95, "learning_rate": 3.3973776669524724e-08, "loss": 0.8412, "step": 50302 }, { "epoch": 0.95, "learning_rate": 3.394868196303386e-08, "loss": 0.8313, "step": 50303 }, { "epoch": 0.95, "learning_rate": 3.392359646470306e-08, "loss": 0.8546, "step": 50304 }, { "epoch": 0.95, "learning_rate": 3.389852017462586e-08, "loss": 0.7778, "step": 50305 }, { "epoch": 0.95, "learning_rate": 3.387345309289608e-08, "loss": 0.9814, "step": 50306 }, { "epoch": 0.95, "learning_rate": 3.384839521960726e-08, "loss": 0.7648, "step": 50307 }, { "epoch": 0.95, "learning_rate": 3.382334655485264e-08, "loss": 0.9287, "step": 50308 }, { "epoch": 0.95, "learning_rate": 3.379830709872661e-08, "loss": 0.9451, "step": 50309 }, { "epoch": 0.95, "learning_rate": 3.377327685132159e-08, "loss": 0.7694, "step": 50310 }, { "epoch": 0.95, "learning_rate": 3.374825581273167e-08, "loss": 0.9658, "step": 50311 }, { "epoch": 0.95, "learning_rate": 3.3723243983050105e-08, "loss": 1.1682, "step": 50312 }, { "epoch": 0.95, "learning_rate": 3.3698241362370154e-08, "loss": 0.9605, "step": 50313 }, { "epoch": 0.95, "learning_rate": 3.367324795078564e-08, "loss": 0.9019, "step": 50314 }, { "epoch": 0.95, "learning_rate": 3.3648263748389534e-08, "loss": 0.9429, "step": 50315 }, { "epoch": 0.95, "learning_rate": 3.362328875527537e-08, "loss": 0.8647, "step": 50316 }, { "epoch": 0.95, "learning_rate": 3.359832297153587e-08, "loss": 1.0451, "step": 50317 }, { "epoch": 0.95, "learning_rate": 3.357336639726455e-08, "loss": 0.9718, "step": 50318 }, { "epoch": 0.95, "learning_rate": 3.3548419032555236e-08, "loss": 1.1412, "step": 50319 }, { "epoch": 0.95, "learning_rate": 3.352348087750007e-08, "loss": 0.8556, "step": 50320 }, { "epoch": 0.95, "learning_rate": 3.3498551932192594e-08, "loss": 0.9372, "step": 50321 }, { "epoch": 0.95, "learning_rate": 3.3473632196726057e-08, "loss": 0.9273, "step": 50322 }, { "epoch": 0.95, "learning_rate": 3.3448721671193173e-08, "loss": 0.7924, "step": 50323 }, { "epoch": 0.95, "learning_rate": 3.34238203556872e-08, "loss": 0.8423, "step": 50324 }, { "epoch": 0.95, "learning_rate": 3.339892825030111e-08, "loss": 1.0261, "step": 50325 }, { "epoch": 0.95, "learning_rate": 3.337404535512789e-08, "loss": 0.7584, "step": 50326 }, { "epoch": 0.95, "learning_rate": 3.334917167025997e-08, "loss": 0.9202, "step": 50327 }, { "epoch": 0.95, "learning_rate": 3.332430719579116e-08, "loss": 0.8553, "step": 50328 }, { "epoch": 0.95, "learning_rate": 3.329945193181333e-08, "loss": 0.8452, "step": 50329 }, { "epoch": 0.95, "learning_rate": 3.327460587842002e-08, "loss": 0.9289, "step": 50330 }, { "epoch": 0.95, "learning_rate": 3.324976903570337e-08, "loss": 1.0734, "step": 50331 }, { "epoch": 0.95, "learning_rate": 3.322494140375665e-08, "loss": 1.0557, "step": 50332 }, { "epoch": 0.95, "learning_rate": 3.3200122982672276e-08, "loss": 0.8716, "step": 50333 }, { "epoch": 0.95, "learning_rate": 3.317531377254324e-08, "loss": 0.9213, "step": 50334 }, { "epoch": 0.95, "learning_rate": 3.315051377346168e-08, "loss": 0.9387, "step": 50335 }, { "epoch": 0.95, "learning_rate": 3.312572298552058e-08, "loss": 0.9665, "step": 50336 }, { "epoch": 0.95, "learning_rate": 3.310094140881237e-08, "loss": 1.0455, "step": 50337 }, { "epoch": 0.95, "learning_rate": 3.307616904342975e-08, "loss": 0.7097, "step": 50338 }, { "epoch": 0.95, "learning_rate": 3.3051405889464596e-08, "loss": 0.7797, "step": 50339 }, { "epoch": 0.95, "learning_rate": 3.3026651947010436e-08, "loss": 0.8044, "step": 50340 }, { "epoch": 0.95, "learning_rate": 3.300190721615887e-08, "loss": 0.969, "step": 50341 }, { "epoch": 0.95, "learning_rate": 3.29771716970026e-08, "loss": 0.9199, "step": 50342 }, { "epoch": 0.95, "learning_rate": 3.295244538963377e-08, "loss": 0.8896, "step": 50343 }, { "epoch": 0.95, "learning_rate": 3.292772829414509e-08, "loss": 0.8925, "step": 50344 }, { "epoch": 0.95, "learning_rate": 3.290302041062843e-08, "loss": 0.8257, "step": 50345 }, { "epoch": 0.95, "learning_rate": 3.287832173917649e-08, "loss": 0.6793, "step": 50346 }, { "epoch": 0.95, "learning_rate": 3.2853632279881146e-08, "loss": 0.8159, "step": 50347 }, { "epoch": 0.95, "learning_rate": 3.282895203283454e-08, "loss": 0.8344, "step": 50348 }, { "epoch": 0.95, "learning_rate": 3.2804280998129103e-08, "loss": 0.7245, "step": 50349 }, { "epoch": 0.95, "learning_rate": 3.277961917585698e-08, "loss": 0.9755, "step": 50350 }, { "epoch": 0.95, "learning_rate": 3.275496656610977e-08, "loss": 0.8407, "step": 50351 }, { "epoch": 0.95, "learning_rate": 3.273032316898017e-08, "loss": 0.8617, "step": 50352 }, { "epoch": 0.95, "learning_rate": 3.270568898455978e-08, "loss": 0.9403, "step": 50353 }, { "epoch": 0.95, "learning_rate": 3.2681064012940745e-08, "loss": 0.8365, "step": 50354 }, { "epoch": 0.95, "learning_rate": 3.265644825421493e-08, "loss": 0.8968, "step": 50355 }, { "epoch": 0.95, "learning_rate": 3.26318417084745e-08, "loss": 0.833, "step": 50356 }, { "epoch": 0.95, "learning_rate": 3.2607244375810473e-08, "loss": 0.9099, "step": 50357 }, { "epoch": 0.95, "learning_rate": 3.2582656256316125e-08, "loss": 0.8134, "step": 50358 }, { "epoch": 0.95, "learning_rate": 3.255807735008193e-08, "loss": 0.8197, "step": 50359 }, { "epoch": 0.95, "learning_rate": 3.2533507657200314e-08, "loss": 0.8953, "step": 50360 }, { "epoch": 0.95, "learning_rate": 3.250894717776315e-08, "loss": 1.0486, "step": 50361 }, { "epoch": 0.95, "learning_rate": 3.248439591186176e-08, "loss": 1.0086, "step": 50362 }, { "epoch": 0.95, "learning_rate": 3.2459853859588275e-08, "loss": 1.0015, "step": 50363 }, { "epoch": 0.95, "learning_rate": 3.243532102103375e-08, "loss": 0.8626, "step": 50364 }, { "epoch": 0.95, "learning_rate": 3.241079739629005e-08, "loss": 0.8832, "step": 50365 }, { "epoch": 0.95, "learning_rate": 3.238628298544877e-08, "loss": 0.7124, "step": 50366 }, { "epoch": 0.95, "learning_rate": 3.23617777886015e-08, "loss": 0.8027, "step": 50367 }, { "epoch": 0.95, "learning_rate": 3.2337281805839836e-08, "loss": 0.8534, "step": 50368 }, { "epoch": 0.95, "learning_rate": 3.2312795037254816e-08, "loss": 0.8546, "step": 50369 }, { "epoch": 0.95, "learning_rate": 3.228831748293859e-08, "loss": 1.0107, "step": 50370 }, { "epoch": 0.95, "learning_rate": 3.226384914298192e-08, "loss": 0.8611, "step": 50371 }, { "epoch": 0.95, "learning_rate": 3.2239390017476116e-08, "loss": 0.9055, "step": 50372 }, { "epoch": 0.95, "learning_rate": 3.221494010651305e-08, "loss": 0.7816, "step": 50373 }, { "epoch": 0.95, "learning_rate": 3.219049941018376e-08, "loss": 1.2037, "step": 50374 }, { "epoch": 0.95, "learning_rate": 3.2166067928579294e-08, "loss": 1.0341, "step": 50375 }, { "epoch": 0.95, "learning_rate": 3.214164566179123e-08, "loss": 0.8842, "step": 50376 }, { "epoch": 0.95, "learning_rate": 3.2117232609910623e-08, "loss": 0.7577, "step": 50377 }, { "epoch": 0.95, "learning_rate": 3.2092828773028214e-08, "loss": 0.9991, "step": 50378 }, { "epoch": 0.95, "learning_rate": 3.206843415123589e-08, "loss": 0.7188, "step": 50379 }, { "epoch": 0.95, "learning_rate": 3.2044048744624415e-08, "loss": 0.7154, "step": 50380 }, { "epoch": 0.95, "learning_rate": 3.2019672553284257e-08, "loss": 1.0973, "step": 50381 }, { "epoch": 0.95, "learning_rate": 3.1995305577307565e-08, "loss": 0.7994, "step": 50382 }, { "epoch": 0.95, "learning_rate": 3.197094781678456e-08, "loss": 0.7654, "step": 50383 }, { "epoch": 0.95, "learning_rate": 3.1946599271806265e-08, "loss": 1.0079, "step": 50384 }, { "epoch": 0.95, "learning_rate": 3.192225994246373e-08, "loss": 0.7964, "step": 50385 }, { "epoch": 0.95, "learning_rate": 3.189792982884798e-08, "loss": 0.9078, "step": 50386 }, { "epoch": 0.95, "learning_rate": 3.1873608931049515e-08, "loss": 1.0869, "step": 50387 }, { "epoch": 0.95, "learning_rate": 3.184929724915936e-08, "loss": 0.9034, "step": 50388 }, { "epoch": 0.95, "learning_rate": 3.182499478326828e-08, "loss": 1.0141, "step": 50389 }, { "epoch": 0.95, "learning_rate": 3.180070153346676e-08, "loss": 0.8492, "step": 50390 }, { "epoch": 0.95, "learning_rate": 3.177641749984611e-08, "loss": 1.0837, "step": 50391 }, { "epoch": 0.95, "learning_rate": 3.1752142682496543e-08, "loss": 0.9233, "step": 50392 }, { "epoch": 0.95, "learning_rate": 3.172787708150854e-08, "loss": 1.1459, "step": 50393 }, { "epoch": 0.95, "learning_rate": 3.1703620696973135e-08, "loss": 0.8826, "step": 50394 }, { "epoch": 0.95, "learning_rate": 3.1679373528980816e-08, "loss": 0.7383, "step": 50395 }, { "epoch": 0.95, "learning_rate": 3.165513557762206e-08, "loss": 0.6998, "step": 50396 }, { "epoch": 0.95, "learning_rate": 3.1630906842987085e-08, "loss": 0.9535, "step": 50397 }, { "epoch": 0.95, "learning_rate": 3.160668732516692e-08, "loss": 0.7432, "step": 50398 }, { "epoch": 0.95, "learning_rate": 3.158247702425149e-08, "loss": 1.1321, "step": 50399 }, { "epoch": 0.95, "learning_rate": 3.1558275940331564e-08, "loss": 0.9281, "step": 50400 }, { "epoch": 0.95, "learning_rate": 3.1534084073497337e-08, "loss": 0.9433, "step": 50401 }, { "epoch": 0.95, "learning_rate": 3.150990142383875e-08, "loss": 0.9538, "step": 50402 }, { "epoch": 0.95, "learning_rate": 3.148572799144711e-08, "loss": 0.8456, "step": 50403 }, { "epoch": 0.95, "learning_rate": 3.14615637764118e-08, "loss": 0.7543, "step": 50404 }, { "epoch": 0.95, "learning_rate": 3.1437408778823286e-08, "loss": 0.8742, "step": 50405 }, { "epoch": 0.95, "learning_rate": 3.141326299877179e-08, "loss": 1.0264, "step": 50406 }, { "epoch": 0.95, "learning_rate": 3.1389126436347505e-08, "loss": 0.9183, "step": 50407 }, { "epoch": 0.95, "learning_rate": 3.1364999091640646e-08, "loss": 0.8033, "step": 50408 }, { "epoch": 0.95, "learning_rate": 3.1340880964741136e-08, "loss": 0.7977, "step": 50409 }, { "epoch": 0.95, "learning_rate": 3.1316772055739184e-08, "loss": 0.8032, "step": 50410 }, { "epoch": 0.95, "learning_rate": 3.129267236472444e-08, "loss": 1.04, "step": 50411 }, { "epoch": 0.95, "learning_rate": 3.1268581891787385e-08, "loss": 1.0073, "step": 50412 }, { "epoch": 0.95, "learning_rate": 3.124450063701767e-08, "loss": 0.9265, "step": 50413 }, { "epoch": 0.95, "learning_rate": 3.1220428600505505e-08, "loss": 0.9008, "step": 50414 }, { "epoch": 0.95, "learning_rate": 3.1196365782340254e-08, "loss": 0.7656, "step": 50415 }, { "epoch": 0.95, "learning_rate": 3.117231218261213e-08, "loss": 0.959, "step": 50416 }, { "epoch": 0.95, "learning_rate": 3.1148267801411056e-08, "loss": 0.8346, "step": 50417 }, { "epoch": 0.95, "learning_rate": 3.1124232638826415e-08, "loss": 1.0033, "step": 50418 }, { "epoch": 0.95, "learning_rate": 3.11002066949484e-08, "loss": 0.8922, "step": 50419 }, { "epoch": 0.95, "learning_rate": 3.107618996986639e-08, "loss": 0.7833, "step": 50420 }, { "epoch": 0.95, "learning_rate": 3.105218246367031e-08, "loss": 0.8867, "step": 50421 }, { "epoch": 0.95, "learning_rate": 3.102818417644982e-08, "loss": 1.0479, "step": 50422 }, { "epoch": 0.95, "learning_rate": 3.1004195108294e-08, "loss": 0.8922, "step": 50423 }, { "epoch": 0.95, "learning_rate": 3.0980215259293067e-08, "loss": 0.9523, "step": 50424 }, { "epoch": 0.95, "learning_rate": 3.0956244629536116e-08, "loss": 1.1204, "step": 50425 }, { "epoch": 0.95, "learning_rate": 3.0932283219113066e-08, "loss": 0.7666, "step": 50426 }, { "epoch": 0.95, "learning_rate": 3.090833102811303e-08, "loss": 0.9543, "step": 50427 }, { "epoch": 0.95, "learning_rate": 3.088438805662563e-08, "loss": 0.8443, "step": 50428 }, { "epoch": 0.95, "learning_rate": 3.086045430474027e-08, "loss": 0.6887, "step": 50429 }, { "epoch": 0.95, "learning_rate": 3.0836529772546033e-08, "loss": 0.8752, "step": 50430 }, { "epoch": 0.95, "learning_rate": 3.0812614460132836e-08, "loss": 0.9428, "step": 50431 }, { "epoch": 0.95, "learning_rate": 3.0788708367589513e-08, "loss": 0.9586, "step": 50432 }, { "epoch": 0.95, "learning_rate": 3.076481149500543e-08, "loss": 0.8567, "step": 50433 }, { "epoch": 0.95, "learning_rate": 3.0740923842469685e-08, "loss": 0.739, "step": 50434 }, { "epoch": 0.95, "learning_rate": 3.0717045410071924e-08, "loss": 0.7928, "step": 50435 }, { "epoch": 0.95, "learning_rate": 3.0693176197900684e-08, "loss": 0.7569, "step": 50436 }, { "epoch": 0.95, "learning_rate": 3.066931620604563e-08, "loss": 1.0497, "step": 50437 }, { "epoch": 0.95, "learning_rate": 3.0645465434595565e-08, "loss": 1.0492, "step": 50438 }, { "epoch": 0.95, "learning_rate": 3.06216238836396e-08, "loss": 1.0026, "step": 50439 }, { "epoch": 0.95, "learning_rate": 3.059779155326681e-08, "loss": 0.8386, "step": 50440 }, { "epoch": 0.95, "learning_rate": 3.0573968443566024e-08, "loss": 0.7716, "step": 50441 }, { "epoch": 0.95, "learning_rate": 3.055015455462662e-08, "loss": 0.7459, "step": 50442 }, { "epoch": 0.95, "learning_rate": 3.052634988653686e-08, "loss": 0.8029, "step": 50443 }, { "epoch": 0.95, "learning_rate": 3.05025544393861e-08, "loss": 1.0207, "step": 50444 }, { "epoch": 0.95, "learning_rate": 3.047876821326318e-08, "loss": 0.9294, "step": 50445 }, { "epoch": 0.95, "learning_rate": 3.04549912082569e-08, "loss": 0.8938, "step": 50446 }, { "epoch": 0.95, "learning_rate": 3.043122342445581e-08, "loss": 0.8619, "step": 50447 }, { "epoch": 0.95, "learning_rate": 3.040746486194901e-08, "loss": 0.8224, "step": 50448 }, { "epoch": 0.95, "learning_rate": 3.038371552082475e-08, "loss": 0.913, "step": 50449 }, { "epoch": 0.95, "learning_rate": 3.035997540117214e-08, "loss": 1.1227, "step": 50450 }, { "epoch": 0.95, "learning_rate": 3.033624450307943e-08, "loss": 0.9512, "step": 50451 }, { "epoch": 0.95, "learning_rate": 3.031252282663599e-08, "loss": 0.7851, "step": 50452 }, { "epoch": 0.95, "learning_rate": 3.028881037192927e-08, "loss": 0.8949, "step": 50453 }, { "epoch": 0.95, "learning_rate": 3.02651071390489e-08, "loss": 0.8962, "step": 50454 }, { "epoch": 0.95, "learning_rate": 3.02414131280826e-08, "loss": 0.9503, "step": 50455 }, { "epoch": 0.95, "learning_rate": 3.021772833911918e-08, "loss": 1.044, "step": 50456 }, { "epoch": 0.95, "learning_rate": 3.019405277224691e-08, "loss": 0.8139, "step": 50457 }, { "epoch": 0.95, "learning_rate": 3.01703864275546e-08, "loss": 0.9858, "step": 50458 }, { "epoch": 0.95, "learning_rate": 3.014672930513024e-08, "loss": 0.9047, "step": 50459 }, { "epoch": 0.95, "learning_rate": 3.0123081405062094e-08, "loss": 0.6915, "step": 50460 }, { "epoch": 0.95, "learning_rate": 3.0099442727438975e-08, "loss": 0.9027, "step": 50461 }, { "epoch": 0.95, "learning_rate": 3.007581327234832e-08, "loss": 1.0994, "step": 50462 }, { "epoch": 0.95, "learning_rate": 3.00521930398795e-08, "loss": 0.861, "step": 50463 }, { "epoch": 0.95, "learning_rate": 3.002858203011966e-08, "loss": 0.843, "step": 50464 }, { "epoch": 0.95, "learning_rate": 3.000498024315707e-08, "loss": 0.9427, "step": 50465 }, { "epoch": 0.95, "learning_rate": 2.998138767908082e-08, "loss": 0.8332, "step": 50466 }, { "epoch": 0.95, "learning_rate": 2.995780433797779e-08, "loss": 0.8549, "step": 50467 }, { "epoch": 0.95, "learning_rate": 2.99342302199368e-08, "loss": 1.043, "step": 50468 }, { "epoch": 0.95, "learning_rate": 2.991066532504583e-08, "loss": 1.126, "step": 50469 }, { "epoch": 0.95, "learning_rate": 2.988710965339231e-08, "loss": 0.7668, "step": 50470 }, { "epoch": 0.95, "learning_rate": 2.986356320506478e-08, "loss": 0.9119, "step": 50471 }, { "epoch": 0.95, "learning_rate": 2.9840025980151235e-08, "loss": 0.7228, "step": 50472 }, { "epoch": 0.95, "learning_rate": 2.981649797873909e-08, "loss": 0.7985, "step": 50473 }, { "epoch": 0.95, "learning_rate": 2.979297920091606e-08, "loss": 0.9916, "step": 50474 }, { "epoch": 0.95, "learning_rate": 2.9769469646770967e-08, "loss": 1.1218, "step": 50475 }, { "epoch": 0.95, "learning_rate": 2.97459693163904e-08, "loss": 0.8747, "step": 50476 }, { "epoch": 0.95, "learning_rate": 2.9722478209862905e-08, "loss": 0.965, "step": 50477 }, { "epoch": 0.95, "learning_rate": 2.9698996327275907e-08, "loss": 0.8275, "step": 50478 }, { "epoch": 0.95, "learning_rate": 2.967552366871712e-08, "loss": 0.7292, "step": 50479 }, { "epoch": 0.95, "learning_rate": 2.9652060234273973e-08, "loss": 1.0295, "step": 50480 }, { "epoch": 0.95, "learning_rate": 2.9628606024034444e-08, "loss": 1.1113, "step": 50481 }, { "epoch": 0.95, "learning_rate": 2.960516103808625e-08, "loss": 0.8803, "step": 50482 }, { "epoch": 0.95, "learning_rate": 2.9581725276515982e-08, "loss": 0.9342, "step": 50483 }, { "epoch": 0.95, "learning_rate": 2.955829873941246e-08, "loss": 0.829, "step": 50484 }, { "epoch": 0.95, "learning_rate": 2.953488142686228e-08, "loss": 0.769, "step": 50485 }, { "epoch": 0.95, "learning_rate": 2.9511473338952877e-08, "loss": 0.9785, "step": 50486 }, { "epoch": 0.95, "learning_rate": 2.9488074475772232e-08, "loss": 0.9896, "step": 50487 }, { "epoch": 0.95, "learning_rate": 2.9464684837406942e-08, "loss": 1.0942, "step": 50488 }, { "epoch": 0.95, "learning_rate": 2.944130442394527e-08, "loss": 0.7449, "step": 50489 }, { "epoch": 0.95, "learning_rate": 2.941793323547354e-08, "loss": 0.8103, "step": 50490 }, { "epoch": 0.95, "learning_rate": 2.939457127207973e-08, "loss": 0.8386, "step": 50491 }, { "epoch": 0.95, "learning_rate": 2.9371218533850997e-08, "loss": 0.8244, "step": 50492 }, { "epoch": 0.95, "learning_rate": 2.9347875020874216e-08, "loss": 0.8131, "step": 50493 }, { "epoch": 0.95, "learning_rate": 2.9324540733236816e-08, "loss": 1.0796, "step": 50494 }, { "epoch": 0.95, "learning_rate": 2.9301215671025673e-08, "loss": 0.8156, "step": 50495 }, { "epoch": 0.95, "learning_rate": 2.9277899834328217e-08, "loss": 0.6401, "step": 50496 }, { "epoch": 0.95, "learning_rate": 2.9254593223231042e-08, "loss": 0.9438, "step": 50497 }, { "epoch": 0.95, "learning_rate": 2.923129583782186e-08, "loss": 0.8196, "step": 50498 }, { "epoch": 0.95, "learning_rate": 2.920800767818699e-08, "loss": 0.9706, "step": 50499 }, { "epoch": 0.95, "learning_rate": 2.918472874441358e-08, "loss": 1.0209, "step": 50500 }, { "epoch": 0.95, "learning_rate": 2.9161459036588792e-08, "loss": 0.9467, "step": 50501 }, { "epoch": 0.95, "learning_rate": 2.913819855479921e-08, "loss": 0.9165, "step": 50502 }, { "epoch": 0.95, "learning_rate": 2.911494729913228e-08, "loss": 0.7915, "step": 50503 }, { "epoch": 0.95, "learning_rate": 2.9091705269673753e-08, "loss": 0.8052, "step": 50504 }, { "epoch": 0.95, "learning_rate": 2.9068472466511622e-08, "loss": 0.9849, "step": 50505 }, { "epoch": 0.95, "learning_rate": 2.904524888973165e-08, "loss": 1.1162, "step": 50506 }, { "epoch": 0.95, "learning_rate": 2.9022034539420986e-08, "loss": 1.0558, "step": 50507 }, { "epoch": 0.95, "learning_rate": 2.899882941566651e-08, "loss": 0.8543, "step": 50508 }, { "epoch": 0.95, "learning_rate": 2.8975633518554536e-08, "loss": 0.835, "step": 50509 }, { "epoch": 0.95, "learning_rate": 2.8952446848171667e-08, "loss": 0.7324, "step": 50510 }, { "epoch": 0.95, "learning_rate": 2.8929269404604776e-08, "loss": 0.8071, "step": 50511 }, { "epoch": 0.95, "learning_rate": 2.8906101187940183e-08, "loss": 1.0358, "step": 50512 }, { "epoch": 0.95, "learning_rate": 2.8882942198264485e-08, "loss": 0.924, "step": 50513 }, { "epoch": 0.95, "learning_rate": 2.8859792435664003e-08, "loss": 0.9316, "step": 50514 }, { "epoch": 0.95, "learning_rate": 2.8836651900225333e-08, "loss": 0.6947, "step": 50515 }, { "epoch": 0.95, "learning_rate": 2.8813520592034795e-08, "loss": 0.8989, "step": 50516 }, { "epoch": 0.95, "learning_rate": 2.8790398511178987e-08, "loss": 0.9892, "step": 50517 }, { "epoch": 0.95, "learning_rate": 2.8767285657743672e-08, "loss": 1.1285, "step": 50518 }, { "epoch": 0.95, "learning_rate": 2.8744182031816004e-08, "loss": 0.9169, "step": 50519 }, { "epoch": 0.95, "learning_rate": 2.872108763348147e-08, "loss": 0.816, "step": 50520 }, { "epoch": 0.95, "learning_rate": 2.8698002462826668e-08, "loss": 0.9161, "step": 50521 }, { "epoch": 0.95, "learning_rate": 2.8674926519937917e-08, "loss": 0.8849, "step": 50522 }, { "epoch": 0.95, "learning_rate": 2.8651859804900985e-08, "loss": 0.6874, "step": 50523 }, { "epoch": 0.95, "learning_rate": 2.862880231780246e-08, "loss": 0.7574, "step": 50524 }, { "epoch": 0.95, "learning_rate": 2.860575405872812e-08, "loss": 0.8483, "step": 50525 }, { "epoch": 0.95, "learning_rate": 2.8582715027764275e-08, "loss": 1.0648, "step": 50526 }, { "epoch": 0.95, "learning_rate": 2.8559685224996413e-08, "loss": 0.9085, "step": 50527 }, { "epoch": 0.95, "learning_rate": 2.8536664650511137e-08, "loss": 0.8581, "step": 50528 }, { "epoch": 0.95, "learning_rate": 2.8513653304394205e-08, "loss": 0.8039, "step": 50529 }, { "epoch": 0.95, "learning_rate": 2.849065118673139e-08, "loss": 0.6881, "step": 50530 }, { "epoch": 0.95, "learning_rate": 2.8467658297609e-08, "loss": 1.0783, "step": 50531 }, { "epoch": 0.95, "learning_rate": 2.844467463711226e-08, "loss": 0.9649, "step": 50532 }, { "epoch": 0.95, "learning_rate": 2.8421700205327475e-08, "loss": 0.6515, "step": 50533 }, { "epoch": 0.95, "learning_rate": 2.839873500234014e-08, "loss": 0.6128, "step": 50534 }, { "epoch": 0.95, "learning_rate": 2.8375779028236294e-08, "loss": 0.9486, "step": 50535 }, { "epoch": 0.95, "learning_rate": 2.8352832283101706e-08, "loss": 0.7015, "step": 50536 }, { "epoch": 0.95, "learning_rate": 2.8329894767021304e-08, "loss": 1.1615, "step": 50537 }, { "epoch": 0.95, "learning_rate": 2.8306966480081965e-08, "loss": 0.7537, "step": 50538 }, { "epoch": 0.95, "learning_rate": 2.8284047422368342e-08, "loss": 0.9417, "step": 50539 }, { "epoch": 0.95, "learning_rate": 2.8261137593966202e-08, "loss": 0.8946, "step": 50540 }, { "epoch": 0.95, "learning_rate": 2.823823699496103e-08, "loss": 0.903, "step": 50541 }, { "epoch": 0.95, "learning_rate": 2.8215345625438874e-08, "loss": 0.8497, "step": 50542 }, { "epoch": 0.95, "learning_rate": 2.8192463485484657e-08, "loss": 0.8659, "step": 50543 }, { "epoch": 0.95, "learning_rate": 2.816959057518387e-08, "loss": 0.9661, "step": 50544 }, { "epoch": 0.95, "learning_rate": 2.8146726894622278e-08, "loss": 1.0811, "step": 50545 }, { "epoch": 0.95, "learning_rate": 2.8123872443884813e-08, "loss": 0.7909, "step": 50546 }, { "epoch": 0.95, "learning_rate": 2.8101027223057243e-08, "loss": 1.0038, "step": 50547 }, { "epoch": 0.95, "learning_rate": 2.8078191232224495e-08, "loss": 0.9541, "step": 50548 }, { "epoch": 0.95, "learning_rate": 2.805536447147178e-08, "loss": 0.7255, "step": 50549 }, { "epoch": 0.95, "learning_rate": 2.8032546940885142e-08, "loss": 1.098, "step": 50550 }, { "epoch": 0.95, "learning_rate": 2.8009738640548678e-08, "loss": 0.9662, "step": 50551 }, { "epoch": 0.95, "learning_rate": 2.798693957054843e-08, "loss": 0.8717, "step": 50552 }, { "epoch": 0.95, "learning_rate": 2.7964149730968783e-08, "loss": 0.8667, "step": 50553 }, { "epoch": 0.95, "learning_rate": 2.794136912189521e-08, "loss": 0.8451, "step": 50554 }, { "epoch": 0.95, "learning_rate": 2.791859774341321e-08, "loss": 0.9554, "step": 50555 }, { "epoch": 0.95, "learning_rate": 2.7895835595606878e-08, "loss": 1.1748, "step": 50556 }, { "epoch": 0.95, "learning_rate": 2.787308267856198e-08, "loss": 0.9655, "step": 50557 }, { "epoch": 0.95, "learning_rate": 2.7850338992363168e-08, "loss": 1.0293, "step": 50558 }, { "epoch": 0.95, "learning_rate": 2.7827604537095097e-08, "loss": 0.9696, "step": 50559 }, { "epoch": 0.95, "learning_rate": 2.780487931284326e-08, "loss": 0.8563, "step": 50560 }, { "epoch": 0.95, "learning_rate": 2.7782163319692025e-08, "loss": 0.8382, "step": 50561 }, { "epoch": 0.95, "learning_rate": 2.7759456557726605e-08, "loss": 1.0206, "step": 50562 }, { "epoch": 0.95, "learning_rate": 2.773675902703138e-08, "loss": 1.0522, "step": 50563 }, { "epoch": 0.95, "learning_rate": 2.7714070727691555e-08, "loss": 0.9736, "step": 50564 }, { "epoch": 0.95, "learning_rate": 2.7691391659791234e-08, "loss": 0.8154, "step": 50565 }, { "epoch": 0.95, "learning_rate": 2.76687218234159e-08, "loss": 0.8566, "step": 50566 }, { "epoch": 0.95, "learning_rate": 2.7646061218649377e-08, "loss": 0.8624, "step": 50567 }, { "epoch": 0.95, "learning_rate": 2.76234098455766e-08, "loss": 1.0174, "step": 50568 }, { "epoch": 0.95, "learning_rate": 2.7600767704282493e-08, "loss": 0.8833, "step": 50569 }, { "epoch": 0.95, "learning_rate": 2.7578134794851165e-08, "loss": 1.0336, "step": 50570 }, { "epoch": 0.95, "learning_rate": 2.7555511117367263e-08, "loss": 0.8316, "step": 50571 }, { "epoch": 0.95, "learning_rate": 2.7532896671915442e-08, "loss": 0.9636, "step": 50572 }, { "epoch": 0.95, "learning_rate": 2.751029145857981e-08, "loss": 0.8864, "step": 50573 }, { "epoch": 0.95, "learning_rate": 2.748769547744501e-08, "loss": 0.8531, "step": 50574 }, { "epoch": 0.95, "learning_rate": 2.7465108728595145e-08, "loss": 0.9939, "step": 50575 }, { "epoch": 0.95, "learning_rate": 2.7442531212115154e-08, "loss": 0.9268, "step": 50576 }, { "epoch": 0.95, "learning_rate": 2.7419962928088572e-08, "loss": 0.7188, "step": 50577 }, { "epoch": 0.95, "learning_rate": 2.7397403876600336e-08, "loss": 0.7395, "step": 50578 }, { "epoch": 0.95, "learning_rate": 2.7374854057734267e-08, "loss": 0.7991, "step": 50579 }, { "epoch": 0.95, "learning_rate": 2.7352313471574466e-08, "loss": 0.744, "step": 50580 }, { "epoch": 0.95, "learning_rate": 2.7329782118205582e-08, "loss": 1.0538, "step": 50581 }, { "epoch": 0.95, "learning_rate": 2.7307259997711444e-08, "loss": 1.0223, "step": 50582 }, { "epoch": 0.95, "learning_rate": 2.7284747110176148e-08, "loss": 0.9226, "step": 50583 }, { "epoch": 0.95, "learning_rate": 2.726224345568379e-08, "loss": 0.861, "step": 50584 }, { "epoch": 0.95, "learning_rate": 2.7239749034318473e-08, "loss": 0.9268, "step": 50585 }, { "epoch": 0.95, "learning_rate": 2.7217263846163745e-08, "loss": 0.8544, "step": 50586 }, { "epoch": 0.95, "learning_rate": 2.7194787891304254e-08, "loss": 1.1723, "step": 50587 }, { "epoch": 0.95, "learning_rate": 2.7172321169823822e-08, "loss": 0.8527, "step": 50588 }, { "epoch": 0.95, "learning_rate": 2.7149863681805444e-08, "loss": 0.7522, "step": 50589 }, { "epoch": 0.95, "learning_rate": 2.7127415427334324e-08, "loss": 0.9084, "step": 50590 }, { "epoch": 0.95, "learning_rate": 2.7104976406493456e-08, "loss": 0.7682, "step": 50591 }, { "epoch": 0.95, "learning_rate": 2.7082546619366657e-08, "loss": 0.7893, "step": 50592 }, { "epoch": 0.95, "learning_rate": 2.7060126066037752e-08, "loss": 1.1462, "step": 50593 }, { "epoch": 0.95, "learning_rate": 2.703771474659056e-08, "loss": 0.9224, "step": 50594 }, { "epoch": 0.95, "learning_rate": 2.7015312661108905e-08, "loss": 0.8184, "step": 50595 }, { "epoch": 0.95, "learning_rate": 2.6992919809676054e-08, "loss": 1.0938, "step": 50596 }, { "epoch": 0.95, "learning_rate": 2.6970536192376106e-08, "loss": 0.8137, "step": 50597 }, { "epoch": 0.95, "learning_rate": 2.6948161809291772e-08, "loss": 0.8073, "step": 50598 }, { "epoch": 0.95, "learning_rate": 2.692579666050771e-08, "loss": 0.9173, "step": 50599 }, { "epoch": 0.95, "learning_rate": 2.6903440746106623e-08, "loss": 0.9305, "step": 50600 }, { "epoch": 0.95, "learning_rate": 2.6881094066172342e-08, "loss": 0.8723, "step": 50601 }, { "epoch": 0.95, "learning_rate": 2.6858756620788406e-08, "loss": 0.8236, "step": 50602 }, { "epoch": 0.95, "learning_rate": 2.6836428410037807e-08, "loss": 0.7962, "step": 50603 }, { "epoch": 0.95, "learning_rate": 2.6814109434004366e-08, "loss": 1.0212, "step": 50604 }, { "epoch": 0.95, "learning_rate": 2.6791799692770792e-08, "loss": 0.9961, "step": 50605 }, { "epoch": 0.95, "learning_rate": 2.6769499186421466e-08, "loss": 0.7836, "step": 50606 }, { "epoch": 0.95, "learning_rate": 2.6747207915038266e-08, "loss": 0.9521, "step": 50607 }, { "epoch": 0.95, "learning_rate": 2.6724925878705844e-08, "loss": 0.7378, "step": 50608 }, { "epoch": 0.95, "learning_rate": 2.6702653077506356e-08, "loss": 0.8958, "step": 50609 }, { "epoch": 0.95, "learning_rate": 2.6680389511523074e-08, "loss": 0.8666, "step": 50610 }, { "epoch": 0.95, "learning_rate": 2.6658135180839817e-08, "loss": 0.7367, "step": 50611 }, { "epoch": 0.95, "learning_rate": 2.6635890085539018e-08, "loss": 0.8689, "step": 50612 }, { "epoch": 0.95, "learning_rate": 2.6613654225704222e-08, "loss": 0.8816, "step": 50613 }, { "epoch": 0.95, "learning_rate": 2.6591427601417864e-08, "loss": 0.9398, "step": 50614 }, { "epoch": 0.95, "learning_rate": 2.6569210212763485e-08, "loss": 0.7993, "step": 50615 }, { "epoch": 0.95, "learning_rate": 2.65470020598238e-08, "loss": 0.6623, "step": 50616 }, { "epoch": 0.95, "learning_rate": 2.6524803142681798e-08, "loss": 0.9719, "step": 50617 }, { "epoch": 0.96, "learning_rate": 2.6502613461420468e-08, "loss": 1.1083, "step": 50618 }, { "epoch": 0.96, "learning_rate": 2.6480433016122242e-08, "loss": 0.7595, "step": 50619 }, { "epoch": 0.96, "learning_rate": 2.645826180687039e-08, "loss": 0.8058, "step": 50620 }, { "epoch": 0.96, "learning_rate": 2.643609983374762e-08, "loss": 0.8991, "step": 50621 }, { "epoch": 0.96, "learning_rate": 2.6413947096836645e-08, "loss": 0.7734, "step": 50622 }, { "epoch": 0.96, "learning_rate": 2.63918035962199e-08, "loss": 0.8688, "step": 50623 }, { "epoch": 0.96, "learning_rate": 2.636966933198065e-08, "loss": 0.8643, "step": 50624 }, { "epoch": 0.96, "learning_rate": 2.6347544304200778e-08, "loss": 1.1864, "step": 50625 }, { "epoch": 0.96, "learning_rate": 2.6325428512963547e-08, "loss": 0.9118, "step": 50626 }, { "epoch": 0.96, "learning_rate": 2.630332195835167e-08, "loss": 0.7621, "step": 50627 }, { "epoch": 0.96, "learning_rate": 2.6281224640446744e-08, "loss": 0.6625, "step": 50628 }, { "epoch": 0.96, "learning_rate": 2.625913655933232e-08, "loss": 0.9635, "step": 50629 }, { "epoch": 0.96, "learning_rate": 2.6237057715090275e-08, "loss": 0.6983, "step": 50630 }, { "epoch": 0.96, "learning_rate": 2.621498810780304e-08, "loss": 1.0419, "step": 50631 }, { "epoch": 0.96, "learning_rate": 2.619292773755361e-08, "loss": 1.0221, "step": 50632 }, { "epoch": 0.96, "learning_rate": 2.6170876604423577e-08, "loss": 1.025, "step": 50633 }, { "epoch": 0.96, "learning_rate": 2.6148834708495664e-08, "loss": 1.0767, "step": 50634 }, { "epoch": 0.96, "learning_rate": 2.6126802049852296e-08, "loss": 0.8521, "step": 50635 }, { "epoch": 0.96, "learning_rate": 2.6104778628575633e-08, "loss": 0.8836, "step": 50636 }, { "epoch": 0.96, "learning_rate": 2.608276444474783e-08, "loss": 0.9969, "step": 50637 }, { "epoch": 0.96, "learning_rate": 2.606075949845105e-08, "loss": 0.9267, "step": 50638 }, { "epoch": 0.96, "learning_rate": 2.603876378976772e-08, "loss": 0.759, "step": 50639 }, { "epoch": 0.96, "learning_rate": 2.601677731877944e-08, "loss": 0.8995, "step": 50640 }, { "epoch": 0.96, "learning_rate": 2.5994800085568927e-08, "loss": 0.9452, "step": 50641 }, { "epoch": 0.96, "learning_rate": 2.5972832090218058e-08, "loss": 0.698, "step": 50642 }, { "epoch": 0.96, "learning_rate": 2.5950873332808712e-08, "loss": 1.2578, "step": 50643 }, { "epoch": 0.96, "learning_rate": 2.5928923813422768e-08, "loss": 1.1078, "step": 50644 }, { "epoch": 0.96, "learning_rate": 2.5906983532142384e-08, "loss": 0.843, "step": 50645 }, { "epoch": 0.96, "learning_rate": 2.5885052489049712e-08, "loss": 0.973, "step": 50646 }, { "epoch": 0.96, "learning_rate": 2.5863130684226078e-08, "loss": 0.6169, "step": 50647 }, { "epoch": 0.96, "learning_rate": 2.5841218117753918e-08, "loss": 0.8172, "step": 50648 }, { "epoch": 0.96, "learning_rate": 2.5819314789714557e-08, "loss": 1.1677, "step": 50649 }, { "epoch": 0.96, "learning_rate": 2.5797420700190423e-08, "loss": 1.1235, "step": 50650 }, { "epoch": 0.96, "learning_rate": 2.577553584926257e-08, "loss": 0.8333, "step": 50651 }, { "epoch": 0.96, "learning_rate": 2.5753660237012866e-08, "loss": 0.805, "step": 50652 }, { "epoch": 0.96, "learning_rate": 2.573179386352348e-08, "loss": 0.8727, "step": 50653 }, { "epoch": 0.96, "learning_rate": 2.570993672887545e-08, "loss": 0.9202, "step": 50654 }, { "epoch": 0.96, "learning_rate": 2.568808883315066e-08, "loss": 1.0732, "step": 50655 }, { "epoch": 0.96, "learning_rate": 2.5666250176430706e-08, "loss": 1.1006, "step": 50656 }, { "epoch": 0.96, "learning_rate": 2.5644420758797194e-08, "loss": 0.9954, "step": 50657 }, { "epoch": 0.96, "learning_rate": 2.5622600580331447e-08, "loss": 1.1037, "step": 50658 }, { "epoch": 0.96, "learning_rate": 2.5600789641115063e-08, "loss": 0.8254, "step": 50659 }, { "epoch": 0.96, "learning_rate": 2.5578987941229648e-08, "loss": 0.8233, "step": 50660 }, { "epoch": 0.96, "learning_rate": 2.5557195480756248e-08, "loss": 0.9905, "step": 50661 }, { "epoch": 0.96, "learning_rate": 2.553541225977646e-08, "loss": 0.9816, "step": 50662 }, { "epoch": 0.96, "learning_rate": 2.551363827837161e-08, "loss": 0.7823, "step": 50663 }, { "epoch": 0.96, "learning_rate": 2.5491873536623023e-08, "loss": 0.8911, "step": 50664 }, { "epoch": 0.96, "learning_rate": 2.5470118034611745e-08, "loss": 0.9494, "step": 50665 }, { "epoch": 0.96, "learning_rate": 2.5448371772419102e-08, "loss": 0.9351, "step": 50666 }, { "epoch": 0.96, "learning_rate": 2.542663475012641e-08, "loss": 0.9172, "step": 50667 }, { "epoch": 0.96, "learning_rate": 2.5404906967815003e-08, "loss": 1.0385, "step": 50668 }, { "epoch": 0.96, "learning_rate": 2.538318842556592e-08, "loss": 0.9266, "step": 50669 }, { "epoch": 0.96, "learning_rate": 2.5361479123459653e-08, "loss": 0.8138, "step": 50670 }, { "epoch": 0.96, "learning_rate": 2.5339779061578084e-08, "loss": 0.7384, "step": 50671 }, { "epoch": 0.96, "learning_rate": 2.5318088240001704e-08, "loss": 0.8704, "step": 50672 }, { "epoch": 0.96, "learning_rate": 2.5296406658811834e-08, "loss": 0.8716, "step": 50673 }, { "epoch": 0.96, "learning_rate": 2.5274734318089245e-08, "loss": 1.0139, "step": 50674 }, { "epoch": 0.96, "learning_rate": 2.5253071217914982e-08, "loss": 0.912, "step": 50675 }, { "epoch": 0.96, "learning_rate": 2.5231417358369813e-08, "loss": 0.8552, "step": 50676 }, { "epoch": 0.96, "learning_rate": 2.5209772739534787e-08, "loss": 0.9281, "step": 50677 }, { "epoch": 0.96, "learning_rate": 2.5188137361490396e-08, "loss": 0.7522, "step": 50678 }, { "epoch": 0.96, "learning_rate": 2.516651122431768e-08, "loss": 1.0343, "step": 50679 }, { "epoch": 0.96, "learning_rate": 2.5144894328097412e-08, "loss": 0.7601, "step": 50680 }, { "epoch": 0.96, "learning_rate": 2.5123286672910364e-08, "loss": 1.0196, "step": 50681 }, { "epoch": 0.96, "learning_rate": 2.5101688258836743e-08, "loss": 0.869, "step": 50682 }, { "epoch": 0.96, "learning_rate": 2.5080099085957875e-08, "loss": 0.7248, "step": 50683 }, { "epoch": 0.96, "learning_rate": 2.505851915435398e-08, "loss": 0.8406, "step": 50684 }, { "epoch": 0.96, "learning_rate": 2.5036948464105536e-08, "loss": 0.7632, "step": 50685 }, { "epoch": 0.96, "learning_rate": 2.5015387015293326e-08, "loss": 0.9774, "step": 50686 }, { "epoch": 0.96, "learning_rate": 2.4993834807997552e-08, "loss": 1.031, "step": 50687 }, { "epoch": 0.96, "learning_rate": 2.497229184229899e-08, "loss": 0.9714, "step": 50688 }, { "epoch": 0.96, "learning_rate": 2.4950758118278127e-08, "loss": 0.975, "step": 50689 }, { "epoch": 0.96, "learning_rate": 2.492923363601546e-08, "loss": 0.9102, "step": 50690 }, { "epoch": 0.96, "learning_rate": 2.490771839559064e-08, "loss": 0.7206, "step": 50691 }, { "epoch": 0.96, "learning_rate": 2.4886212397084996e-08, "loss": 0.8738, "step": 50692 }, { "epoch": 0.96, "learning_rate": 2.4864715640578185e-08, "loss": 0.9629, "step": 50693 }, { "epoch": 0.96, "learning_rate": 2.484322812615042e-08, "loss": 1.1298, "step": 50694 }, { "epoch": 0.96, "learning_rate": 2.482174985388247e-08, "loss": 0.7067, "step": 50695 }, { "epoch": 0.96, "learning_rate": 2.4800280823853994e-08, "loss": 0.8918, "step": 50696 }, { "epoch": 0.96, "learning_rate": 2.4778821036145486e-08, "loss": 0.9189, "step": 50697 }, { "epoch": 0.96, "learning_rate": 2.4757370490836876e-08, "loss": 0.9839, "step": 50698 }, { "epoch": 0.96, "learning_rate": 2.4735929188008377e-08, "loss": 0.7321, "step": 50699 }, { "epoch": 0.96, "learning_rate": 2.4714497127739932e-08, "loss": 1.0967, "step": 50700 }, { "epoch": 0.96, "learning_rate": 2.4693074310112032e-08, "loss": 0.9807, "step": 50701 }, { "epoch": 0.96, "learning_rate": 2.467166073520405e-08, "loss": 0.6497, "step": 50702 }, { "epoch": 0.96, "learning_rate": 2.465025640309593e-08, "loss": 0.9236, "step": 50703 }, { "epoch": 0.96, "learning_rate": 2.4628861313868436e-08, "loss": 0.7963, "step": 50704 }, { "epoch": 0.96, "learning_rate": 2.4607475467600395e-08, "loss": 1.1049, "step": 50705 }, { "epoch": 0.96, "learning_rate": 2.4586098864372298e-08, "loss": 1.0601, "step": 50706 }, { "epoch": 0.96, "learning_rate": 2.4564731504263806e-08, "loss": 0.8236, "step": 50707 }, { "epoch": 0.96, "learning_rate": 2.454337338735485e-08, "loss": 0.8556, "step": 50708 }, { "epoch": 0.96, "learning_rate": 2.4522024513724818e-08, "loss": 0.92, "step": 50709 }, { "epoch": 0.96, "learning_rate": 2.450068488345364e-08, "loss": 0.6512, "step": 50710 }, { "epoch": 0.96, "learning_rate": 2.4479354496621254e-08, "loss": 0.9542, "step": 50711 }, { "epoch": 0.96, "learning_rate": 2.4458033353306763e-08, "loss": 1.216, "step": 50712 }, { "epoch": 0.96, "learning_rate": 2.4436721453590384e-08, "loss": 0.9327, "step": 50713 }, { "epoch": 0.96, "learning_rate": 2.4415418797551216e-08, "loss": 0.8173, "step": 50714 }, { "epoch": 0.96, "learning_rate": 2.439412538526892e-08, "loss": 0.8091, "step": 50715 }, { "epoch": 0.96, "learning_rate": 2.437284121682315e-08, "loss": 0.897, "step": 50716 }, { "epoch": 0.96, "learning_rate": 2.4351566292293295e-08, "loss": 0.7425, "step": 50717 }, { "epoch": 0.96, "learning_rate": 2.433030061175873e-08, "loss": 1.1148, "step": 50718 }, { "epoch": 0.96, "learning_rate": 2.4309044175298835e-08, "loss": 0.9861, "step": 50719 }, { "epoch": 0.96, "learning_rate": 2.4287796982993273e-08, "loss": 1.1104, "step": 50720 }, { "epoch": 0.96, "learning_rate": 2.4266559034920865e-08, "loss": 0.8703, "step": 50721 }, { "epoch": 0.96, "learning_rate": 2.4245330331161555e-08, "loss": 0.8175, "step": 50722 }, { "epoch": 0.96, "learning_rate": 2.422411087179416e-08, "loss": 0.8777, "step": 50723 }, { "epoch": 0.96, "learning_rate": 2.4202900656897787e-08, "loss": 0.8987, "step": 50724 }, { "epoch": 0.96, "learning_rate": 2.4181699686552094e-08, "loss": 1.1486, "step": 50725 }, { "epoch": 0.96, "learning_rate": 2.4160507960836187e-08, "loss": 0.9732, "step": 50726 }, { "epoch": 0.96, "learning_rate": 2.4139325479828613e-08, "loss": 0.8929, "step": 50727 }, { "epoch": 0.96, "learning_rate": 2.4118152243609306e-08, "loss": 0.8917, "step": 50728 }, { "epoch": 0.96, "learning_rate": 2.4096988252256537e-08, "loss": 0.7531, "step": 50729 }, { "epoch": 0.96, "learning_rate": 2.4075833505849965e-08, "loss": 0.8942, "step": 50730 }, { "epoch": 0.96, "learning_rate": 2.405468800446814e-08, "loss": 0.8965, "step": 50731 }, { "epoch": 0.96, "learning_rate": 2.4033551748190444e-08, "loss": 0.9651, "step": 50732 }, { "epoch": 0.96, "learning_rate": 2.401242473709542e-08, "loss": 0.9019, "step": 50733 }, { "epoch": 0.96, "learning_rate": 2.3991306971262175e-08, "loss": 0.9153, "step": 50734 }, { "epoch": 0.96, "learning_rate": 2.3970198450769255e-08, "loss": 0.8456, "step": 50735 }, { "epoch": 0.96, "learning_rate": 2.3949099175695766e-08, "loss": 1.0069, "step": 50736 }, { "epoch": 0.96, "learning_rate": 2.3928009146120536e-08, "loss": 1.0123, "step": 50737 }, { "epoch": 0.96, "learning_rate": 2.3906928362122107e-08, "loss": 0.9819, "step": 50738 }, { "epoch": 0.96, "learning_rate": 2.388585682377931e-08, "loss": 1.0223, "step": 50739 }, { "epoch": 0.96, "learning_rate": 2.3864794531170688e-08, "loss": 0.7754, "step": 50740 }, { "epoch": 0.96, "learning_rate": 2.384374148437507e-08, "loss": 0.8853, "step": 50741 }, { "epoch": 0.96, "learning_rate": 2.3822697683471286e-08, "loss": 0.8285, "step": 50742 }, { "epoch": 0.96, "learning_rate": 2.380166312853732e-08, "loss": 1.3413, "step": 50743 }, { "epoch": 0.96, "learning_rate": 2.3780637819652286e-08, "loss": 1.0288, "step": 50744 }, { "epoch": 0.96, "learning_rate": 2.3759621756893892e-08, "loss": 0.8719, "step": 50745 }, { "epoch": 0.96, "learning_rate": 2.3738614940341797e-08, "loss": 0.8209, "step": 50746 }, { "epoch": 0.96, "learning_rate": 2.3717617370073444e-08, "loss": 0.8223, "step": 50747 }, { "epoch": 0.96, "learning_rate": 2.369662904616765e-08, "loss": 0.8848, "step": 50748 }, { "epoch": 0.96, "learning_rate": 2.3675649968702696e-08, "loss": 1.1007, "step": 50749 }, { "epoch": 0.96, "learning_rate": 2.3654680137756846e-08, "loss": 1.0075, "step": 50750 }, { "epoch": 0.96, "learning_rate": 2.363371955340865e-08, "loss": 1.0389, "step": 50751 }, { "epoch": 0.96, "learning_rate": 2.3612768215736105e-08, "loss": 0.787, "step": 50752 }, { "epoch": 0.96, "learning_rate": 2.359182612481775e-08, "loss": 1.0209, "step": 50753 }, { "epoch": 0.96, "learning_rate": 2.3570893280731033e-08, "loss": 0.6894, "step": 50754 }, { "epoch": 0.96, "learning_rate": 2.354996968355533e-08, "loss": 0.7931, "step": 50755 }, { "epoch": 0.96, "learning_rate": 2.3529055333367802e-08, "loss": 0.9122, "step": 50756 }, { "epoch": 0.96, "learning_rate": 2.350815023024672e-08, "loss": 1.0597, "step": 50757 }, { "epoch": 0.96, "learning_rate": 2.348725437427063e-08, "loss": 0.8055, "step": 50758 }, { "epoch": 0.96, "learning_rate": 2.3466367765516972e-08, "loss": 0.7013, "step": 50759 }, { "epoch": 0.96, "learning_rate": 2.344549040406402e-08, "loss": 0.6166, "step": 50760 }, { "epoch": 0.96, "learning_rate": 2.342462228998976e-08, "loss": 0.9032, "step": 50761 }, { "epoch": 0.96, "learning_rate": 2.340376342337192e-08, "loss": 1.1511, "step": 50762 }, { "epoch": 0.96, "learning_rate": 2.3382913804288476e-08, "loss": 1.0552, "step": 50763 }, { "epoch": 0.96, "learning_rate": 2.3362073432817433e-08, "loss": 0.9858, "step": 50764 }, { "epoch": 0.96, "learning_rate": 2.3341242309036505e-08, "loss": 0.8128, "step": 50765 }, { "epoch": 0.96, "learning_rate": 2.3320420433023126e-08, "loss": 0.716, "step": 50766 }, { "epoch": 0.96, "learning_rate": 2.3299607804855574e-08, "loss": 0.989, "step": 50767 }, { "epoch": 0.96, "learning_rate": 2.3278804424611555e-08, "loss": 1.021, "step": 50768 }, { "epoch": 0.96, "learning_rate": 2.3258010292368237e-08, "loss": 0.7985, "step": 50769 }, { "epoch": 0.96, "learning_rate": 2.323722540820361e-08, "loss": 1.1227, "step": 50770 }, { "epoch": 0.96, "learning_rate": 2.3216449772195116e-08, "loss": 0.951, "step": 50771 }, { "epoch": 0.96, "learning_rate": 2.319568338442074e-08, "loss": 0.8896, "step": 50772 }, { "epoch": 0.96, "learning_rate": 2.317492624495765e-08, "loss": 0.7706, "step": 50773 }, { "epoch": 0.96, "learning_rate": 2.315417835388356e-08, "loss": 0.9534, "step": 50774 }, { "epoch": 0.96, "learning_rate": 2.313343971127563e-08, "loss": 1.0612, "step": 50775 }, { "epoch": 0.96, "learning_rate": 2.3112710317211572e-08, "loss": 0.9935, "step": 50776 }, { "epoch": 0.96, "learning_rate": 2.3091990171768553e-08, "loss": 0.6915, "step": 50777 }, { "epoch": 0.96, "learning_rate": 2.3071279275024284e-08, "loss": 1.0065, "step": 50778 }, { "epoch": 0.96, "learning_rate": 2.3050577627055926e-08, "loss": 0.8593, "step": 50779 }, { "epoch": 0.96, "learning_rate": 2.302988522794064e-08, "loss": 0.9423, "step": 50780 }, { "epoch": 0.96, "learning_rate": 2.3009202077755867e-08, "loss": 0.9161, "step": 50781 }, { "epoch": 0.96, "learning_rate": 2.298852817657876e-08, "loss": 1.029, "step": 50782 }, { "epoch": 0.96, "learning_rate": 2.2967863524486765e-08, "loss": 0.9438, "step": 50783 }, { "epoch": 0.96, "learning_rate": 2.2947208121556762e-08, "loss": 0.9819, "step": 50784 }, { "epoch": 0.96, "learning_rate": 2.2926561967865635e-08, "loss": 0.716, "step": 50785 }, { "epoch": 0.96, "learning_rate": 2.2905925063491098e-08, "loss": 1.0217, "step": 50786 }, { "epoch": 0.96, "learning_rate": 2.2885297408509755e-08, "loss": 1.3213, "step": 50787 }, { "epoch": 0.96, "learning_rate": 2.286467900299849e-08, "loss": 0.9828, "step": 50788 }, { "epoch": 0.96, "learning_rate": 2.2844069847035023e-08, "loss": 0.934, "step": 50789 }, { "epoch": 0.96, "learning_rate": 2.2823469940695676e-08, "loss": 1.0815, "step": 50790 }, { "epoch": 0.96, "learning_rate": 2.2802879284057333e-08, "loss": 0.8296, "step": 50791 }, { "epoch": 0.96, "learning_rate": 2.2782297877197435e-08, "loss": 0.9937, "step": 50792 }, { "epoch": 0.96, "learning_rate": 2.276172572019231e-08, "loss": 1.1422, "step": 50793 }, { "epoch": 0.96, "learning_rate": 2.2741162813118834e-08, "loss": 0.868, "step": 50794 }, { "epoch": 0.96, "learning_rate": 2.2720609156054174e-08, "loss": 0.7292, "step": 50795 }, { "epoch": 0.96, "learning_rate": 2.2700064749074658e-08, "loss": 0.7086, "step": 50796 }, { "epoch": 0.96, "learning_rate": 2.2679529592257167e-08, "loss": 0.8223, "step": 50797 }, { "epoch": 0.96, "learning_rate": 2.2659003685678305e-08, "loss": 0.8152, "step": 50798 }, { "epoch": 0.96, "learning_rate": 2.263848702941468e-08, "loss": 0.9478, "step": 50799 }, { "epoch": 0.96, "learning_rate": 2.2617979623543173e-08, "loss": 0.9405, "step": 50800 }, { "epoch": 0.96, "learning_rate": 2.2597481468140113e-08, "loss": 0.9081, "step": 50801 }, { "epoch": 0.96, "learning_rate": 2.2576992563282106e-08, "loss": 0.7593, "step": 50802 }, { "epoch": 0.96, "learning_rate": 2.255651290904548e-08, "loss": 0.8447, "step": 50803 }, { "epoch": 0.96, "learning_rate": 2.2536042505507116e-08, "loss": 0.7933, "step": 50804 }, { "epoch": 0.96, "learning_rate": 2.2515581352743066e-08, "loss": 0.8078, "step": 50805 }, { "epoch": 0.96, "learning_rate": 2.2495129450829933e-08, "loss": 0.9832, "step": 50806 }, { "epoch": 0.96, "learning_rate": 2.2474686799844047e-08, "loss": 0.8672, "step": 50807 }, { "epoch": 0.96, "learning_rate": 2.2454253399861737e-08, "loss": 0.8333, "step": 50808 }, { "epoch": 0.96, "learning_rate": 2.243382925095905e-08, "loss": 0.8256, "step": 50809 }, { "epoch": 0.96, "learning_rate": 2.2413414353212593e-08, "loss": 0.944, "step": 50810 }, { "epoch": 0.96, "learning_rate": 2.2393008706698692e-08, "loss": 0.8116, "step": 50811 }, { "epoch": 0.96, "learning_rate": 2.2372612311493124e-08, "loss": 0.9622, "step": 50812 }, { "epoch": 0.96, "learning_rate": 2.2352225167672216e-08, "loss": 0.8866, "step": 50813 }, { "epoch": 0.96, "learning_rate": 2.2331847275312567e-08, "loss": 0.8165, "step": 50814 }, { "epoch": 0.96, "learning_rate": 2.2311478634489124e-08, "loss": 0.8543, "step": 50815 }, { "epoch": 0.96, "learning_rate": 2.2291119245279323e-08, "loss": 0.9081, "step": 50816 }, { "epoch": 0.96, "learning_rate": 2.2270769107758106e-08, "loss": 0.9464, "step": 50817 }, { "epoch": 0.96, "learning_rate": 2.2250428222002073e-08, "loss": 0.9735, "step": 50818 }, { "epoch": 0.96, "learning_rate": 2.2230096588086725e-08, "loss": 0.9498, "step": 50819 }, { "epoch": 0.96, "learning_rate": 2.2209774206088386e-08, "loss": 0.9506, "step": 50820 }, { "epoch": 0.96, "learning_rate": 2.218946107608283e-08, "loss": 0.9532, "step": 50821 }, { "epoch": 0.96, "learning_rate": 2.216915719814583e-08, "loss": 0.8775, "step": 50822 }, { "epoch": 0.96, "learning_rate": 2.2148862572353435e-08, "loss": 0.8538, "step": 50823 }, { "epoch": 0.96, "learning_rate": 2.2128577198780587e-08, "loss": 0.9078, "step": 50824 }, { "epoch": 0.96, "learning_rate": 2.2108301077504168e-08, "loss": 1.1008, "step": 50825 }, { "epoch": 0.96, "learning_rate": 2.2088034208599396e-08, "loss": 0.8981, "step": 50826 }, { "epoch": 0.96, "learning_rate": 2.2067776592141487e-08, "loss": 0.8646, "step": 50827 }, { "epoch": 0.96, "learning_rate": 2.204752822820705e-08, "loss": 0.9072, "step": 50828 }, { "epoch": 0.96, "learning_rate": 2.202728911687102e-08, "loss": 0.7883, "step": 50829 }, { "epoch": 0.96, "learning_rate": 2.2007059258208897e-08, "loss": 1.0841, "step": 50830 }, { "epoch": 0.96, "learning_rate": 2.1986838652296726e-08, "loss": 1.1883, "step": 50831 }, { "epoch": 0.96, "learning_rate": 2.1966627299209453e-08, "loss": 0.9297, "step": 50832 }, { "epoch": 0.96, "learning_rate": 2.1946425199022848e-08, "loss": 0.7401, "step": 50833 }, { "epoch": 0.96, "learning_rate": 2.1926232351812403e-08, "loss": 0.7856, "step": 50834 }, { "epoch": 0.96, "learning_rate": 2.190604875765362e-08, "loss": 0.8352, "step": 50835 }, { "epoch": 0.96, "learning_rate": 2.1885874416621435e-08, "loss": 0.8875, "step": 50836 }, { "epoch": 0.96, "learning_rate": 2.1865709328791616e-08, "loss": 1.0917, "step": 50837 }, { "epoch": 0.96, "learning_rate": 2.1845553494239115e-08, "loss": 1.1158, "step": 50838 }, { "epoch": 0.96, "learning_rate": 2.1825406913039137e-08, "loss": 0.8914, "step": 50839 }, { "epoch": 0.96, "learning_rate": 2.1805269585267462e-08, "loss": 0.9364, "step": 50840 }, { "epoch": 0.96, "learning_rate": 2.1785141510998753e-08, "loss": 0.6728, "step": 50841 }, { "epoch": 0.96, "learning_rate": 2.1765022690308225e-08, "loss": 0.8902, "step": 50842 }, { "epoch": 0.96, "learning_rate": 2.174491312327137e-08, "loss": 0.8932, "step": 50843 }, { "epoch": 0.96, "learning_rate": 2.172481280996286e-08, "loss": 0.8844, "step": 50844 }, { "epoch": 0.96, "learning_rate": 2.1704721750457902e-08, "loss": 0.8771, "step": 50845 }, { "epoch": 0.96, "learning_rate": 2.1684639944831443e-08, "loss": 0.9149, "step": 50846 }, { "epoch": 0.96, "learning_rate": 2.1664567393158975e-08, "loss": 0.7955, "step": 50847 }, { "epoch": 0.96, "learning_rate": 2.164450409551433e-08, "loss": 0.752, "step": 50848 }, { "epoch": 0.96, "learning_rate": 2.1624450051973833e-08, "loss": 1.0995, "step": 50849 }, { "epoch": 0.96, "learning_rate": 2.1604405262611315e-08, "loss": 0.9302, "step": 50850 }, { "epoch": 0.96, "learning_rate": 2.1584369727501995e-08, "loss": 0.9423, "step": 50851 }, { "epoch": 0.96, "learning_rate": 2.1564343446720538e-08, "loss": 0.853, "step": 50852 }, { "epoch": 0.96, "learning_rate": 2.1544326420341876e-08, "loss": 0.9687, "step": 50853 }, { "epoch": 0.96, "learning_rate": 2.152431864844068e-08, "loss": 0.7706, "step": 50854 }, { "epoch": 0.96, "learning_rate": 2.1504320131091883e-08, "loss": 0.8007, "step": 50855 }, { "epoch": 0.96, "learning_rate": 2.1484330868369874e-08, "loss": 1.0137, "step": 50856 }, { "epoch": 0.96, "learning_rate": 2.1464350860349313e-08, "loss": 1.0147, "step": 50857 }, { "epoch": 0.96, "learning_rate": 2.1444380107105144e-08, "loss": 0.7883, "step": 50858 }, { "epoch": 0.96, "learning_rate": 2.1424418608711196e-08, "loss": 0.7667, "step": 50859 }, { "epoch": 0.96, "learning_rate": 2.1404466365242682e-08, "loss": 0.5952, "step": 50860 }, { "epoch": 0.96, "learning_rate": 2.1384523376773992e-08, "loss": 0.8279, "step": 50861 }, { "epoch": 0.96, "learning_rate": 2.1364589643379507e-08, "loss": 0.9437, "step": 50862 }, { "epoch": 0.96, "learning_rate": 2.1344665165133615e-08, "loss": 0.8134, "step": 50863 }, { "epoch": 0.96, "learning_rate": 2.13247499421107e-08, "loss": 0.7733, "step": 50864 }, { "epoch": 0.96, "learning_rate": 2.130484397438515e-08, "loss": 0.9393, "step": 50865 }, { "epoch": 0.96, "learning_rate": 2.128494726203134e-08, "loss": 0.8779, "step": 50866 }, { "epoch": 0.96, "learning_rate": 2.126505980512339e-08, "loss": 0.8357, "step": 50867 }, { "epoch": 0.96, "learning_rate": 2.1245181603735952e-08, "loss": 0.9533, "step": 50868 }, { "epoch": 0.96, "learning_rate": 2.1225312657942864e-08, "loss": 0.9976, "step": 50869 }, { "epoch": 0.96, "learning_rate": 2.1205452967818508e-08, "loss": 0.7897, "step": 50870 }, { "epoch": 0.96, "learning_rate": 2.118560253343699e-08, "loss": 0.8633, "step": 50871 }, { "epoch": 0.96, "learning_rate": 2.1165761354872416e-08, "loss": 1.1043, "step": 50872 }, { "epoch": 0.96, "learning_rate": 2.11459294321989e-08, "loss": 0.873, "step": 50873 }, { "epoch": 0.96, "learning_rate": 2.112610676549054e-08, "loss": 1.1608, "step": 50874 }, { "epoch": 0.96, "learning_rate": 2.1106293354821173e-08, "loss": 1.0703, "step": 50875 }, { "epoch": 0.96, "learning_rate": 2.1086489200264904e-08, "loss": 0.5867, "step": 50876 }, { "epoch": 0.96, "learning_rate": 2.106669430189584e-08, "loss": 0.9093, "step": 50877 }, { "epoch": 0.96, "learning_rate": 2.1046908659787536e-08, "loss": 0.9674, "step": 50878 }, { "epoch": 0.96, "learning_rate": 2.1027132274014374e-08, "loss": 0.7484, "step": 50879 }, { "epoch": 0.96, "learning_rate": 2.1007365144649628e-08, "loss": 1.0139, "step": 50880 }, { "epoch": 0.96, "learning_rate": 2.0987607271767407e-08, "loss": 1.3713, "step": 50881 }, { "epoch": 0.96, "learning_rate": 2.0967858655441265e-08, "loss": 0.9666, "step": 50882 }, { "epoch": 0.96, "learning_rate": 2.0948119295745307e-08, "loss": 0.9168, "step": 50883 }, { "epoch": 0.96, "learning_rate": 2.0928389192753086e-08, "loss": 0.9823, "step": 50884 }, { "epoch": 0.96, "learning_rate": 2.090866834653843e-08, "loss": 0.9493, "step": 50885 }, { "epoch": 0.96, "learning_rate": 2.0888956757174615e-08, "loss": 0.8871, "step": 50886 }, { "epoch": 0.96, "learning_rate": 2.0869254424735197e-08, "loss": 1.0771, "step": 50887 }, { "epoch": 0.96, "learning_rate": 2.084956134929428e-08, "loss": 0.9719, "step": 50888 }, { "epoch": 0.96, "learning_rate": 2.0829877530925134e-08, "loss": 0.9632, "step": 50889 }, { "epoch": 0.96, "learning_rate": 2.0810202969701043e-08, "loss": 0.7278, "step": 50890 }, { "epoch": 0.96, "learning_rate": 2.079053766569583e-08, "loss": 0.7129, "step": 50891 }, { "epoch": 0.96, "learning_rate": 2.0770881618982498e-08, "loss": 0.9343, "step": 50892 }, { "epoch": 0.96, "learning_rate": 2.0751234829634593e-08, "loss": 0.8369, "step": 50893 }, { "epoch": 0.96, "learning_rate": 2.0731597297725947e-08, "loss": 0.9669, "step": 50894 }, { "epoch": 0.96, "learning_rate": 2.0711969023329283e-08, "loss": 0.839, "step": 50895 }, { "epoch": 0.96, "learning_rate": 2.069235000651787e-08, "loss": 0.7413, "step": 50896 }, { "epoch": 0.96, "learning_rate": 2.0672740247365542e-08, "loss": 1.021, "step": 50897 }, { "epoch": 0.96, "learning_rate": 2.0653139745945293e-08, "loss": 0.7309, "step": 50898 }, { "epoch": 0.96, "learning_rate": 2.0633548502329848e-08, "loss": 1.053, "step": 50899 }, { "epoch": 0.96, "learning_rate": 2.061396651659303e-08, "loss": 1.0844, "step": 50900 }, { "epoch": 0.96, "learning_rate": 2.059439378880729e-08, "loss": 0.7634, "step": 50901 }, { "epoch": 0.96, "learning_rate": 2.0574830319046447e-08, "loss": 1.0596, "step": 50902 }, { "epoch": 0.96, "learning_rate": 2.055527610738295e-08, "loss": 0.7544, "step": 50903 }, { "epoch": 0.96, "learning_rate": 2.053573115389007e-08, "loss": 0.9419, "step": 50904 }, { "epoch": 0.96, "learning_rate": 2.051619545864053e-08, "loss": 1.0059, "step": 50905 }, { "epoch": 0.96, "learning_rate": 2.0496669021707603e-08, "loss": 1.3434, "step": 50906 }, { "epoch": 0.96, "learning_rate": 2.0477151843164568e-08, "loss": 0.7057, "step": 50907 }, { "epoch": 0.96, "learning_rate": 2.0457643923083303e-08, "loss": 0.9476, "step": 50908 }, { "epoch": 0.96, "learning_rate": 2.043814526153709e-08, "loss": 0.782, "step": 50909 }, { "epoch": 0.96, "learning_rate": 2.04186558585992e-08, "loss": 0.7548, "step": 50910 }, { "epoch": 0.96, "learning_rate": 2.03991757143418e-08, "loss": 1.0858, "step": 50911 }, { "epoch": 0.96, "learning_rate": 2.0379704828837888e-08, "loss": 0.8227, "step": 50912 }, { "epoch": 0.96, "learning_rate": 2.036024320216018e-08, "loss": 1.1837, "step": 50913 }, { "epoch": 0.96, "learning_rate": 2.0340790834381398e-08, "loss": 0.8771, "step": 50914 }, { "epoch": 0.96, "learning_rate": 2.032134772557398e-08, "loss": 0.8558, "step": 50915 }, { "epoch": 0.96, "learning_rate": 2.0301913875810376e-08, "loss": 0.8674, "step": 50916 }, { "epoch": 0.96, "learning_rate": 2.0282489285163574e-08, "loss": 0.8064, "step": 50917 }, { "epoch": 0.96, "learning_rate": 2.0263073953706024e-08, "loss": 0.9847, "step": 50918 }, { "epoch": 0.96, "learning_rate": 2.0243667881510165e-08, "loss": 0.9564, "step": 50919 }, { "epoch": 0.96, "learning_rate": 2.022427106864816e-08, "loss": 0.7905, "step": 50920 }, { "epoch": 0.96, "learning_rate": 2.0204883515193007e-08, "loss": 0.9813, "step": 50921 }, { "epoch": 0.96, "learning_rate": 2.0185505221216594e-08, "loss": 0.9086, "step": 50922 }, { "epoch": 0.96, "learning_rate": 2.016613618679164e-08, "loss": 0.6561, "step": 50923 }, { "epoch": 0.96, "learning_rate": 2.0146776411990032e-08, "loss": 0.8084, "step": 50924 }, { "epoch": 0.96, "learning_rate": 2.0127425896884488e-08, "loss": 1.0388, "step": 50925 }, { "epoch": 0.96, "learning_rate": 2.0108084641547175e-08, "loss": 0.7681, "step": 50926 }, { "epoch": 0.96, "learning_rate": 2.008875264604998e-08, "loss": 0.8147, "step": 50927 }, { "epoch": 0.96, "learning_rate": 2.006942991046562e-08, "loss": 0.9167, "step": 50928 }, { "epoch": 0.96, "learning_rate": 2.0050116434865707e-08, "loss": 0.6171, "step": 50929 }, { "epoch": 0.96, "learning_rate": 2.0030812219322958e-08, "loss": 0.7581, "step": 50930 }, { "epoch": 0.96, "learning_rate": 2.0011517263908986e-08, "loss": 1.1573, "step": 50931 }, { "epoch": 0.96, "learning_rate": 1.9992231568695676e-08, "loss": 0.8773, "step": 50932 }, { "epoch": 0.96, "learning_rate": 1.9972955133755745e-08, "loss": 1.0577, "step": 50933 }, { "epoch": 0.96, "learning_rate": 1.995368795916053e-08, "loss": 0.8101, "step": 50934 }, { "epoch": 0.96, "learning_rate": 1.993443004498219e-08, "loss": 0.7627, "step": 50935 }, { "epoch": 0.96, "learning_rate": 1.9915181391292893e-08, "loss": 1.0359, "step": 50936 }, { "epoch": 0.96, "learning_rate": 1.989594199816397e-08, "loss": 1.0093, "step": 50937 }, { "epoch": 0.96, "learning_rate": 1.9876711865667864e-08, "loss": 0.9821, "step": 50938 }, { "epoch": 0.96, "learning_rate": 1.9857490993875907e-08, "loss": 0.9336, "step": 50939 }, { "epoch": 0.96, "learning_rate": 1.9838279382859982e-08, "loss": 0.8035, "step": 50940 }, { "epoch": 0.96, "learning_rate": 1.98190770326917e-08, "loss": 0.717, "step": 50941 }, { "epoch": 0.96, "learning_rate": 1.979988394344351e-08, "loss": 0.732, "step": 50942 }, { "epoch": 0.96, "learning_rate": 1.978070011518618e-08, "loss": 0.9782, "step": 50943 }, { "epoch": 0.96, "learning_rate": 1.97615255479916e-08, "loss": 0.8614, "step": 50944 }, { "epoch": 0.96, "learning_rate": 1.974236024193138e-08, "loss": 0.7981, "step": 50945 }, { "epoch": 0.96, "learning_rate": 1.9723204197077127e-08, "loss": 0.9365, "step": 50946 }, { "epoch": 0.96, "learning_rate": 1.9704057413500733e-08, "loss": 0.8333, "step": 50947 }, { "epoch": 0.96, "learning_rate": 1.968491989127297e-08, "loss": 0.802, "step": 50948 }, { "epoch": 0.96, "learning_rate": 1.9665791630466004e-08, "loss": 1.0805, "step": 50949 }, { "epoch": 0.96, "learning_rate": 1.9646672631150608e-08, "loss": 1.2143, "step": 50950 }, { "epoch": 0.96, "learning_rate": 1.962756289339868e-08, "loss": 0.79, "step": 50951 }, { "epoch": 0.96, "learning_rate": 1.960846241728126e-08, "loss": 0.8715, "step": 50952 }, { "epoch": 0.96, "learning_rate": 1.9589371202869688e-08, "loss": 0.8997, "step": 50953 }, { "epoch": 0.96, "learning_rate": 1.9570289250235574e-08, "loss": 0.9735, "step": 50954 }, { "epoch": 0.96, "learning_rate": 1.955121655944997e-08, "loss": 0.7205, "step": 50955 }, { "epoch": 0.96, "learning_rate": 1.953215313058393e-08, "loss": 1.0473, "step": 50956 }, { "epoch": 0.96, "learning_rate": 1.9513098963708787e-08, "loss": 0.9635, "step": 50957 }, { "epoch": 0.96, "learning_rate": 1.949405405889587e-08, "loss": 0.8607, "step": 50958 }, { "epoch": 0.96, "learning_rate": 1.9475018416215963e-08, "loss": 0.8011, "step": 50959 }, { "epoch": 0.96, "learning_rate": 1.945599203574011e-08, "loss": 0.9683, "step": 50960 }, { "epoch": 0.96, "learning_rate": 1.943697491753993e-08, "loss": 0.9235, "step": 50961 }, { "epoch": 0.96, "learning_rate": 1.941796706168564e-08, "loss": 0.9802, "step": 50962 }, { "epoch": 0.96, "learning_rate": 1.9398968468248846e-08, "loss": 1.1031, "step": 50963 }, { "epoch": 0.96, "learning_rate": 1.9379979137300052e-08, "loss": 0.6943, "step": 50964 }, { "epoch": 0.96, "learning_rate": 1.936099906891059e-08, "loss": 0.867, "step": 50965 }, { "epoch": 0.96, "learning_rate": 1.934202826315096e-08, "loss": 0.6793, "step": 50966 }, { "epoch": 0.96, "learning_rate": 1.932306672009221e-08, "loss": 0.8776, "step": 50967 }, { "epoch": 0.96, "learning_rate": 1.9304114439804843e-08, "loss": 1.062, "step": 50968 }, { "epoch": 0.96, "learning_rate": 1.9285171422360193e-08, "loss": 1.0336, "step": 50969 }, { "epoch": 0.96, "learning_rate": 1.926623766782848e-08, "loss": 0.8776, "step": 50970 }, { "epoch": 0.96, "learning_rate": 1.924731317628048e-08, "loss": 0.7334, "step": 50971 }, { "epoch": 0.96, "learning_rate": 1.922839794778697e-08, "loss": 0.9079, "step": 50972 }, { "epoch": 0.96, "learning_rate": 1.9209491982418728e-08, "loss": 0.82, "step": 50973 }, { "epoch": 0.96, "learning_rate": 1.9190595280245972e-08, "loss": 0.8225, "step": 50974 }, { "epoch": 0.96, "learning_rate": 1.9171707841339758e-08, "loss": 1.0435, "step": 50975 }, { "epoch": 0.96, "learning_rate": 1.9152829665770035e-08, "loss": 1.0011, "step": 50976 }, { "epoch": 0.96, "learning_rate": 1.913396075360785e-08, "loss": 0.801, "step": 50977 }, { "epoch": 0.96, "learning_rate": 1.911510110492315e-08, "loss": 0.9784, "step": 50978 }, { "epoch": 0.96, "learning_rate": 1.9096250719786713e-08, "loss": 0.8123, "step": 50979 }, { "epoch": 0.96, "learning_rate": 1.9077409598268758e-08, "loss": 0.8793, "step": 50980 }, { "epoch": 0.96, "learning_rate": 1.9058577740439786e-08, "loss": 1.2084, "step": 50981 }, { "epoch": 0.96, "learning_rate": 1.903975514637002e-08, "loss": 1.0195, "step": 50982 }, { "epoch": 0.96, "learning_rate": 1.90209418161294e-08, "loss": 0.9395, "step": 50983 }, { "epoch": 0.96, "learning_rate": 1.9002137749788983e-08, "loss": 0.7619, "step": 50984 }, { "epoch": 0.96, "learning_rate": 1.8983342947418437e-08, "loss": 0.9112, "step": 50985 }, { "epoch": 0.96, "learning_rate": 1.8964557409087703e-08, "loss": 0.8233, "step": 50986 }, { "epoch": 0.96, "learning_rate": 1.8945781134867556e-08, "loss": 0.8832, "step": 50987 }, { "epoch": 0.96, "learning_rate": 1.8927014124827668e-08, "loss": 0.9566, "step": 50988 }, { "epoch": 0.96, "learning_rate": 1.890825637903826e-08, "loss": 0.7295, "step": 50989 }, { "epoch": 0.96, "learning_rate": 1.888950789756927e-08, "loss": 0.9442, "step": 50990 }, { "epoch": 0.96, "learning_rate": 1.8870768680490924e-08, "loss": 0.7799, "step": 50991 }, { "epoch": 0.96, "learning_rate": 1.885203872787289e-08, "loss": 0.8348, "step": 50992 }, { "epoch": 0.96, "learning_rate": 1.8833318039785385e-08, "loss": 0.9309, "step": 50993 }, { "epoch": 0.96, "learning_rate": 1.8814606616298082e-08, "loss": 0.9339, "step": 50994 }, { "epoch": 0.96, "learning_rate": 1.8795904457480917e-08, "loss": 1.0565, "step": 50995 }, { "epoch": 0.96, "learning_rate": 1.8777211563404118e-08, "loss": 0.9458, "step": 50996 }, { "epoch": 0.96, "learning_rate": 1.8758527934136794e-08, "loss": 0.9244, "step": 50997 }, { "epoch": 0.96, "learning_rate": 1.8739853569749165e-08, "loss": 0.7678, "step": 50998 }, { "epoch": 0.96, "learning_rate": 1.87211884703109e-08, "loss": 0.9412, "step": 50999 }, { "epoch": 0.96, "learning_rate": 1.8702532635891667e-08, "loss": 1.3137, "step": 51000 }, { "epoch": 0.96, "learning_rate": 1.8683886066560852e-08, "loss": 0.991, "step": 51001 }, { "epoch": 0.96, "learning_rate": 1.866524876238868e-08, "loss": 0.7949, "step": 51002 }, { "epoch": 0.96, "learning_rate": 1.8646620723444252e-08, "loss": 0.8197, "step": 51003 }, { "epoch": 0.96, "learning_rate": 1.862800194979697e-08, "loss": 0.84, "step": 51004 }, { "epoch": 0.96, "learning_rate": 1.860939244151705e-08, "loss": 0.9886, "step": 51005 }, { "epoch": 0.96, "learning_rate": 1.85907921986736e-08, "loss": 1.0679, "step": 51006 }, { "epoch": 0.96, "learning_rate": 1.8572201221335738e-08, "loss": 0.8264, "step": 51007 }, { "epoch": 0.96, "learning_rate": 1.8553619509573406e-08, "loss": 0.809, "step": 51008 }, { "epoch": 0.96, "learning_rate": 1.8535047063455713e-08, "loss": 0.8942, "step": 51009 }, { "epoch": 0.96, "learning_rate": 1.851648388305205e-08, "loss": 1.0803, "step": 51010 }, { "epoch": 0.96, "learning_rate": 1.8497929968431805e-08, "loss": 0.7818, "step": 51011 }, { "epoch": 0.96, "learning_rate": 1.847938531966409e-08, "loss": 1.0236, "step": 51012 }, { "epoch": 0.96, "learning_rate": 1.846084993681829e-08, "loss": 1.078, "step": 51013 }, { "epoch": 0.96, "learning_rate": 1.8442323819963526e-08, "loss": 0.9153, "step": 51014 }, { "epoch": 0.96, "learning_rate": 1.8423806969169455e-08, "loss": 0.8989, "step": 51015 }, { "epoch": 0.96, "learning_rate": 1.840529938450436e-08, "loss": 0.9727, "step": 51016 }, { "epoch": 0.96, "learning_rate": 1.838680106603791e-08, "loss": 0.9479, "step": 51017 }, { "epoch": 0.96, "learning_rate": 1.8368312013839208e-08, "loss": 1.1874, "step": 51018 }, { "epoch": 0.96, "learning_rate": 1.8349832227976815e-08, "loss": 0.8499, "step": 51019 }, { "epoch": 0.96, "learning_rate": 1.8331361708520402e-08, "loss": 0.9997, "step": 51020 }, { "epoch": 0.96, "learning_rate": 1.831290045553824e-08, "loss": 0.9732, "step": 51021 }, { "epoch": 0.96, "learning_rate": 1.82944484691e-08, "loss": 0.8412, "step": 51022 }, { "epoch": 0.96, "learning_rate": 1.8276005749273962e-08, "loss": 0.9381, "step": 51023 }, { "epoch": 0.96, "learning_rate": 1.825757229612951e-08, "loss": 1.1749, "step": 51024 }, { "epoch": 0.96, "learning_rate": 1.8239148109734928e-08, "loss": 1.05, "step": 51025 }, { "epoch": 0.96, "learning_rate": 1.8220733190159323e-08, "loss": 0.8651, "step": 51026 }, { "epoch": 0.96, "learning_rate": 1.8202327537471255e-08, "loss": 1.0216, "step": 51027 }, { "epoch": 0.96, "learning_rate": 1.8183931151739832e-08, "loss": 0.7476, "step": 51028 }, { "epoch": 0.96, "learning_rate": 1.8165544033033334e-08, "loss": 0.9028, "step": 51029 }, { "epoch": 0.96, "learning_rate": 1.8147166181420594e-08, "loss": 0.8429, "step": 51030 }, { "epoch": 0.96, "learning_rate": 1.812879759697045e-08, "loss": 0.8845, "step": 51031 }, { "epoch": 0.96, "learning_rate": 1.8110438279751175e-08, "loss": 0.9867, "step": 51032 }, { "epoch": 0.96, "learning_rate": 1.8092088229831606e-08, "loss": 0.8337, "step": 51033 }, { "epoch": 0.96, "learning_rate": 1.8073747447279744e-08, "loss": 0.9627, "step": 51034 }, { "epoch": 0.96, "learning_rate": 1.8055415932164422e-08, "loss": 0.7998, "step": 51035 }, { "epoch": 0.96, "learning_rate": 1.8037093684554473e-08, "loss": 0.7225, "step": 51036 }, { "epoch": 0.96, "learning_rate": 1.8018780704517626e-08, "loss": 0.9752, "step": 51037 }, { "epoch": 0.96, "learning_rate": 1.800047699212243e-08, "loss": 0.9627, "step": 51038 }, { "epoch": 0.96, "learning_rate": 1.798218254743772e-08, "loss": 0.8619, "step": 51039 }, { "epoch": 0.96, "learning_rate": 1.7963897370531226e-08, "loss": 0.7546, "step": 51040 }, { "epoch": 0.96, "learning_rate": 1.7945621461471218e-08, "loss": 0.8998, "step": 51041 }, { "epoch": 0.96, "learning_rate": 1.7927354820326537e-08, "loss": 0.8784, "step": 51042 }, { "epoch": 0.96, "learning_rate": 1.7909097447164902e-08, "loss": 1.0912, "step": 51043 }, { "epoch": 0.96, "learning_rate": 1.7890849342054595e-08, "loss": 0.9584, "step": 51044 }, { "epoch": 0.96, "learning_rate": 1.7872610505063613e-08, "loss": 0.7875, "step": 51045 }, { "epoch": 0.96, "learning_rate": 1.7854380936260517e-08, "loss": 0.8848, "step": 51046 }, { "epoch": 0.96, "learning_rate": 1.7836160635712752e-08, "loss": 0.8366, "step": 51047 }, { "epoch": 0.96, "learning_rate": 1.7817949603488593e-08, "loss": 0.8026, "step": 51048 }, { "epoch": 0.96, "learning_rate": 1.7799747839656322e-08, "loss": 0.8958, "step": 51049 }, { "epoch": 0.96, "learning_rate": 1.7781555344283662e-08, "loss": 0.882, "step": 51050 }, { "epoch": 0.96, "learning_rate": 1.7763372117438615e-08, "loss": 0.9268, "step": 51051 }, { "epoch": 0.96, "learning_rate": 1.7745198159188902e-08, "loss": 0.7671, "step": 51052 }, { "epoch": 0.96, "learning_rate": 1.7727033469602528e-08, "loss": 0.8828, "step": 51053 }, { "epoch": 0.96, "learning_rate": 1.770887804874749e-08, "loss": 0.748, "step": 51054 }, { "epoch": 0.96, "learning_rate": 1.7690731896691236e-08, "loss": 0.82, "step": 51055 }, { "epoch": 0.96, "learning_rate": 1.7672595013501492e-08, "loss": 0.93, "step": 51056 }, { "epoch": 0.96, "learning_rate": 1.7654467399246532e-08, "loss": 0.8657, "step": 51057 }, { "epoch": 0.96, "learning_rate": 1.7636349053993528e-08, "loss": 0.9577, "step": 51058 }, { "epoch": 0.96, "learning_rate": 1.76182399778102e-08, "loss": 0.8541, "step": 51059 }, { "epoch": 0.96, "learning_rate": 1.7600140170764278e-08, "loss": 0.8987, "step": 51060 }, { "epoch": 0.96, "learning_rate": 1.7582049632923205e-08, "loss": 0.8012, "step": 51061 }, { "epoch": 0.96, "learning_rate": 1.756396836435498e-08, "loss": 1.0524, "step": 51062 }, { "epoch": 0.96, "learning_rate": 1.7545896365126493e-08, "loss": 0.9637, "step": 51063 }, { "epoch": 0.96, "learning_rate": 1.7527833635305746e-08, "loss": 0.7282, "step": 51064 }, { "epoch": 0.96, "learning_rate": 1.7509780174959634e-08, "loss": 0.9258, "step": 51065 }, { "epoch": 0.96, "learning_rate": 1.7491735984156157e-08, "loss": 0.753, "step": 51066 }, { "epoch": 0.96, "learning_rate": 1.747370106296248e-08, "loss": 0.6938, "step": 51067 }, { "epoch": 0.96, "learning_rate": 1.745567541144577e-08, "loss": 0.8878, "step": 51068 }, { "epoch": 0.96, "learning_rate": 1.743765902967348e-08, "loss": 0.8298, "step": 51069 }, { "epoch": 0.96, "learning_rate": 1.7419651917712775e-08, "loss": 1.0677, "step": 51070 }, { "epoch": 0.96, "learning_rate": 1.7401654075630826e-08, "loss": 0.8249, "step": 51071 }, { "epoch": 0.96, "learning_rate": 1.738366550349535e-08, "loss": 1.1146, "step": 51072 }, { "epoch": 0.96, "learning_rate": 1.7365686201372965e-08, "loss": 0.8626, "step": 51073 }, { "epoch": 0.96, "learning_rate": 1.7347716169330843e-08, "loss": 1.0316, "step": 51074 }, { "epoch": 0.96, "learning_rate": 1.732975540743642e-08, "loss": 1.0399, "step": 51075 }, { "epoch": 0.96, "learning_rate": 1.7311803915756598e-08, "loss": 1.0352, "step": 51076 }, { "epoch": 0.96, "learning_rate": 1.729386169435826e-08, "loss": 0.8527, "step": 51077 }, { "epoch": 0.96, "learning_rate": 1.727592874330858e-08, "loss": 0.899, "step": 51078 }, { "epoch": 0.96, "learning_rate": 1.7258005062674442e-08, "loss": 0.8654, "step": 51079 }, { "epoch": 0.96, "learning_rate": 1.7240090652522746e-08, "loss": 0.9221, "step": 51080 }, { "epoch": 0.96, "learning_rate": 1.7222185512920652e-08, "loss": 0.8976, "step": 51081 }, { "epoch": 0.96, "learning_rate": 1.7204289643934503e-08, "loss": 0.9648, "step": 51082 }, { "epoch": 0.96, "learning_rate": 1.718640304563146e-08, "loss": 0.8915, "step": 51083 }, { "epoch": 0.96, "learning_rate": 1.7168525718078422e-08, "loss": 0.8373, "step": 51084 }, { "epoch": 0.96, "learning_rate": 1.7150657661341996e-08, "loss": 0.79, "step": 51085 }, { "epoch": 0.96, "learning_rate": 1.713279887548852e-08, "loss": 0.8345, "step": 51086 }, { "epoch": 0.96, "learning_rate": 1.711494936058544e-08, "loss": 1.0581, "step": 51087 }, { "epoch": 0.96, "learning_rate": 1.7097109116699097e-08, "loss": 0.9293, "step": 51088 }, { "epoch": 0.96, "learning_rate": 1.7079278143895538e-08, "loss": 0.9417, "step": 51089 }, { "epoch": 0.96, "learning_rate": 1.7061456442242218e-08, "loss": 0.8986, "step": 51090 }, { "epoch": 0.96, "learning_rate": 1.7043644011805193e-08, "loss": 0.6917, "step": 51091 }, { "epoch": 0.96, "learning_rate": 1.7025840852651077e-08, "loss": 0.9557, "step": 51092 }, { "epoch": 0.96, "learning_rate": 1.7008046964846205e-08, "loss": 0.9173, "step": 51093 }, { "epoch": 0.96, "learning_rate": 1.6990262348457466e-08, "loss": 0.9943, "step": 51094 }, { "epoch": 0.96, "learning_rate": 1.697248700355064e-08, "loss": 1.0312, "step": 51095 }, { "epoch": 0.96, "learning_rate": 1.6954720930192626e-08, "loss": 0.8083, "step": 51096 }, { "epoch": 0.96, "learning_rate": 1.6936964128449472e-08, "loss": 1.1446, "step": 51097 }, { "epoch": 0.96, "learning_rate": 1.6919216598387246e-08, "loss": 0.7495, "step": 51098 }, { "epoch": 0.96, "learning_rate": 1.6901478340073108e-08, "loss": 1.0984, "step": 51099 }, { "epoch": 0.96, "learning_rate": 1.6883749353572288e-08, "loss": 1.0377, "step": 51100 }, { "epoch": 0.96, "learning_rate": 1.6866029638951677e-08, "loss": 0.9322, "step": 51101 }, { "epoch": 0.96, "learning_rate": 1.684831919627705e-08, "loss": 0.8435, "step": 51102 }, { "epoch": 0.96, "learning_rate": 1.6830618025614754e-08, "loss": 1.016, "step": 51103 }, { "epoch": 0.96, "learning_rate": 1.681292612703056e-08, "loss": 0.7455, "step": 51104 }, { "epoch": 0.96, "learning_rate": 1.6795243500591086e-08, "loss": 1.011, "step": 51105 }, { "epoch": 0.96, "learning_rate": 1.6777570146361832e-08, "loss": 0.9651, "step": 51106 }, { "epoch": 0.96, "learning_rate": 1.675990606440886e-08, "loss": 1.0255, "step": 51107 }, { "epoch": 0.96, "learning_rate": 1.674225125479878e-08, "loss": 0.8225, "step": 51108 }, { "epoch": 0.96, "learning_rate": 1.672460571759654e-08, "loss": 0.8528, "step": 51109 }, { "epoch": 0.96, "learning_rate": 1.6706969452868483e-08, "loss": 0.7994, "step": 51110 }, { "epoch": 0.96, "learning_rate": 1.6689342460680658e-08, "loss": 0.8396, "step": 51111 }, { "epoch": 0.96, "learning_rate": 1.6671724741098573e-08, "loss": 0.9999, "step": 51112 }, { "epoch": 0.96, "learning_rate": 1.6654116294188282e-08, "loss": 0.9164, "step": 51113 }, { "epoch": 0.96, "learning_rate": 1.6636517120015295e-08, "loss": 0.9388, "step": 51114 }, { "epoch": 0.96, "learning_rate": 1.6618927218645387e-08, "loss": 0.7289, "step": 51115 }, { "epoch": 0.96, "learning_rate": 1.6601346590144062e-08, "loss": 0.6481, "step": 51116 }, { "epoch": 0.96, "learning_rate": 1.6583775234577383e-08, "loss": 0.8961, "step": 51117 }, { "epoch": 0.96, "learning_rate": 1.6566213152010845e-08, "loss": 0.785, "step": 51118 }, { "epoch": 0.96, "learning_rate": 1.6548660342509683e-08, "loss": 1.0175, "step": 51119 }, { "epoch": 0.96, "learning_rate": 1.6531116806139945e-08, "loss": 0.883, "step": 51120 }, { "epoch": 0.96, "learning_rate": 1.651358254296659e-08, "loss": 0.6951, "step": 51121 }, { "epoch": 0.96, "learning_rate": 1.6496057553055667e-08, "loss": 0.7171, "step": 51122 }, { "epoch": 0.96, "learning_rate": 1.6478541836472128e-08, "loss": 0.9511, "step": 51123 }, { "epoch": 0.96, "learning_rate": 1.6461035393281476e-08, "loss": 0.9143, "step": 51124 }, { "epoch": 0.96, "learning_rate": 1.6443538223549217e-08, "loss": 1.1279, "step": 51125 }, { "epoch": 0.96, "learning_rate": 1.642605032734085e-08, "loss": 0.9099, "step": 51126 }, { "epoch": 0.96, "learning_rate": 1.640857170472132e-08, "loss": 0.8002, "step": 51127 }, { "epoch": 0.96, "learning_rate": 1.639110235575586e-08, "loss": 0.9951, "step": 51128 }, { "epoch": 0.96, "learning_rate": 1.637364228051025e-08, "loss": 0.7952, "step": 51129 }, { "epoch": 0.96, "learning_rate": 1.6356191479049154e-08, "loss": 1.0349, "step": 51130 }, { "epoch": 0.96, "learning_rate": 1.6338749951437806e-08, "loss": 1.0152, "step": 51131 }, { "epoch": 0.96, "learning_rate": 1.6321317697741424e-08, "loss": 1.0389, "step": 51132 }, { "epoch": 0.96, "learning_rate": 1.6303894718025238e-08, "loss": 0.8043, "step": 51133 }, { "epoch": 0.96, "learning_rate": 1.6286481012353915e-08, "loss": 1.0043, "step": 51134 }, { "epoch": 0.96, "learning_rate": 1.6269076580792965e-08, "loss": 0.7408, "step": 51135 }, { "epoch": 0.96, "learning_rate": 1.625168142340705e-08, "loss": 0.9721, "step": 51136 }, { "epoch": 0.96, "learning_rate": 1.6234295540260847e-08, "loss": 0.9208, "step": 51137 }, { "epoch": 0.96, "learning_rate": 1.6216918931420132e-08, "loss": 0.846, "step": 51138 }, { "epoch": 0.96, "learning_rate": 1.6199551596949304e-08, "loss": 0.8597, "step": 51139 }, { "epoch": 0.96, "learning_rate": 1.618219353691275e-08, "loss": 0.6861, "step": 51140 }, { "epoch": 0.96, "learning_rate": 1.6164844751375974e-08, "loss": 0.7217, "step": 51141 }, { "epoch": 0.96, "learning_rate": 1.6147505240403648e-08, "loss": 0.7976, "step": 51142 }, { "epoch": 0.96, "learning_rate": 1.6130175004060165e-08, "loss": 0.9393, "step": 51143 }, { "epoch": 0.96, "learning_rate": 1.6112854042410476e-08, "loss": 1.0406, "step": 51144 }, { "epoch": 0.96, "learning_rate": 1.6095542355519243e-08, "loss": 0.973, "step": 51145 }, { "epoch": 0.96, "learning_rate": 1.6078239943451145e-08, "loss": 0.8206, "step": 51146 }, { "epoch": 0.96, "learning_rate": 1.606094680627085e-08, "loss": 0.9893, "step": 51147 }, { "epoch": 0.97, "learning_rate": 1.6043662944042747e-08, "loss": 0.9196, "step": 51148 }, { "epoch": 0.97, "learning_rate": 1.6026388356831236e-08, "loss": 0.7702, "step": 51149 }, { "epoch": 0.97, "learning_rate": 1.6009123044701536e-08, "loss": 0.9354, "step": 51150 }, { "epoch": 0.97, "learning_rate": 1.599186700771721e-08, "loss": 1.1984, "step": 51151 }, { "epoch": 0.97, "learning_rate": 1.5974620245943206e-08, "loss": 0.7914, "step": 51152 }, { "epoch": 0.97, "learning_rate": 1.595738275944364e-08, "loss": 0.9681, "step": 51153 }, { "epoch": 0.97, "learning_rate": 1.594015454828318e-08, "loss": 0.8447, "step": 51154 }, { "epoch": 0.97, "learning_rate": 1.592293561252595e-08, "loss": 0.9203, "step": 51155 }, { "epoch": 0.97, "learning_rate": 1.5905725952236327e-08, "loss": 1.1896, "step": 51156 }, { "epoch": 0.97, "learning_rate": 1.5888525567478718e-08, "loss": 0.9486, "step": 51157 }, { "epoch": 0.97, "learning_rate": 1.5871334458316956e-08, "loss": 0.938, "step": 51158 }, { "epoch": 0.97, "learning_rate": 1.585415262481571e-08, "loss": 0.8061, "step": 51159 }, { "epoch": 0.97, "learning_rate": 1.583698006703882e-08, "loss": 0.902, "step": 51160 }, { "epoch": 0.97, "learning_rate": 1.5819816785050123e-08, "loss": 1.001, "step": 51161 }, { "epoch": 0.97, "learning_rate": 1.5802662778914568e-08, "loss": 0.8861, "step": 51162 }, { "epoch": 0.97, "learning_rate": 1.5785518048695436e-08, "loss": 1.11, "step": 51163 }, { "epoch": 0.97, "learning_rate": 1.576838259445712e-08, "loss": 0.903, "step": 51164 }, { "epoch": 0.97, "learning_rate": 1.575125641626346e-08, "loss": 0.9937, "step": 51165 }, { "epoch": 0.97, "learning_rate": 1.573413951417857e-08, "loss": 1.0011, "step": 51166 }, { "epoch": 0.97, "learning_rate": 1.571703188826601e-08, "loss": 0.8564, "step": 51167 }, { "epoch": 0.97, "learning_rate": 1.5699933538589897e-08, "loss": 0.8154, "step": 51168 }, { "epoch": 0.97, "learning_rate": 1.5682844465214343e-08, "loss": 0.7862, "step": 51169 }, { "epoch": 0.97, "learning_rate": 1.5665764668202356e-08, "loss": 0.9736, "step": 51170 }, { "epoch": 0.97, "learning_rate": 1.5648694147618882e-08, "loss": 1.1577, "step": 51171 }, { "epoch": 0.97, "learning_rate": 1.563163290352665e-08, "loss": 0.6496, "step": 51172 }, { "epoch": 0.97, "learning_rate": 1.5614580935989776e-08, "loss": 0.9495, "step": 51173 }, { "epoch": 0.97, "learning_rate": 1.5597538245071818e-08, "loss": 0.8509, "step": 51174 }, { "epoch": 0.97, "learning_rate": 1.558050483083634e-08, "loss": 1.0694, "step": 51175 }, { "epoch": 0.97, "learning_rate": 1.5563480693347454e-08, "loss": 1.0209, "step": 51176 }, { "epoch": 0.97, "learning_rate": 1.5546465832668167e-08, "loss": 0.9752, "step": 51177 }, { "epoch": 0.97, "learning_rate": 1.5529460248862317e-08, "loss": 0.7332, "step": 51178 }, { "epoch": 0.97, "learning_rate": 1.5512463941992907e-08, "loss": 0.7837, "step": 51179 }, { "epoch": 0.97, "learning_rate": 1.549547691212405e-08, "loss": 0.9093, "step": 51180 }, { "epoch": 0.97, "learning_rate": 1.5478499159319037e-08, "loss": 1.1478, "step": 51181 }, { "epoch": 0.97, "learning_rate": 1.546153068364087e-08, "loss": 0.9274, "step": 51182 }, { "epoch": 0.97, "learning_rate": 1.544457148515338e-08, "loss": 0.6304, "step": 51183 }, { "epoch": 0.97, "learning_rate": 1.5427621563919582e-08, "loss": 1.1831, "step": 51184 }, { "epoch": 0.97, "learning_rate": 1.5410680920002753e-08, "loss": 0.8672, "step": 51185 }, { "epoch": 0.97, "learning_rate": 1.5393749553466453e-08, "loss": 0.7809, "step": 51186 }, { "epoch": 0.97, "learning_rate": 1.537682746437369e-08, "loss": 1.081, "step": 51187 }, { "epoch": 0.97, "learning_rate": 1.5359914652787744e-08, "loss": 0.8593, "step": 51188 }, { "epoch": 0.97, "learning_rate": 1.5343011118771344e-08, "loss": 0.8034, "step": 51189 }, { "epoch": 0.97, "learning_rate": 1.532611686238833e-08, "loss": 0.9559, "step": 51190 }, { "epoch": 0.97, "learning_rate": 1.5309231883701148e-08, "loss": 0.8446, "step": 51191 }, { "epoch": 0.97, "learning_rate": 1.529235618277336e-08, "loss": 0.9848, "step": 51192 }, { "epoch": 0.97, "learning_rate": 1.5275489759667696e-08, "loss": 0.8229, "step": 51193 }, { "epoch": 0.97, "learning_rate": 1.5258632614447156e-08, "loss": 0.9404, "step": 51194 }, { "epoch": 0.97, "learning_rate": 1.5241784747174472e-08, "loss": 0.9096, "step": 51195 }, { "epoch": 0.97, "learning_rate": 1.5224946157912923e-08, "loss": 0.8335, "step": 51196 }, { "epoch": 0.97, "learning_rate": 1.5208116846725517e-08, "loss": 0.8209, "step": 51197 }, { "epoch": 0.97, "learning_rate": 1.519129681367443e-08, "loss": 0.8729, "step": 51198 }, { "epoch": 0.97, "learning_rate": 1.5174486058823212e-08, "loss": 0.7757, "step": 51199 }, { "epoch": 0.97, "learning_rate": 1.5157684582233766e-08, "loss": 0.8095, "step": 51200 }, { "epoch": 0.97, "learning_rate": 1.5140892383969652e-08, "loss": 0.907, "step": 51201 }, { "epoch": 0.97, "learning_rate": 1.5124109464093318e-08, "loss": 0.8628, "step": 51202 }, { "epoch": 0.97, "learning_rate": 1.5107335822667213e-08, "loss": 0.799, "step": 51203 }, { "epoch": 0.97, "learning_rate": 1.5090571459754345e-08, "loss": 0.6532, "step": 51204 }, { "epoch": 0.97, "learning_rate": 1.5073816375416885e-08, "loss": 0.9752, "step": 51205 }, { "epoch": 0.97, "learning_rate": 1.505707056971756e-08, "loss": 0.8107, "step": 51206 }, { "epoch": 0.97, "learning_rate": 1.5040334042719096e-08, "loss": 1.0778, "step": 51207 }, { "epoch": 0.97, "learning_rate": 1.5023606794483668e-08, "loss": 1.0128, "step": 51208 }, { "epoch": 0.97, "learning_rate": 1.5006888825074284e-08, "loss": 0.8405, "step": 51209 }, { "epoch": 0.97, "learning_rate": 1.4990180134552555e-08, "loss": 0.8799, "step": 51210 }, { "epoch": 0.97, "learning_rate": 1.4973480722981493e-08, "loss": 1.0027, "step": 51211 }, { "epoch": 0.97, "learning_rate": 1.4956790590423266e-08, "loss": 1.0023, "step": 51212 }, { "epoch": 0.97, "learning_rate": 1.494010973694032e-08, "loss": 1.0127, "step": 51213 }, { "epoch": 0.97, "learning_rate": 1.492343816259456e-08, "loss": 0.9299, "step": 51214 }, { "epoch": 0.97, "learning_rate": 1.490677586744843e-08, "loss": 0.7914, "step": 51215 }, { "epoch": 0.97, "learning_rate": 1.4890122851564382e-08, "loss": 0.8528, "step": 51216 }, { "epoch": 0.97, "learning_rate": 1.4873479115004586e-08, "loss": 0.857, "step": 51217 }, { "epoch": 0.97, "learning_rate": 1.485684465783066e-08, "loss": 1.0044, "step": 51218 }, { "epoch": 0.97, "learning_rate": 1.4840219480105333e-08, "loss": 1.2081, "step": 51219 }, { "epoch": 0.97, "learning_rate": 1.48236035818905e-08, "loss": 0.8723, "step": 51220 }, { "epoch": 0.97, "learning_rate": 1.4806996963247777e-08, "loss": 0.9988, "step": 51221 }, { "epoch": 0.97, "learning_rate": 1.4790399624239615e-08, "loss": 1.012, "step": 51222 }, { "epoch": 0.97, "learning_rate": 1.4773811564928187e-08, "loss": 0.9201, "step": 51223 }, { "epoch": 0.97, "learning_rate": 1.475723278537483e-08, "loss": 1.213, "step": 51224 }, { "epoch": 0.97, "learning_rate": 1.4740663285641999e-08, "loss": 1.0455, "step": 51225 }, { "epoch": 0.97, "learning_rate": 1.4724103065791307e-08, "loss": 0.9419, "step": 51226 }, { "epoch": 0.97, "learning_rate": 1.470755212588465e-08, "loss": 0.8204, "step": 51227 }, { "epoch": 0.97, "learning_rate": 1.4691010465983646e-08, "loss": 0.9683, "step": 51228 }, { "epoch": 0.97, "learning_rate": 1.467447808615019e-08, "loss": 0.8613, "step": 51229 }, { "epoch": 0.97, "learning_rate": 1.4657954986446176e-08, "loss": 0.8145, "step": 51230 }, { "epoch": 0.97, "learning_rate": 1.4641441166932946e-08, "loss": 0.9691, "step": 51231 }, { "epoch": 0.97, "learning_rate": 1.462493662767267e-08, "loss": 1.084, "step": 51232 }, { "epoch": 0.97, "learning_rate": 1.4608441368726411e-08, "loss": 0.7545, "step": 51233 }, { "epoch": 0.97, "learning_rate": 1.4591955390156342e-08, "loss": 0.8972, "step": 51234 }, { "epoch": 0.97, "learning_rate": 1.4575478692023526e-08, "loss": 0.8779, "step": 51235 }, { "epoch": 0.97, "learning_rate": 1.4559011274389579e-08, "loss": 0.7802, "step": 51236 }, { "epoch": 0.97, "learning_rate": 1.4542553137316117e-08, "loss": 1.2005, "step": 51237 }, { "epoch": 0.97, "learning_rate": 1.4526104280864484e-08, "loss": 0.9172, "step": 51238 }, { "epoch": 0.97, "learning_rate": 1.4509664705096294e-08, "loss": 0.9863, "step": 51239 }, { "epoch": 0.97, "learning_rate": 1.4493234410072887e-08, "loss": 0.8571, "step": 51240 }, { "epoch": 0.97, "learning_rate": 1.4476813395855327e-08, "loss": 0.9797, "step": 51241 }, { "epoch": 0.97, "learning_rate": 1.446040166250523e-08, "loss": 0.866, "step": 51242 }, { "epoch": 0.97, "learning_rate": 1.4443999210083937e-08, "loss": 0.9971, "step": 51243 }, { "epoch": 0.97, "learning_rate": 1.442760603865251e-08, "loss": 0.9528, "step": 51244 }, { "epoch": 0.97, "learning_rate": 1.4411222148271731e-08, "loss": 0.9298, "step": 51245 }, { "epoch": 0.97, "learning_rate": 1.4394847539003776e-08, "loss": 0.9166, "step": 51246 }, { "epoch": 0.97, "learning_rate": 1.437848221090915e-08, "loss": 0.9442, "step": 51247 }, { "epoch": 0.97, "learning_rate": 1.4362126164048918e-08, "loss": 0.7277, "step": 51248 }, { "epoch": 0.97, "learning_rate": 1.4345779398484416e-08, "loss": 1.2602, "step": 51249 }, { "epoch": 0.97, "learning_rate": 1.4329441914276432e-08, "loss": 1.1302, "step": 51250 }, { "epoch": 0.97, "learning_rate": 1.4313113711486303e-08, "loss": 0.9307, "step": 51251 }, { "epoch": 0.97, "learning_rate": 1.429679479017454e-08, "loss": 0.9073, "step": 51252 }, { "epoch": 0.97, "learning_rate": 1.4280485150402479e-08, "loss": 0.8592, "step": 51253 }, { "epoch": 0.97, "learning_rate": 1.4264184792230907e-08, "loss": 0.6154, "step": 51254 }, { "epoch": 0.97, "learning_rate": 1.4247893715720606e-08, "loss": 1.0104, "step": 51255 }, { "epoch": 0.97, "learning_rate": 1.4231611920932365e-08, "loss": 0.9679, "step": 51256 }, { "epoch": 0.97, "learning_rate": 1.4215339407927242e-08, "loss": 0.9231, "step": 51257 }, { "epoch": 0.97, "learning_rate": 1.4199076176765747e-08, "loss": 0.9091, "step": 51258 }, { "epoch": 0.97, "learning_rate": 1.4182822227508664e-08, "loss": 0.7666, "step": 51259 }, { "epoch": 0.97, "learning_rate": 1.4166577560216776e-08, "loss": 0.9045, "step": 51260 }, { "epoch": 0.97, "learning_rate": 1.4150342174950315e-08, "loss": 0.8182, "step": 51261 }, { "epoch": 0.97, "learning_rate": 1.413411607177062e-08, "loss": 1.2341, "step": 51262 }, { "epoch": 0.97, "learning_rate": 1.411789925073792e-08, "loss": 0.9057, "step": 51263 }, { "epoch": 0.97, "learning_rate": 1.4101691711912723e-08, "loss": 0.7707, "step": 51264 }, { "epoch": 0.97, "learning_rate": 1.4085493455355537e-08, "loss": 0.884, "step": 51265 }, { "epoch": 0.97, "learning_rate": 1.4069304481126866e-08, "loss": 0.9442, "step": 51266 }, { "epoch": 0.97, "learning_rate": 1.405312478928722e-08, "loss": 0.8921, "step": 51267 }, { "epoch": 0.97, "learning_rate": 1.4036954379897105e-08, "loss": 0.8954, "step": 51268 }, { "epoch": 0.97, "learning_rate": 1.402079325301675e-08, "loss": 1.1555, "step": 51269 }, { "epoch": 0.97, "learning_rate": 1.4004641408706387e-08, "loss": 0.9143, "step": 51270 }, { "epoch": 0.97, "learning_rate": 1.3988498847026521e-08, "loss": 0.8284, "step": 51271 }, { "epoch": 0.97, "learning_rate": 1.3972365568037382e-08, "loss": 0.9017, "step": 51272 }, { "epoch": 0.97, "learning_rate": 1.3956241571799201e-08, "loss": 0.8487, "step": 51273 }, { "epoch": 0.97, "learning_rate": 1.3940126858372483e-08, "loss": 0.8089, "step": 51274 }, { "epoch": 0.97, "learning_rate": 1.3924021427816625e-08, "loss": 1.1829, "step": 51275 }, { "epoch": 0.97, "learning_rate": 1.3907925280192413e-08, "loss": 0.7718, "step": 51276 }, { "epoch": 0.97, "learning_rate": 1.3891838415560077e-08, "loss": 0.8503, "step": 51277 }, { "epoch": 0.97, "learning_rate": 1.3875760833979012e-08, "loss": 0.8376, "step": 51278 }, { "epoch": 0.97, "learning_rate": 1.3859692535509728e-08, "loss": 0.79, "step": 51279 }, { "epoch": 0.97, "learning_rate": 1.3843633520212174e-08, "loss": 0.989, "step": 51280 }, { "epoch": 0.97, "learning_rate": 1.3827583788146304e-08, "loss": 1.2257, "step": 51281 }, { "epoch": 0.97, "learning_rate": 1.3811543339371792e-08, "loss": 1.01, "step": 51282 }, { "epoch": 0.97, "learning_rate": 1.3795512173949144e-08, "loss": 0.8597, "step": 51283 }, { "epoch": 0.97, "learning_rate": 1.377949029193748e-08, "loss": 0.9239, "step": 51284 }, { "epoch": 0.97, "learning_rate": 1.3763477693397031e-08, "loss": 0.5975, "step": 51285 }, { "epoch": 0.97, "learning_rate": 1.3747474378387749e-08, "loss": 0.7797, "step": 51286 }, { "epoch": 0.97, "learning_rate": 1.3731480346969029e-08, "loss": 0.9612, "step": 51287 }, { "epoch": 0.97, "learning_rate": 1.3715495599200546e-08, "loss": 0.9667, "step": 51288 }, { "epoch": 0.97, "learning_rate": 1.369952013514253e-08, "loss": 0.8998, "step": 51289 }, { "epoch": 0.97, "learning_rate": 1.36835539548541e-08, "loss": 0.8323, "step": 51290 }, { "epoch": 0.97, "learning_rate": 1.3667597058394932e-08, "loss": 0.897, "step": 51291 }, { "epoch": 0.97, "learning_rate": 1.36516494458247e-08, "loss": 0.8865, "step": 51292 }, { "epoch": 0.97, "learning_rate": 1.3635711117203354e-08, "loss": 0.8781, "step": 51293 }, { "epoch": 0.97, "learning_rate": 1.361978207258946e-08, "loss": 1.1382, "step": 51294 }, { "epoch": 0.97, "learning_rate": 1.3603862312043526e-08, "loss": 0.8695, "step": 51295 }, { "epoch": 0.97, "learning_rate": 1.3587951835624391e-08, "loss": 0.8687, "step": 51296 }, { "epoch": 0.97, "learning_rate": 1.3572050643391731e-08, "loss": 0.6614, "step": 51297 }, { "epoch": 0.97, "learning_rate": 1.3556158735404667e-08, "loss": 0.8543, "step": 51298 }, { "epoch": 0.97, "learning_rate": 1.3540276111722595e-08, "loss": 1.0054, "step": 51299 }, { "epoch": 0.97, "learning_rate": 1.352440277240491e-08, "loss": 1.0388, "step": 51300 }, { "epoch": 0.97, "learning_rate": 1.350853871751101e-08, "loss": 0.9045, "step": 51301 }, { "epoch": 0.97, "learning_rate": 1.3492683947100015e-08, "loss": 0.8671, "step": 51302 }, { "epoch": 0.97, "learning_rate": 1.3476838461230768e-08, "loss": 0.8732, "step": 51303 }, { "epoch": 0.97, "learning_rate": 1.3461002259963219e-08, "loss": 0.8491, "step": 51304 }, { "epoch": 0.97, "learning_rate": 1.3445175343355655e-08, "loss": 0.7537, "step": 51305 }, { "epoch": 0.97, "learning_rate": 1.342935771146775e-08, "loss": 1.2898, "step": 51306 }, { "epoch": 0.97, "learning_rate": 1.3413549364358346e-08, "loss": 0.9469, "step": 51307 }, { "epoch": 0.97, "learning_rate": 1.3397750302086565e-08, "loss": 0.8094, "step": 51308 }, { "epoch": 0.97, "learning_rate": 1.3381960524711246e-08, "loss": 0.7729, "step": 51309 }, { "epoch": 0.97, "learning_rate": 1.336618003229151e-08, "loss": 0.791, "step": 51310 }, { "epoch": 0.97, "learning_rate": 1.3350408824886197e-08, "loss": 0.9649, "step": 51311 }, { "epoch": 0.97, "learning_rate": 1.333464690255415e-08, "loss": 0.9852, "step": 51312 }, { "epoch": 0.97, "learning_rate": 1.3318894265354487e-08, "loss": 0.8922, "step": 51313 }, { "epoch": 0.97, "learning_rate": 1.3303150913345775e-08, "loss": 0.8127, "step": 51314 }, { "epoch": 0.97, "learning_rate": 1.3287416846586576e-08, "loss": 1.0169, "step": 51315 }, { "epoch": 0.97, "learning_rate": 1.3271692065136288e-08, "loss": 0.841, "step": 51316 }, { "epoch": 0.97, "learning_rate": 1.3255976569053197e-08, "loss": 0.7511, "step": 51317 }, { "epoch": 0.97, "learning_rate": 1.3240270358395867e-08, "loss": 0.9678, "step": 51318 }, { "epoch": 0.97, "learning_rate": 1.3224573433223142e-08, "loss": 1.0909, "step": 51319 }, { "epoch": 0.97, "learning_rate": 1.3208885793593863e-08, "loss": 1.1553, "step": 51320 }, { "epoch": 0.97, "learning_rate": 1.3193207439566037e-08, "loss": 0.9381, "step": 51321 }, { "epoch": 0.97, "learning_rate": 1.3177538371198784e-08, "loss": 1.0685, "step": 51322 }, { "epoch": 0.97, "learning_rate": 1.3161878588550115e-08, "loss": 0.7806, "step": 51323 }, { "epoch": 0.97, "learning_rate": 1.314622809167887e-08, "loss": 1.034, "step": 51324 }, { "epoch": 0.97, "learning_rate": 1.3130586880643336e-08, "loss": 1.0781, "step": 51325 }, { "epoch": 0.97, "learning_rate": 1.311495495550208e-08, "loss": 0.9808, "step": 51326 }, { "epoch": 0.97, "learning_rate": 1.3099332316313107e-08, "loss": 0.6524, "step": 51327 }, { "epoch": 0.97, "learning_rate": 1.3083718963134983e-08, "loss": 0.7388, "step": 51328 }, { "epoch": 0.97, "learning_rate": 1.3068114896026274e-08, "loss": 1.1321, "step": 51329 }, { "epoch": 0.97, "learning_rate": 1.3052520115044708e-08, "loss": 1.1356, "step": 51330 }, { "epoch": 0.97, "learning_rate": 1.3036934620248854e-08, "loss": 1.0204, "step": 51331 }, { "epoch": 0.97, "learning_rate": 1.3021358411696994e-08, "loss": 0.9604, "step": 51332 }, { "epoch": 0.97, "learning_rate": 1.3005791489446862e-08, "loss": 1.1119, "step": 51333 }, { "epoch": 0.97, "learning_rate": 1.2990233853557022e-08, "loss": 0.9525, "step": 51334 }, { "epoch": 0.97, "learning_rate": 1.2974685504085482e-08, "loss": 0.8983, "step": 51335 }, { "epoch": 0.97, "learning_rate": 1.2959146441089976e-08, "loss": 0.7364, "step": 51336 }, { "epoch": 0.97, "learning_rate": 1.294361666462879e-08, "loss": 1.0306, "step": 51337 }, { "epoch": 0.97, "learning_rate": 1.292809617475993e-08, "loss": 0.9658, "step": 51338 }, { "epoch": 0.97, "learning_rate": 1.2912584971541408e-08, "loss": 0.9646, "step": 51339 }, { "epoch": 0.97, "learning_rate": 1.2897083055030956e-08, "loss": 0.8392, "step": 51340 }, { "epoch": 0.97, "learning_rate": 1.2881590425286583e-08, "loss": 0.8804, "step": 51341 }, { "epoch": 0.97, "learning_rate": 1.286610708236602e-08, "loss": 0.701, "step": 51342 }, { "epoch": 0.97, "learning_rate": 1.2850633026327275e-08, "loss": 0.98, "step": 51343 }, { "epoch": 0.97, "learning_rate": 1.2835168257227804e-08, "loss": 0.9308, "step": 51344 }, { "epoch": 0.97, "learning_rate": 1.2819712775125615e-08, "loss": 0.7743, "step": 51345 }, { "epoch": 0.97, "learning_rate": 1.2804266580078717e-08, "loss": 0.9781, "step": 51346 }, { "epoch": 0.97, "learning_rate": 1.278882967214401e-08, "loss": 1.0641, "step": 51347 }, { "epoch": 0.97, "learning_rate": 1.2773402051379502e-08, "loss": 0.7204, "step": 51348 }, { "epoch": 0.97, "learning_rate": 1.2757983717843203e-08, "loss": 0.7941, "step": 51349 }, { "epoch": 0.97, "learning_rate": 1.2742574671592013e-08, "loss": 1.0196, "step": 51350 }, { "epoch": 0.97, "learning_rate": 1.2727174912683938e-08, "loss": 0.9379, "step": 51351 }, { "epoch": 0.97, "learning_rate": 1.2711784441176433e-08, "loss": 0.9463, "step": 51352 }, { "epoch": 0.97, "learning_rate": 1.2696403257126677e-08, "loss": 0.8386, "step": 51353 }, { "epoch": 0.97, "learning_rate": 1.2681031360592399e-08, "loss": 0.719, "step": 51354 }, { "epoch": 0.97, "learning_rate": 1.2665668751630777e-08, "loss": 0.9615, "step": 51355 }, { "epoch": 0.97, "learning_rate": 1.2650315430299542e-08, "loss": 1.2701, "step": 51356 }, { "epoch": 0.97, "learning_rate": 1.2634971396655592e-08, "loss": 1.0096, "step": 51357 }, { "epoch": 0.97, "learning_rate": 1.2619636650756385e-08, "loss": 0.849, "step": 51358 }, { "epoch": 0.97, "learning_rate": 1.2604311192659091e-08, "loss": 0.8102, "step": 51359 }, { "epoch": 0.97, "learning_rate": 1.2588995022421168e-08, "loss": 1.1006, "step": 51360 }, { "epoch": 0.97, "learning_rate": 1.2573688140099794e-08, "loss": 0.9898, "step": 51361 }, { "epoch": 0.97, "learning_rate": 1.2558390545751864e-08, "loss": 1.2328, "step": 51362 }, { "epoch": 0.97, "learning_rate": 1.2543102239434557e-08, "loss": 0.8231, "step": 51363 }, { "epoch": 0.97, "learning_rate": 1.252782322120505e-08, "loss": 0.7209, "step": 51364 }, { "epoch": 0.97, "learning_rate": 1.2512553491120516e-08, "loss": 0.9755, "step": 51365 }, { "epoch": 0.97, "learning_rate": 1.249729304923758e-08, "loss": 0.7944, "step": 51366 }, { "epoch": 0.97, "learning_rate": 1.2482041895613971e-08, "loss": 0.7137, "step": 51367 }, { "epoch": 0.97, "learning_rate": 1.246680003030576e-08, "loss": 0.8553, "step": 51368 }, { "epoch": 0.97, "learning_rate": 1.2451567453370117e-08, "loss": 1.0048, "step": 51369 }, { "epoch": 0.97, "learning_rate": 1.24363441648645e-08, "loss": 0.9402, "step": 51370 }, { "epoch": 0.97, "learning_rate": 1.2421130164844974e-08, "loss": 0.7369, "step": 51371 }, { "epoch": 0.97, "learning_rate": 1.2405925453368717e-08, "loss": 0.9014, "step": 51372 }, { "epoch": 0.97, "learning_rate": 1.2390730030492625e-08, "loss": 0.8818, "step": 51373 }, { "epoch": 0.97, "learning_rate": 1.2375543896273046e-08, "loss": 0.9718, "step": 51374 }, { "epoch": 0.97, "learning_rate": 1.2360367050767152e-08, "loss": 1.1091, "step": 51375 }, { "epoch": 0.97, "learning_rate": 1.234519949403129e-08, "loss": 0.8743, "step": 51376 }, { "epoch": 0.97, "learning_rate": 1.2330041226122081e-08, "loss": 0.9895, "step": 51377 }, { "epoch": 0.97, "learning_rate": 1.2314892247096144e-08, "loss": 0.9255, "step": 51378 }, { "epoch": 0.97, "learning_rate": 1.2299752557010381e-08, "loss": 0.9186, "step": 51379 }, { "epoch": 0.97, "learning_rate": 1.2284622155921133e-08, "loss": 0.82, "step": 51380 }, { "epoch": 0.97, "learning_rate": 1.2269501043884469e-08, "loss": 0.9872, "step": 51381 }, { "epoch": 0.97, "learning_rate": 1.2254389220957564e-08, "loss": 0.9212, "step": 51382 }, { "epoch": 0.97, "learning_rate": 1.2239286687196205e-08, "loss": 0.7339, "step": 51383 }, { "epoch": 0.97, "learning_rate": 1.2224193442657295e-08, "loss": 1.0126, "step": 51384 }, { "epoch": 0.97, "learning_rate": 1.2209109487396898e-08, "loss": 0.7353, "step": 51385 }, { "epoch": 0.97, "learning_rate": 1.2194034821471356e-08, "loss": 0.807, "step": 51386 }, { "epoch": 0.97, "learning_rate": 1.2178969444937016e-08, "loss": 0.9434, "step": 51387 }, { "epoch": 0.97, "learning_rate": 1.216391335785022e-08, "loss": 0.9006, "step": 51388 }, { "epoch": 0.97, "learning_rate": 1.2148866560267037e-08, "loss": 0.8411, "step": 51389 }, { "epoch": 0.97, "learning_rate": 1.213382905224353e-08, "loss": 0.8852, "step": 51390 }, { "epoch": 0.97, "learning_rate": 1.211880083383632e-08, "loss": 0.8459, "step": 51391 }, { "epoch": 0.97, "learning_rate": 1.210378190510092e-08, "loss": 0.7173, "step": 51392 }, { "epoch": 0.97, "learning_rate": 1.2088772266093951e-08, "loss": 0.7639, "step": 51393 }, { "epoch": 0.97, "learning_rate": 1.2073771916871202e-08, "loss": 1.0306, "step": 51394 }, { "epoch": 0.97, "learning_rate": 1.2058780857488738e-08, "loss": 0.8955, "step": 51395 }, { "epoch": 0.97, "learning_rate": 1.204379908800235e-08, "loss": 0.7849, "step": 51396 }, { "epoch": 0.97, "learning_rate": 1.2028826608468103e-08, "loss": 0.9295, "step": 51397 }, { "epoch": 0.97, "learning_rate": 1.201386341894234e-08, "loss": 0.8902, "step": 51398 }, { "epoch": 0.97, "learning_rate": 1.1998909519480017e-08, "loss": 1.0735, "step": 51399 }, { "epoch": 0.97, "learning_rate": 1.1983964910137757e-08, "loss": 1.0173, "step": 51400 }, { "epoch": 0.97, "learning_rate": 1.1969029590971071e-08, "loss": 0.9774, "step": 51401 }, { "epoch": 0.97, "learning_rate": 1.1954103562035746e-08, "loss": 0.8518, "step": 51402 }, { "epoch": 0.97, "learning_rate": 1.1939186823387573e-08, "loss": 0.9276, "step": 51403 }, { "epoch": 0.97, "learning_rate": 1.192427937508206e-08, "loss": 0.8606, "step": 51404 }, { "epoch": 0.97, "learning_rate": 1.1909381217174998e-08, "loss": 1.2126, "step": 51405 }, { "epoch": 0.97, "learning_rate": 1.1894492349721898e-08, "loss": 1.1768, "step": 51406 }, { "epoch": 0.97, "learning_rate": 1.1879612772778826e-08, "loss": 0.8397, "step": 51407 }, { "epoch": 0.97, "learning_rate": 1.1864742486400738e-08, "loss": 0.821, "step": 51408 }, { "epoch": 0.97, "learning_rate": 1.1849881490643423e-08, "loss": 0.7245, "step": 51409 }, { "epoch": 0.97, "learning_rate": 1.1835029785562669e-08, "loss": 0.7142, "step": 51410 }, { "epoch": 0.97, "learning_rate": 1.1820187371213155e-08, "loss": 0.9757, "step": 51411 }, { "epoch": 0.97, "learning_rate": 1.1805354247650946e-08, "loss": 0.9469, "step": 51412 }, { "epoch": 0.97, "learning_rate": 1.1790530414931279e-08, "loss": 0.9972, "step": 51413 }, { "epoch": 0.97, "learning_rate": 1.1775715873109661e-08, "loss": 0.83, "step": 51414 }, { "epoch": 0.97, "learning_rate": 1.176091062224105e-08, "loss": 0.7079, "step": 51415 }, { "epoch": 0.97, "learning_rate": 1.1746114662380959e-08, "loss": 0.8363, "step": 51416 }, { "epoch": 0.97, "learning_rate": 1.1731327993584618e-08, "loss": 0.9883, "step": 51417 }, { "epoch": 0.97, "learning_rate": 1.1716550615906985e-08, "loss": 0.9693, "step": 51418 }, { "epoch": 0.97, "learning_rate": 1.1701782529403848e-08, "loss": 1.0038, "step": 51419 }, { "epoch": 0.97, "learning_rate": 1.168702373412961e-08, "loss": 0.8331, "step": 51420 }, { "epoch": 0.97, "learning_rate": 1.167227423013978e-08, "loss": 0.8641, "step": 51421 }, { "epoch": 0.97, "learning_rate": 1.165753401748959e-08, "loss": 1.0065, "step": 51422 }, { "epoch": 0.97, "learning_rate": 1.1642803096233723e-08, "loss": 0.7761, "step": 51423 }, { "epoch": 0.97, "learning_rate": 1.162808146642741e-08, "loss": 1.0534, "step": 51424 }, { "epoch": 0.97, "learning_rate": 1.1613369128125328e-08, "loss": 1.1432, "step": 51425 }, { "epoch": 0.97, "learning_rate": 1.1598666081382715e-08, "loss": 0.8536, "step": 51426 }, { "epoch": 0.97, "learning_rate": 1.1583972326254522e-08, "loss": 0.955, "step": 51427 }, { "epoch": 0.97, "learning_rate": 1.1569287862795431e-08, "loss": 0.9569, "step": 51428 }, { "epoch": 0.97, "learning_rate": 1.1554612691060397e-08, "loss": 0.8745, "step": 51429 }, { "epoch": 0.97, "learning_rate": 1.1539946811104096e-08, "loss": 0.7239, "step": 51430 }, { "epoch": 0.97, "learning_rate": 1.1525290222981212e-08, "loss": 1.0052, "step": 51431 }, { "epoch": 0.97, "learning_rate": 1.1510642926746696e-08, "loss": 0.8519, "step": 51432 }, { "epoch": 0.97, "learning_rate": 1.1496004922455228e-08, "loss": 0.6785, "step": 51433 }, { "epoch": 0.97, "learning_rate": 1.148137621016121e-08, "loss": 0.8199, "step": 51434 }, { "epoch": 0.97, "learning_rate": 1.1466756789919598e-08, "loss": 0.7514, "step": 51435 }, { "epoch": 0.97, "learning_rate": 1.1452146661784513e-08, "loss": 0.9201, "step": 51436 }, { "epoch": 0.97, "learning_rate": 1.1437545825811192e-08, "loss": 1.2033, "step": 51437 }, { "epoch": 0.97, "learning_rate": 1.1422954282053477e-08, "loss": 0.9845, "step": 51438 }, { "epoch": 0.97, "learning_rate": 1.1408372030566328e-08, "loss": 1.0015, "step": 51439 }, { "epoch": 0.97, "learning_rate": 1.1393799071403866e-08, "loss": 0.8392, "step": 51440 }, { "epoch": 0.97, "learning_rate": 1.137923540462077e-08, "loss": 0.8916, "step": 51441 }, { "epoch": 0.97, "learning_rate": 1.1364681030271441e-08, "loss": 0.8143, "step": 51442 }, { "epoch": 0.97, "learning_rate": 1.1350135948409724e-08, "loss": 0.9989, "step": 51443 }, { "epoch": 0.97, "learning_rate": 1.1335600159090576e-08, "loss": 1.1265, "step": 51444 }, { "epoch": 0.97, "learning_rate": 1.1321073662367843e-08, "loss": 0.8495, "step": 51445 }, { "epoch": 0.97, "learning_rate": 1.1306556458296203e-08, "loss": 0.9863, "step": 51446 }, { "epoch": 0.97, "learning_rate": 1.1292048546929224e-08, "loss": 0.7834, "step": 51447 }, { "epoch": 0.97, "learning_rate": 1.1277549928321584e-08, "loss": 0.702, "step": 51448 }, { "epoch": 0.97, "learning_rate": 1.126306060252741e-08, "loss": 0.8113, "step": 51449 }, { "epoch": 0.97, "learning_rate": 1.1248580569600264e-08, "loss": 0.851, "step": 51450 }, { "epoch": 0.97, "learning_rate": 1.1234109829595108e-08, "loss": 0.9786, "step": 51451 }, { "epoch": 0.97, "learning_rate": 1.1219648382565229e-08, "loss": 0.7672, "step": 51452 }, { "epoch": 0.97, "learning_rate": 1.1205196228564752e-08, "loss": 0.7002, "step": 51453 }, { "epoch": 0.97, "learning_rate": 1.11907533676478e-08, "loss": 0.7101, "step": 51454 }, { "epoch": 0.97, "learning_rate": 1.1176319799868496e-08, "loss": 0.682, "step": 51455 }, { "epoch": 0.97, "learning_rate": 1.1161895525280409e-08, "loss": 1.0559, "step": 51456 }, { "epoch": 0.97, "learning_rate": 1.1147480543937384e-08, "loss": 1.0864, "step": 51457 }, { "epoch": 0.97, "learning_rate": 1.1133074855893266e-08, "loss": 0.8547, "step": 51458 }, { "epoch": 0.97, "learning_rate": 1.1118678461202182e-08, "loss": 0.7109, "step": 51459 }, { "epoch": 0.97, "learning_rate": 1.1104291359917418e-08, "loss": 0.8203, "step": 51460 }, { "epoch": 0.97, "learning_rate": 1.108991355209338e-08, "loss": 0.9671, "step": 51461 }, { "epoch": 0.97, "learning_rate": 1.1075545037782798e-08, "loss": 1.0211, "step": 51462 }, { "epoch": 0.97, "learning_rate": 1.1061185817040076e-08, "loss": 0.8991, "step": 51463 }, { "epoch": 0.97, "learning_rate": 1.1046835889918507e-08, "loss": 0.7878, "step": 51464 }, { "epoch": 0.97, "learning_rate": 1.1032495256471653e-08, "loss": 0.9819, "step": 51465 }, { "epoch": 0.97, "learning_rate": 1.1018163916753088e-08, "loss": 0.8797, "step": 51466 }, { "epoch": 0.97, "learning_rate": 1.1003841870816656e-08, "loss": 0.681, "step": 51467 }, { "epoch": 0.97, "learning_rate": 1.098952911871537e-08, "loss": 0.9585, "step": 51468 }, { "epoch": 0.97, "learning_rate": 1.0975225660502797e-08, "loss": 1.0685, "step": 51469 }, { "epoch": 0.97, "learning_rate": 1.0960931496232786e-08, "loss": 0.9196, "step": 51470 }, { "epoch": 0.97, "learning_rate": 1.0946646625957791e-08, "loss": 0.7877, "step": 51471 }, { "epoch": 0.97, "learning_rate": 1.0932371049732215e-08, "loss": 0.7593, "step": 51472 }, { "epoch": 0.97, "learning_rate": 1.0918104767608518e-08, "loss": 0.868, "step": 51473 }, { "epoch": 0.97, "learning_rate": 1.0903847779640263e-08, "loss": 0.9483, "step": 51474 }, { "epoch": 0.97, "learning_rate": 1.0889600085881025e-08, "loss": 1.1477, "step": 51475 }, { "epoch": 0.97, "learning_rate": 1.0875361686383534e-08, "loss": 0.8223, "step": 51476 }, { "epoch": 0.97, "learning_rate": 1.0861132581201084e-08, "loss": 0.8937, "step": 51477 }, { "epoch": 0.97, "learning_rate": 1.0846912770386964e-08, "loss": 1.0002, "step": 51478 }, { "epoch": 0.97, "learning_rate": 1.0832702253994188e-08, "loss": 0.7571, "step": 51479 }, { "epoch": 0.97, "learning_rate": 1.0818501032075768e-08, "loss": 0.9746, "step": 51480 }, { "epoch": 0.97, "learning_rate": 1.0804309104684441e-08, "loss": 0.8561, "step": 51481 }, { "epoch": 0.97, "learning_rate": 1.0790126471873775e-08, "loss": 0.872, "step": 51482 }, { "epoch": 0.97, "learning_rate": 1.0775953133696504e-08, "loss": 0.9876, "step": 51483 }, { "epoch": 0.97, "learning_rate": 1.0761789090205366e-08, "loss": 0.8757, "step": 51484 }, { "epoch": 0.97, "learning_rate": 1.0747634341453373e-08, "loss": 0.8529, "step": 51485 }, { "epoch": 0.97, "learning_rate": 1.0733488887493537e-08, "loss": 0.966, "step": 51486 }, { "epoch": 0.97, "learning_rate": 1.0719352728378318e-08, "loss": 1.168, "step": 51487 }, { "epoch": 0.97, "learning_rate": 1.0705225864161007e-08, "loss": 1.0258, "step": 51488 }, { "epoch": 0.97, "learning_rate": 1.0691108294893782e-08, "loss": 0.7814, "step": 51489 }, { "epoch": 0.97, "learning_rate": 1.0677000020629658e-08, "loss": 0.832, "step": 51490 }, { "epoch": 0.97, "learning_rate": 1.0662901041421647e-08, "loss": 0.799, "step": 51491 }, { "epoch": 0.97, "learning_rate": 1.0648811357321654e-08, "loss": 0.7268, "step": 51492 }, { "epoch": 0.97, "learning_rate": 1.063473096838269e-08, "loss": 1.0754, "step": 51493 }, { "epoch": 0.97, "learning_rate": 1.0620659874657491e-08, "loss": 1.0179, "step": 51494 }, { "epoch": 0.97, "learning_rate": 1.0606598076198238e-08, "loss": 0.9137, "step": 51495 }, { "epoch": 0.97, "learning_rate": 1.0592545573057943e-08, "loss": 0.7887, "step": 51496 }, { "epoch": 0.97, "learning_rate": 1.0578502365288512e-08, "loss": 0.9084, "step": 51497 }, { "epoch": 0.97, "learning_rate": 1.0564468452942678e-08, "loss": 0.9955, "step": 51498 }, { "epoch": 0.97, "learning_rate": 1.0550443836072621e-08, "loss": 0.959, "step": 51499 }, { "epoch": 0.97, "learning_rate": 1.053642851473108e-08, "loss": 1.1577, "step": 51500 }, { "epoch": 0.97, "learning_rate": 1.052242248897023e-08, "loss": 0.5582, "step": 51501 }, { "epoch": 0.97, "learning_rate": 1.0508425758841978e-08, "loss": 0.9978, "step": 51502 }, { "epoch": 0.97, "learning_rate": 1.0494438324399337e-08, "loss": 1.0188, "step": 51503 }, { "epoch": 0.97, "learning_rate": 1.048046018569393e-08, "loss": 0.9142, "step": 51504 }, { "epoch": 0.97, "learning_rate": 1.0466491342778218e-08, "loss": 1.0143, "step": 51505 }, { "epoch": 0.97, "learning_rate": 1.0452531795704379e-08, "loss": 0.8912, "step": 51506 }, { "epoch": 0.97, "learning_rate": 1.0438581544524317e-08, "loss": 0.7775, "step": 51507 }, { "epoch": 0.97, "learning_rate": 1.0424640589290213e-08, "loss": 0.7959, "step": 51508 }, { "epoch": 0.97, "learning_rate": 1.0410708930054247e-08, "loss": 0.9557, "step": 51509 }, { "epoch": 0.97, "learning_rate": 1.0396786566868321e-08, "loss": 1.0277, "step": 51510 }, { "epoch": 0.97, "learning_rate": 1.0382873499784617e-08, "loss": 0.9007, "step": 51511 }, { "epoch": 0.97, "learning_rate": 1.036896972885476e-08, "loss": 0.9828, "step": 51512 }, { "epoch": 0.97, "learning_rate": 1.035507525413093e-08, "loss": 1.0178, "step": 51513 }, { "epoch": 0.97, "learning_rate": 1.034119007566503e-08, "loss": 0.778, "step": 51514 }, { "epoch": 0.97, "learning_rate": 1.0327314193508409e-08, "loss": 1.0186, "step": 51515 }, { "epoch": 0.97, "learning_rate": 1.0313447607713522e-08, "loss": 0.809, "step": 51516 }, { "epoch": 0.97, "learning_rate": 1.0299590318331998e-08, "loss": 0.9209, "step": 51517 }, { "epoch": 0.97, "learning_rate": 1.0285742325415183e-08, "loss": 0.9668, "step": 51518 }, { "epoch": 0.97, "learning_rate": 1.0271903629015256e-08, "loss": 0.9387, "step": 51519 }, { "epoch": 0.97, "learning_rate": 1.0258074229183568e-08, "loss": 1.0107, "step": 51520 }, { "epoch": 0.97, "learning_rate": 1.024425412597202e-08, "loss": 0.8872, "step": 51521 }, { "epoch": 0.97, "learning_rate": 1.0230443319432236e-08, "loss": 0.8338, "step": 51522 }, { "epoch": 0.97, "learning_rate": 1.0216641809615291e-08, "loss": 0.9779, "step": 51523 }, { "epoch": 0.97, "learning_rate": 1.020284959657336e-08, "loss": 1.1058, "step": 51524 }, { "epoch": 0.97, "learning_rate": 1.0189066680357519e-08, "loss": 1.0239, "step": 51525 }, { "epoch": 0.97, "learning_rate": 1.0175293061019388e-08, "loss": 1.0604, "step": 51526 }, { "epoch": 0.97, "learning_rate": 1.0161528738610315e-08, "loss": 0.7942, "step": 51527 }, { "epoch": 0.97, "learning_rate": 1.014777371318193e-08, "loss": 0.6429, "step": 51528 }, { "epoch": 0.97, "learning_rate": 1.01340279847853e-08, "loss": 0.8541, "step": 51529 }, { "epoch": 0.97, "learning_rate": 1.0120291553471773e-08, "loss": 0.9316, "step": 51530 }, { "epoch": 0.97, "learning_rate": 1.0106564419292975e-08, "loss": 0.9747, "step": 51531 }, { "epoch": 0.97, "learning_rate": 1.009284658229942e-08, "loss": 0.8315, "step": 51532 }, { "epoch": 0.97, "learning_rate": 1.007913804254329e-08, "loss": 0.8348, "step": 51533 }, { "epoch": 0.97, "learning_rate": 1.0065438800075378e-08, "loss": 0.8941, "step": 51534 }, { "epoch": 0.97, "learning_rate": 1.0051748854946475e-08, "loss": 0.8674, "step": 51535 }, { "epoch": 0.97, "learning_rate": 1.0038068207208206e-08, "loss": 0.6503, "step": 51536 }, { "epoch": 0.97, "learning_rate": 1.0024396856911366e-08, "loss": 1.1485, "step": 51537 }, { "epoch": 0.97, "learning_rate": 1.0010734804107025e-08, "loss": 0.9205, "step": 51538 }, { "epoch": 0.97, "learning_rate": 9.997082048846252e-09, "loss": 1.0311, "step": 51539 }, { "epoch": 0.97, "learning_rate": 9.983438591180117e-09, "loss": 1.034, "step": 51540 }, { "epoch": 0.97, "learning_rate": 9.969804431159414e-09, "loss": 0.8204, "step": 51541 }, { "epoch": 0.97, "learning_rate": 9.956179568835212e-09, "loss": 0.8322, "step": 51542 }, { "epoch": 0.97, "learning_rate": 9.942564004258304e-09, "loss": 0.8365, "step": 51543 }, { "epoch": 0.97, "learning_rate": 9.928957737479205e-09, "loss": 0.9446, "step": 51544 }, { "epoch": 0.97, "learning_rate": 9.915360768549542e-09, "loss": 0.6127, "step": 51545 }, { "epoch": 0.97, "learning_rate": 9.901773097519274e-09, "loss": 0.8196, "step": 51546 }, { "epoch": 0.97, "learning_rate": 9.888194724439471e-09, "loss": 0.8228, "step": 51547 }, { "epoch": 0.97, "learning_rate": 9.874625649360647e-09, "loss": 0.9558, "step": 51548 }, { "epoch": 0.97, "learning_rate": 9.861065872333875e-09, "loss": 0.8848, "step": 51549 }, { "epoch": 0.97, "learning_rate": 9.84751539340939e-09, "loss": 0.9506, "step": 51550 }, { "epoch": 0.97, "learning_rate": 9.833974212637987e-09, "loss": 0.8725, "step": 51551 }, { "epoch": 0.97, "learning_rate": 9.820442330070179e-09, "loss": 0.9869, "step": 51552 }, { "epoch": 0.97, "learning_rate": 9.806919745756482e-09, "loss": 0.9142, "step": 51553 }, { "epoch": 0.97, "learning_rate": 9.793406459747412e-09, "loss": 0.6221, "step": 51554 }, { "epoch": 0.97, "learning_rate": 9.779902472093205e-09, "loss": 0.9175, "step": 51555 }, { "epoch": 0.97, "learning_rate": 9.766407782844655e-09, "loss": 0.946, "step": 51556 }, { "epoch": 0.97, "learning_rate": 9.752922392052e-09, "loss": 0.8874, "step": 51557 }, { "epoch": 0.97, "learning_rate": 9.739446299765753e-09, "loss": 0.8141, "step": 51558 }, { "epoch": 0.97, "learning_rate": 9.725979506035876e-09, "loss": 0.7301, "step": 51559 }, { "epoch": 0.97, "learning_rate": 9.712522010912883e-09, "loss": 0.8292, "step": 51560 }, { "epoch": 0.97, "learning_rate": 9.699073814447014e-09, "loss": 0.7422, "step": 51561 }, { "epoch": 0.97, "learning_rate": 9.685634916688224e-09, "loss": 0.9622, "step": 51562 }, { "epoch": 0.97, "learning_rate": 9.672205317687034e-09, "loss": 0.9534, "step": 51563 }, { "epoch": 0.97, "learning_rate": 9.658785017493677e-09, "loss": 0.8787, "step": 51564 }, { "epoch": 0.97, "learning_rate": 9.64537401615756e-09, "loss": 0.9639, "step": 51565 }, { "epoch": 0.97, "learning_rate": 9.631972313729753e-09, "loss": 0.8108, "step": 51566 }, { "epoch": 0.97, "learning_rate": 9.618579910259662e-09, "loss": 0.8401, "step": 51567 }, { "epoch": 0.97, "learning_rate": 9.605196805797522e-09, "loss": 1.3513, "step": 51568 }, { "epoch": 0.97, "learning_rate": 9.591823000393019e-09, "loss": 1.0484, "step": 51569 }, { "epoch": 0.97, "learning_rate": 9.578458494096388e-09, "loss": 0.9545, "step": 51570 }, { "epoch": 0.97, "learning_rate": 9.565103286957312e-09, "loss": 0.9386, "step": 51571 }, { "epoch": 0.97, "learning_rate": 9.551757379026027e-09, "loss": 1.0732, "step": 51572 }, { "epoch": 0.97, "learning_rate": 9.538420770351942e-09, "loss": 0.8571, "step": 51573 }, { "epoch": 0.97, "learning_rate": 9.525093460985013e-09, "loss": 0.7847, "step": 51574 }, { "epoch": 0.97, "learning_rate": 9.511775450975203e-09, "loss": 0.9088, "step": 51575 }, { "epoch": 0.97, "learning_rate": 9.498466740372193e-09, "loss": 0.946, "step": 51576 }, { "epoch": 0.97, "learning_rate": 9.485167329225109e-09, "loss": 0.7677, "step": 51577 }, { "epoch": 0.97, "learning_rate": 9.471877217584192e-09, "loss": 0.9955, "step": 51578 }, { "epoch": 0.97, "learning_rate": 9.45859640549912e-09, "loss": 0.8683, "step": 51579 }, { "epoch": 0.97, "learning_rate": 9.445324893019026e-09, "loss": 0.8611, "step": 51580 }, { "epoch": 0.97, "learning_rate": 9.432062680193865e-09, "loss": 0.9798, "step": 51581 }, { "epoch": 0.97, "learning_rate": 9.418809767073322e-09, "loss": 1.0717, "step": 51582 }, { "epoch": 0.97, "learning_rate": 9.405566153705969e-09, "loss": 0.9468, "step": 51583 }, { "epoch": 0.97, "learning_rate": 9.392331840142321e-09, "loss": 1.005, "step": 51584 }, { "epoch": 0.97, "learning_rate": 9.379106826431228e-09, "loss": 0.8407, "step": 51585 }, { "epoch": 0.97, "learning_rate": 9.365891112622094e-09, "loss": 0.7722, "step": 51586 }, { "epoch": 0.97, "learning_rate": 9.352684698764602e-09, "loss": 1.1096, "step": 51587 }, { "epoch": 0.97, "learning_rate": 9.339487584907603e-09, "loss": 1.11, "step": 51588 }, { "epoch": 0.97, "learning_rate": 9.3262997711005e-09, "loss": 0.7764, "step": 51589 }, { "epoch": 0.97, "learning_rate": 9.313121257392699e-09, "loss": 0.8501, "step": 51590 }, { "epoch": 0.97, "learning_rate": 9.299952043833327e-09, "loss": 0.7375, "step": 51591 }, { "epoch": 0.97, "learning_rate": 9.28679213047179e-09, "loss": 0.8399, "step": 51592 }, { "epoch": 0.97, "learning_rate": 9.273641517356657e-09, "loss": 1.058, "step": 51593 }, { "epoch": 0.97, "learning_rate": 9.260500204537892e-09, "loss": 1.1397, "step": 51594 }, { "epoch": 0.97, "learning_rate": 9.247368192063511e-09, "loss": 0.7675, "step": 51595 }, { "epoch": 0.97, "learning_rate": 9.234245479983472e-09, "loss": 0.9035, "step": 51596 }, { "epoch": 0.97, "learning_rate": 9.221132068346072e-09, "loss": 0.7097, "step": 51597 }, { "epoch": 0.97, "learning_rate": 9.208027957200715e-09, "loss": 0.7699, "step": 51598 }, { "epoch": 0.97, "learning_rate": 9.194933146596253e-09, "loss": 0.8799, "step": 51599 }, { "epoch": 0.97, "learning_rate": 9.181847636581532e-09, "loss": 1.0434, "step": 51600 }, { "epoch": 0.97, "learning_rate": 9.168771427205404e-09, "loss": 1.0861, "step": 51601 }, { "epoch": 0.97, "learning_rate": 9.155704518516717e-09, "loss": 0.7245, "step": 51602 }, { "epoch": 0.97, "learning_rate": 9.142646910564601e-09, "loss": 0.9002, "step": 51603 }, { "epoch": 0.97, "learning_rate": 9.129598603396795e-09, "loss": 0.8233, "step": 51604 }, { "epoch": 0.97, "learning_rate": 9.116559597063257e-09, "loss": 0.884, "step": 51605 }, { "epoch": 0.97, "learning_rate": 9.103529891612005e-09, "loss": 1.0087, "step": 51606 }, { "epoch": 0.97, "learning_rate": 9.090509487091614e-09, "loss": 0.968, "step": 51607 }, { "epoch": 0.97, "learning_rate": 9.07749838355093e-09, "loss": 0.9136, "step": 51608 }, { "epoch": 0.97, "learning_rate": 9.06449658103853e-09, "loss": 0.8732, "step": 51609 }, { "epoch": 0.97, "learning_rate": 9.05150407960298e-09, "loss": 0.7686, "step": 51610 }, { "epoch": 0.97, "learning_rate": 9.038520879292577e-09, "loss": 0.9487, "step": 51611 }, { "epoch": 0.97, "learning_rate": 9.025546980156174e-09, "loss": 1.1885, "step": 51612 }, { "epoch": 0.97, "learning_rate": 9.012582382241786e-09, "loss": 0.9542, "step": 51613 }, { "epoch": 0.97, "learning_rate": 8.999627085598261e-09, "loss": 1.0231, "step": 51614 }, { "epoch": 0.97, "learning_rate": 8.986681090273619e-09, "loss": 0.9292, "step": 51615 }, { "epoch": 0.97, "learning_rate": 8.97374439631643e-09, "loss": 0.9836, "step": 51616 }, { "epoch": 0.97, "learning_rate": 8.960817003774713e-09, "loss": 0.7969, "step": 51617 }, { "epoch": 0.97, "learning_rate": 8.94789891269704e-09, "loss": 1.1253, "step": 51618 }, { "epoch": 0.97, "learning_rate": 8.934990123131704e-09, "loss": 0.8423, "step": 51619 }, { "epoch": 0.97, "learning_rate": 8.922090635126446e-09, "loss": 0.8864, "step": 51620 }, { "epoch": 0.97, "learning_rate": 8.909200448729838e-09, "loss": 0.8434, "step": 51621 }, { "epoch": 0.97, "learning_rate": 8.896319563989896e-09, "loss": 0.8527, "step": 51622 }, { "epoch": 0.97, "learning_rate": 8.883447980954917e-09, "loss": 0.9789, "step": 51623 }, { "epoch": 0.97, "learning_rate": 8.87058569967264e-09, "loss": 1.0593, "step": 51624 }, { "epoch": 0.97, "learning_rate": 8.857732720191082e-09, "loss": 1.2661, "step": 51625 }, { "epoch": 0.97, "learning_rate": 8.844889042558535e-09, "loss": 0.9916, "step": 51626 }, { "epoch": 0.97, "learning_rate": 8.832054666822742e-09, "loss": 0.8311, "step": 51627 }, { "epoch": 0.97, "learning_rate": 8.819229593031442e-09, "loss": 1.0466, "step": 51628 }, { "epoch": 0.97, "learning_rate": 8.806413821232928e-09, "loss": 0.8457, "step": 51629 }, { "epoch": 0.97, "learning_rate": 8.793607351474941e-09, "loss": 1.0048, "step": 51630 }, { "epoch": 0.97, "learning_rate": 8.780810183805221e-09, "loss": 1.1372, "step": 51631 }, { "epoch": 0.97, "learning_rate": 8.768022318271508e-09, "loss": 0.9631, "step": 51632 }, { "epoch": 0.97, "learning_rate": 8.755243754921816e-09, "loss": 0.9958, "step": 51633 }, { "epoch": 0.97, "learning_rate": 8.74247449380361e-09, "loss": 0.9375, "step": 51634 }, { "epoch": 0.97, "learning_rate": 8.729714534964351e-09, "loss": 0.9595, "step": 51635 }, { "epoch": 0.97, "learning_rate": 8.716963878452333e-09, "loss": 0.948, "step": 51636 }, { "epoch": 0.97, "learning_rate": 8.704222524314466e-09, "loss": 1.0878, "step": 51637 }, { "epoch": 0.97, "learning_rate": 8.691490472598763e-09, "loss": 1.0166, "step": 51638 }, { "epoch": 0.97, "learning_rate": 8.678767723352688e-09, "loss": 0.7549, "step": 51639 }, { "epoch": 0.97, "learning_rate": 8.666054276623703e-09, "loss": 0.731, "step": 51640 }, { "epoch": 0.97, "learning_rate": 8.653350132459271e-09, "loss": 1.0896, "step": 51641 }, { "epoch": 0.97, "learning_rate": 8.640655290906852e-09, "loss": 0.6906, "step": 51642 }, { "epoch": 0.97, "learning_rate": 8.627969752013631e-09, "loss": 1.0151, "step": 51643 }, { "epoch": 0.97, "learning_rate": 8.615293515827627e-09, "loss": 0.9775, "step": 51644 }, { "epoch": 0.97, "learning_rate": 8.602626582395468e-09, "loss": 0.8444, "step": 51645 }, { "epoch": 0.97, "learning_rate": 8.589968951764615e-09, "loss": 0.9639, "step": 51646 }, { "epoch": 0.97, "learning_rate": 8.577320623982533e-09, "loss": 0.8441, "step": 51647 }, { "epoch": 0.97, "learning_rate": 8.564681599096403e-09, "loss": 0.7206, "step": 51648 }, { "epoch": 0.97, "learning_rate": 8.552051877153134e-09, "loss": 0.8794, "step": 51649 }, { "epoch": 0.97, "learning_rate": 8.539431458200464e-09, "loss": 1.1954, "step": 51650 }, { "epoch": 0.97, "learning_rate": 8.526820342285024e-09, "loss": 1.0577, "step": 51651 }, { "epoch": 0.97, "learning_rate": 8.514218529453999e-09, "loss": 0.864, "step": 51652 }, { "epoch": 0.97, "learning_rate": 8.501626019754572e-09, "loss": 0.8456, "step": 51653 }, { "epoch": 0.97, "learning_rate": 8.489042813233372e-09, "loss": 1.0455, "step": 51654 }, { "epoch": 0.97, "learning_rate": 8.47646890993814e-09, "loss": 0.9082, "step": 51655 }, { "epoch": 0.97, "learning_rate": 8.46390430991495e-09, "loss": 1.2403, "step": 51656 }, { "epoch": 0.97, "learning_rate": 8.451349013211541e-09, "loss": 0.9303, "step": 51657 }, { "epoch": 0.97, "learning_rate": 8.438803019874264e-09, "loss": 1.0294, "step": 51658 }, { "epoch": 0.97, "learning_rate": 8.426266329950027e-09, "loss": 0.8452, "step": 51659 }, { "epoch": 0.97, "learning_rate": 8.413738943485738e-09, "loss": 0.9543, "step": 51660 }, { "epoch": 0.97, "learning_rate": 8.401220860528302e-09, "loss": 0.8065, "step": 51661 }, { "epoch": 0.97, "learning_rate": 8.388712081124073e-09, "loss": 0.9909, "step": 51662 }, { "epoch": 0.97, "learning_rate": 8.376212605320234e-09, "loss": 0.7983, "step": 51663 }, { "epoch": 0.97, "learning_rate": 8.363722433163135e-09, "loss": 0.7922, "step": 51664 }, { "epoch": 0.97, "learning_rate": 8.351241564699408e-09, "loss": 0.7979, "step": 51665 }, { "epoch": 0.97, "learning_rate": 8.33876999997596e-09, "loss": 0.8841, "step": 51666 }, { "epoch": 0.97, "learning_rate": 8.326307739038864e-09, "loss": 0.769, "step": 51667 }, { "epoch": 0.97, "learning_rate": 8.313854781935026e-09, "loss": 1.1218, "step": 51668 }, { "epoch": 0.97, "learning_rate": 8.301411128711078e-09, "loss": 1.0391, "step": 51669 }, { "epoch": 0.97, "learning_rate": 8.288976779413094e-09, "loss": 0.7253, "step": 51670 }, { "epoch": 0.97, "learning_rate": 8.2765517340877e-09, "loss": 0.9183, "step": 51671 }, { "epoch": 0.97, "learning_rate": 8.264135992781252e-09, "loss": 0.7814, "step": 51672 }, { "epoch": 0.97, "learning_rate": 8.2517295555401e-09, "loss": 0.794, "step": 51673 }, { "epoch": 0.97, "learning_rate": 8.239332422410595e-09, "loss": 0.9597, "step": 51674 }, { "epoch": 0.97, "learning_rate": 8.22694459343909e-09, "loss": 1.1002, "step": 51675 }, { "epoch": 0.97, "learning_rate": 8.21456606867166e-09, "loss": 0.8309, "step": 51676 }, { "epoch": 0.97, "learning_rate": 8.202196848154653e-09, "loss": 0.7491, "step": 51677 }, { "epoch": 0.98, "learning_rate": 8.189836931934424e-09, "loss": 0.9463, "step": 51678 }, { "epoch": 0.98, "learning_rate": 8.177486320056493e-09, "loss": 0.8709, "step": 51679 }, { "epoch": 0.98, "learning_rate": 8.165145012568044e-09, "loss": 0.9277, "step": 51680 }, { "epoch": 0.98, "learning_rate": 8.152813009514038e-09, "loss": 0.9347, "step": 51681 }, { "epoch": 0.98, "learning_rate": 8.140490310941384e-09, "loss": 0.9085, "step": 51682 }, { "epoch": 0.98, "learning_rate": 8.128176916895603e-09, "loss": 0.6016, "step": 51683 }, { "epoch": 0.98, "learning_rate": 8.115872827422767e-09, "loss": 0.9846, "step": 51684 }, { "epoch": 0.98, "learning_rate": 8.103578042568672e-09, "loss": 0.6703, "step": 51685 }, { "epoch": 0.98, "learning_rate": 8.091292562379672e-09, "loss": 0.9337, "step": 51686 }, { "epoch": 0.98, "learning_rate": 8.079016386901561e-09, "loss": 1.0945, "step": 51687 }, { "epoch": 0.98, "learning_rate": 8.066749516179583e-09, "loss": 1.142, "step": 51688 }, { "epoch": 0.98, "learning_rate": 8.05449195026009e-09, "loss": 0.9063, "step": 51689 }, { "epoch": 0.98, "learning_rate": 8.042243689188879e-09, "loss": 0.9599, "step": 51690 }, { "epoch": 0.98, "learning_rate": 8.030004733011464e-09, "loss": 0.6871, "step": 51691 }, { "epoch": 0.98, "learning_rate": 8.017775081773648e-09, "loss": 1.0269, "step": 51692 }, { "epoch": 0.98, "learning_rate": 8.005554735520948e-09, "loss": 1.2086, "step": 51693 }, { "epoch": 0.98, "learning_rate": 7.993343694298882e-09, "loss": 1.0586, "step": 51694 }, { "epoch": 0.98, "learning_rate": 7.981141958153526e-09, "loss": 0.7836, "step": 51695 }, { "epoch": 0.98, "learning_rate": 7.968949527130122e-09, "loss": 0.8892, "step": 51696 }, { "epoch": 0.98, "learning_rate": 7.956766401274463e-09, "loss": 0.8838, "step": 51697 }, { "epoch": 0.98, "learning_rate": 7.944592580631516e-09, "loss": 0.7684, "step": 51698 }, { "epoch": 0.98, "learning_rate": 7.932428065247355e-09, "loss": 0.9069, "step": 51699 }, { "epoch": 0.98, "learning_rate": 7.920272855166943e-09, "loss": 1.0275, "step": 51700 }, { "epoch": 0.98, "learning_rate": 7.908126950435802e-09, "loss": 0.9206, "step": 51701 }, { "epoch": 0.98, "learning_rate": 7.89599035109917e-09, "loss": 0.7689, "step": 51702 }, { "epoch": 0.98, "learning_rate": 7.883863057202845e-09, "loss": 0.9328, "step": 51703 }, { "epoch": 0.98, "learning_rate": 7.871745068791514e-09, "loss": 0.8092, "step": 51704 }, { "epoch": 0.98, "learning_rate": 7.859636385910696e-09, "loss": 0.857, "step": 51705 }, { "epoch": 0.98, "learning_rate": 7.847537008605633e-09, "loss": 1.0146, "step": 51706 }, { "epoch": 0.98, "learning_rate": 7.835446936921287e-09, "loss": 0.9753, "step": 51707 }, { "epoch": 0.98, "learning_rate": 7.82336617090318e-09, "loss": 0.9514, "step": 51708 }, { "epoch": 0.98, "learning_rate": 7.811294710596274e-09, "loss": 0.9303, "step": 51709 }, { "epoch": 0.98, "learning_rate": 7.799232556045256e-09, "loss": 0.8715, "step": 51710 }, { "epoch": 0.98, "learning_rate": 7.787179707295921e-09, "loss": 0.9573, "step": 51711 }, { "epoch": 0.98, "learning_rate": 7.775136164392405e-09, "loss": 1.1693, "step": 51712 }, { "epoch": 0.98, "learning_rate": 7.763101927380501e-09, "loss": 1.0144, "step": 51713 }, { "epoch": 0.98, "learning_rate": 7.751076996304618e-09, "loss": 1.001, "step": 51714 }, { "epoch": 0.98, "learning_rate": 7.739061371209721e-09, "loss": 0.9156, "step": 51715 }, { "epoch": 0.98, "learning_rate": 7.727055052140775e-09, "loss": 0.8209, "step": 51716 }, { "epoch": 0.98, "learning_rate": 7.715058039142743e-09, "loss": 0.8677, "step": 51717 }, { "epoch": 0.98, "learning_rate": 7.703070332260033e-09, "loss": 0.8187, "step": 51718 }, { "epoch": 0.98, "learning_rate": 7.691091931537886e-09, "loss": 0.94, "step": 51719 }, { "epoch": 0.98, "learning_rate": 7.679122837020713e-09, "loss": 0.8743, "step": 51720 }, { "epoch": 0.98, "learning_rate": 7.6671630487532e-09, "loss": 1.0702, "step": 51721 }, { "epoch": 0.98, "learning_rate": 7.655212566780034e-09, "loss": 0.9007, "step": 51722 }, { "epoch": 0.98, "learning_rate": 7.643271391145902e-09, "loss": 0.8517, "step": 51723 }, { "epoch": 0.98, "learning_rate": 7.631339521895487e-09, "loss": 0.9526, "step": 51724 }, { "epoch": 0.98, "learning_rate": 7.6194169590732e-09, "loss": 0.9691, "step": 51725 }, { "epoch": 0.98, "learning_rate": 7.60750370272345e-09, "loss": 0.7848, "step": 51726 }, { "epoch": 0.98, "learning_rate": 7.595599752891203e-09, "loss": 0.9701, "step": 51727 }, { "epoch": 0.98, "learning_rate": 7.58370510962031e-09, "loss": 0.798, "step": 51728 }, { "epoch": 0.98, "learning_rate": 7.571819772955458e-09, "loss": 1.1075, "step": 51729 }, { "epoch": 0.98, "learning_rate": 7.559943742941056e-09, "loss": 0.8358, "step": 51730 }, { "epoch": 0.98, "learning_rate": 7.548077019621236e-09, "loss": 1.0549, "step": 51731 }, { "epoch": 0.98, "learning_rate": 7.536219603040684e-09, "loss": 0.9642, "step": 51732 }, { "epoch": 0.98, "learning_rate": 7.524371493243532e-09, "loss": 0.777, "step": 51733 }, { "epoch": 0.98, "learning_rate": 7.51253269027391e-09, "loss": 1.0312, "step": 51734 }, { "epoch": 0.98, "learning_rate": 7.50070319417595e-09, "loss": 0.9705, "step": 51735 }, { "epoch": 0.98, "learning_rate": 7.488883004994062e-09, "loss": 0.7849, "step": 51736 }, { "epoch": 0.98, "learning_rate": 7.4770721227721e-09, "loss": 1.0005, "step": 51737 }, { "epoch": 0.98, "learning_rate": 7.46527054755447e-09, "loss": 1.0482, "step": 51738 }, { "epoch": 0.98, "learning_rate": 7.453478279385029e-09, "loss": 0.8985, "step": 51739 }, { "epoch": 0.98, "learning_rate": 7.441695318307907e-09, "loss": 0.6292, "step": 51740 }, { "epoch": 0.98, "learning_rate": 7.429921664366957e-09, "loss": 0.8797, "step": 51741 }, { "epoch": 0.98, "learning_rate": 7.418157317606311e-09, "loss": 0.7919, "step": 51742 }, { "epoch": 0.98, "learning_rate": 7.406402278070101e-09, "loss": 0.9049, "step": 51743 }, { "epoch": 0.98, "learning_rate": 7.3946565458016265e-09, "loss": 1.1408, "step": 51744 }, { "epoch": 0.98, "learning_rate": 7.382920120845294e-09, "loss": 0.7983, "step": 51745 }, { "epoch": 0.98, "learning_rate": 7.371193003244403e-09, "loss": 0.9417, "step": 51746 }, { "epoch": 0.98, "learning_rate": 7.359475193043364e-09, "loss": 0.9341, "step": 51747 }, { "epoch": 0.98, "learning_rate": 7.347766690285474e-09, "loss": 0.8096, "step": 51748 }, { "epoch": 0.98, "learning_rate": 7.336067495014587e-09, "loss": 0.9624, "step": 51749 }, { "epoch": 0.98, "learning_rate": 7.3243776072745575e-09, "loss": 1.0483, "step": 51750 }, { "epoch": 0.98, "learning_rate": 7.312697027108961e-09, "loss": 0.8505, "step": 51751 }, { "epoch": 0.98, "learning_rate": 7.30102575456082e-09, "loss": 0.8542, "step": 51752 }, { "epoch": 0.98, "learning_rate": 7.289363789674819e-09, "loss": 0.967, "step": 51753 }, { "epoch": 0.98, "learning_rate": 7.277711132493426e-09, "loss": 1.1717, "step": 51754 }, { "epoch": 0.98, "learning_rate": 7.266067783061048e-09, "loss": 0.8312, "step": 51755 }, { "epoch": 0.98, "learning_rate": 7.25443374142043e-09, "loss": 0.9538, "step": 51756 }, { "epoch": 0.98, "learning_rate": 7.242809007615425e-09, "loss": 1.0082, "step": 51757 }, { "epoch": 0.98, "learning_rate": 7.231193581689333e-09, "loss": 0.7732, "step": 51758 }, { "epoch": 0.98, "learning_rate": 7.219587463685451e-09, "loss": 0.8701, "step": 51759 }, { "epoch": 0.98, "learning_rate": 7.207990653647356e-09, "loss": 0.7253, "step": 51760 }, { "epoch": 0.98, "learning_rate": 7.19640315161807e-09, "loss": 0.9833, "step": 51761 }, { "epoch": 0.98, "learning_rate": 7.184824957641168e-09, "loss": 1.1089, "step": 51762 }, { "epoch": 0.98, "learning_rate": 7.1732560717593935e-09, "loss": 1.0981, "step": 51763 }, { "epoch": 0.98, "learning_rate": 7.161696494016601e-09, "loss": 0.9042, "step": 51764 }, { "epoch": 0.98, "learning_rate": 7.150146224455256e-09, "loss": 0.7947, "step": 51765 }, { "epoch": 0.98, "learning_rate": 7.138605263119214e-09, "loss": 0.8934, "step": 51766 }, { "epoch": 0.98, "learning_rate": 7.127073610050939e-09, "loss": 0.7965, "step": 51767 }, { "epoch": 0.98, "learning_rate": 7.11555126529373e-09, "loss": 1.0005, "step": 51768 }, { "epoch": 0.98, "learning_rate": 7.104038228890608e-09, "loss": 1.0507, "step": 51769 }, { "epoch": 0.98, "learning_rate": 7.092534500884596e-09, "loss": 0.8709, "step": 51770 }, { "epoch": 0.98, "learning_rate": 7.081040081318713e-09, "loss": 0.9547, "step": 51771 }, { "epoch": 0.98, "learning_rate": 7.069554970235703e-09, "loss": 0.8285, "step": 51772 }, { "epoch": 0.98, "learning_rate": 7.058079167678589e-09, "loss": 0.9448, "step": 51773 }, { "epoch": 0.98, "learning_rate": 7.046612673690112e-09, "loss": 0.9981, "step": 51774 }, { "epoch": 0.98, "learning_rate": 7.035155488313294e-09, "loss": 0.9822, "step": 51775 }, { "epoch": 0.98, "learning_rate": 7.023707611590602e-09, "loss": 1.0284, "step": 51776 }, { "epoch": 0.98, "learning_rate": 7.012269043565057e-09, "loss": 0.8568, "step": 51777 }, { "epoch": 0.98, "learning_rate": 7.0008397842791234e-09, "loss": 0.7361, "step": 51778 }, { "epoch": 0.98, "learning_rate": 6.989419833775824e-09, "loss": 0.9528, "step": 51779 }, { "epoch": 0.98, "learning_rate": 6.978009192097346e-09, "loss": 0.963, "step": 51780 }, { "epoch": 0.98, "learning_rate": 6.966607859286989e-09, "loss": 0.8947, "step": 51781 }, { "epoch": 0.98, "learning_rate": 6.9552158353863865e-09, "loss": 0.9025, "step": 51782 }, { "epoch": 0.98, "learning_rate": 6.943833120438836e-09, "loss": 0.8012, "step": 51783 }, { "epoch": 0.98, "learning_rate": 6.932459714486528e-09, "loss": 0.84, "step": 51784 }, { "epoch": 0.98, "learning_rate": 6.921095617571927e-09, "loss": 0.651, "step": 51785 }, { "epoch": 0.98, "learning_rate": 6.909740829737499e-09, "loss": 1.0751, "step": 51786 }, { "epoch": 0.98, "learning_rate": 6.898395351025711e-09, "loss": 1.2193, "step": 51787 }, { "epoch": 0.98, "learning_rate": 6.88705918147875e-09, "loss": 0.8895, "step": 51788 }, { "epoch": 0.98, "learning_rate": 6.875732321139083e-09, "loss": 0.9196, "step": 51789 }, { "epoch": 0.98, "learning_rate": 6.864414770049177e-09, "loss": 0.8356, "step": 51790 }, { "epoch": 0.98, "learning_rate": 6.853106528250941e-09, "loss": 0.7839, "step": 51791 }, { "epoch": 0.98, "learning_rate": 6.8418075957868424e-09, "loss": 1.0373, "step": 51792 }, { "epoch": 0.98, "learning_rate": 6.830517972699069e-09, "loss": 1.1517, "step": 51793 }, { "epoch": 0.98, "learning_rate": 6.819237659029532e-09, "loss": 1.1656, "step": 51794 }, { "epoch": 0.98, "learning_rate": 6.807966654820697e-09, "loss": 0.816, "step": 51795 }, { "epoch": 0.98, "learning_rate": 6.796704960114475e-09, "loss": 1.0007, "step": 51796 }, { "epoch": 0.98, "learning_rate": 6.785452574952778e-09, "loss": 0.7677, "step": 51797 }, { "epoch": 0.98, "learning_rate": 6.774209499377793e-09, "loss": 0.762, "step": 51798 }, { "epoch": 0.98, "learning_rate": 6.762975733431431e-09, "loss": 1.0377, "step": 51799 }, { "epoch": 0.98, "learning_rate": 6.751751277155605e-09, "loss": 0.8217, "step": 51800 }, { "epoch": 0.98, "learning_rate": 6.740536130592501e-09, "loss": 0.758, "step": 51801 }, { "epoch": 0.98, "learning_rate": 6.729330293783753e-09, "loss": 0.8376, "step": 51802 }, { "epoch": 0.98, "learning_rate": 6.718133766770996e-09, "loss": 0.7092, "step": 51803 }, { "epoch": 0.98, "learning_rate": 6.706946549596694e-09, "loss": 1.0306, "step": 51804 }, { "epoch": 0.98, "learning_rate": 6.6957686423019254e-09, "loss": 0.8854, "step": 51805 }, { "epoch": 0.98, "learning_rate": 6.684600044928602e-09, "loss": 1.0195, "step": 51806 }, { "epoch": 0.98, "learning_rate": 6.673440757518912e-09, "loss": 1.0825, "step": 51807 }, { "epoch": 0.98, "learning_rate": 6.662290780113933e-09, "loss": 0.9412, "step": 51808 }, { "epoch": 0.98, "learning_rate": 6.6511501127553006e-09, "loss": 0.921, "step": 51809 }, { "epoch": 0.98, "learning_rate": 6.6400187554852005e-09, "loss": 0.9688, "step": 51810 }, { "epoch": 0.98, "learning_rate": 6.628896708344712e-09, "loss": 0.679, "step": 51811 }, { "epoch": 0.98, "learning_rate": 6.6177839713751915e-09, "loss": 1.1987, "step": 51812 }, { "epoch": 0.98, "learning_rate": 6.606680544618826e-09, "loss": 1.0435, "step": 51813 }, { "epoch": 0.98, "learning_rate": 6.595586428116419e-09, "loss": 0.9075, "step": 51814 }, { "epoch": 0.98, "learning_rate": 6.5845016219096006e-09, "loss": 0.8682, "step": 51815 }, { "epoch": 0.98, "learning_rate": 6.573426126040006e-09, "loss": 0.8545, "step": 51816 }, { "epoch": 0.98, "learning_rate": 6.562359940548713e-09, "loss": 0.8802, "step": 51817 }, { "epoch": 0.98, "learning_rate": 6.551303065477077e-09, "loss": 0.9047, "step": 51818 }, { "epoch": 0.98, "learning_rate": 6.540255500866455e-09, "loss": 1.0719, "step": 51819 }, { "epoch": 0.98, "learning_rate": 6.529217246757924e-09, "loss": 0.7355, "step": 51820 }, { "epoch": 0.98, "learning_rate": 6.518188303193118e-09, "loss": 0.8142, "step": 51821 }, { "epoch": 0.98, "learning_rate": 6.507168670212838e-09, "loss": 0.7576, "step": 51822 }, { "epoch": 0.98, "learning_rate": 6.496158347858161e-09, "loss": 1.1407, "step": 51823 }, { "epoch": 0.98, "learning_rate": 6.485157336170445e-09, "loss": 1.0701, "step": 51824 }, { "epoch": 0.98, "learning_rate": 6.474165635191043e-09, "loss": 1.0286, "step": 51825 }, { "epoch": 0.98, "learning_rate": 6.463183244960203e-09, "loss": 1.0771, "step": 51826 }, { "epoch": 0.98, "learning_rate": 6.4522101655195565e-09, "loss": 0.6529, "step": 51827 }, { "epoch": 0.98, "learning_rate": 6.441246396909906e-09, "loss": 0.9985, "step": 51828 }, { "epoch": 0.98, "learning_rate": 6.430291939172328e-09, "loss": 0.8984, "step": 51829 }, { "epoch": 0.98, "learning_rate": 6.419346792347348e-09, "loss": 1.0693, "step": 51830 }, { "epoch": 0.98, "learning_rate": 6.4084109564763185e-09, "loss": 1.1369, "step": 51831 }, { "epoch": 0.98, "learning_rate": 6.397484431599765e-09, "loss": 0.9427, "step": 51832 }, { "epoch": 0.98, "learning_rate": 6.386567217758211e-09, "loss": 0.9491, "step": 51833 }, { "epoch": 0.98, "learning_rate": 6.37565931499301e-09, "loss": 0.9037, "step": 51834 }, { "epoch": 0.98, "learning_rate": 6.364760723344687e-09, "loss": 0.8297, "step": 51835 }, { "epoch": 0.98, "learning_rate": 6.353871442853765e-09, "loss": 0.8495, "step": 51836 }, { "epoch": 0.98, "learning_rate": 6.3429914735613215e-09, "loss": 0.9771, "step": 51837 }, { "epoch": 0.98, "learning_rate": 6.332120815507326e-09, "loss": 1.032, "step": 51838 }, { "epoch": 0.98, "learning_rate": 6.321259468732854e-09, "loss": 0.9111, "step": 51839 }, { "epoch": 0.98, "learning_rate": 6.310407433278431e-09, "loss": 0.8909, "step": 51840 }, { "epoch": 0.98, "learning_rate": 6.2995647091845804e-09, "loss": 0.9473, "step": 51841 }, { "epoch": 0.98, "learning_rate": 6.288731296491546e-09, "loss": 1.0019, "step": 51842 }, { "epoch": 0.98, "learning_rate": 6.277907195239852e-09, "loss": 1.0582, "step": 51843 }, { "epoch": 0.98, "learning_rate": 6.267092405470021e-09, "loss": 0.9592, "step": 51844 }, { "epoch": 0.98, "learning_rate": 6.256286927222577e-09, "loss": 0.8202, "step": 51845 }, { "epoch": 0.98, "learning_rate": 6.245490760537487e-09, "loss": 0.7587, "step": 51846 }, { "epoch": 0.98, "learning_rate": 6.234703905455552e-09, "loss": 0.8606, "step": 51847 }, { "epoch": 0.98, "learning_rate": 6.223926362016463e-09, "loss": 0.7496, "step": 51848 }, { "epoch": 0.98, "learning_rate": 6.213158130261021e-09, "loss": 0.9593, "step": 51849 }, { "epoch": 0.98, "learning_rate": 6.202399210228915e-09, "loss": 0.8775, "step": 51850 }, { "epoch": 0.98, "learning_rate": 6.19164960196067e-09, "loss": 0.8988, "step": 51851 }, { "epoch": 0.98, "learning_rate": 6.18090930549653e-09, "loss": 0.7994, "step": 51852 }, { "epoch": 0.98, "learning_rate": 6.1701783208764635e-09, "loss": 0.9413, "step": 51853 }, { "epoch": 0.98, "learning_rate": 6.15945664814016e-09, "loss": 0.8139, "step": 51854 }, { "epoch": 0.98, "learning_rate": 6.148744287328145e-09, "loss": 1.2017, "step": 51855 }, { "epoch": 0.98, "learning_rate": 6.138041238480386e-09, "loss": 0.7643, "step": 51856 }, { "epoch": 0.98, "learning_rate": 6.127347501636294e-09, "loss": 0.8714, "step": 51857 }, { "epoch": 0.98, "learning_rate": 6.116663076836671e-09, "loss": 0.8143, "step": 51858 }, { "epoch": 0.98, "learning_rate": 6.10598796412093e-09, "loss": 0.9749, "step": 51859 }, { "epoch": 0.98, "learning_rate": 6.095322163528761e-09, "loss": 0.8033, "step": 51860 }, { "epoch": 0.98, "learning_rate": 6.084665675100132e-09, "loss": 0.8422, "step": 51861 }, { "epoch": 0.98, "learning_rate": 6.0740184988752896e-09, "loss": 0.9324, "step": 51862 }, { "epoch": 0.98, "learning_rate": 6.0633806348930905e-09, "loss": 0.8927, "step": 51863 }, { "epoch": 0.98, "learning_rate": 6.052752083194058e-09, "loss": 1.0126, "step": 51864 }, { "epoch": 0.98, "learning_rate": 6.0421328438176056e-09, "loss": 0.9209, "step": 51865 }, { "epoch": 0.98, "learning_rate": 6.031522916803423e-09, "loss": 0.8134, "step": 51866 }, { "epoch": 0.98, "learning_rate": 6.020922302190923e-09, "loss": 0.7332, "step": 51867 }, { "epoch": 0.98, "learning_rate": 6.010331000019798e-09, "loss": 1.0529, "step": 51868 }, { "epoch": 0.98, "learning_rate": 5.9997490103297365e-09, "loss": 0.9291, "step": 51869 }, { "epoch": 0.98, "learning_rate": 5.989176333160152e-09, "loss": 0.8413, "step": 51870 }, { "epoch": 0.98, "learning_rate": 5.978612968550457e-09, "loss": 0.8386, "step": 51871 }, { "epoch": 0.98, "learning_rate": 5.968058916540065e-09, "loss": 0.9641, "step": 51872 }, { "epoch": 0.98, "learning_rate": 5.957514177168666e-09, "loss": 0.8058, "step": 51873 }, { "epoch": 0.98, "learning_rate": 5.9469787504753965e-09, "loss": 1.0711, "step": 51874 }, { "epoch": 0.98, "learning_rate": 5.9364526364993906e-09, "loss": 0.9321, "step": 51875 }, { "epoch": 0.98, "learning_rate": 5.925935835280339e-09, "loss": 0.7914, "step": 51876 }, { "epoch": 0.98, "learning_rate": 5.915428346857655e-09, "loss": 0.9745, "step": 51877 }, { "epoch": 0.98, "learning_rate": 5.904930171269918e-09, "loss": 1.0366, "step": 51878 }, { "epoch": 0.98, "learning_rate": 5.89444130855682e-09, "loss": 0.7705, "step": 51879 }, { "epoch": 0.98, "learning_rate": 5.8839617587574945e-09, "loss": 1.0629, "step": 51880 }, { "epoch": 0.98, "learning_rate": 5.873491521910801e-09, "loss": 0.9954, "step": 51881 }, { "epoch": 0.98, "learning_rate": 5.863030598056152e-09, "loss": 0.6349, "step": 51882 }, { "epoch": 0.98, "learning_rate": 5.8525789872324045e-09, "loss": 1.0125, "step": 51883 }, { "epoch": 0.98, "learning_rate": 5.8421366894786944e-09, "loss": 1.0801, "step": 51884 }, { "epoch": 0.98, "learning_rate": 5.831703704834157e-09, "loss": 0.6843, "step": 51885 }, { "epoch": 0.98, "learning_rate": 5.8212800333373734e-09, "loss": 0.9103, "step": 51886 }, { "epoch": 0.98, "learning_rate": 5.810865675027477e-09, "loss": 0.8376, "step": 51887 }, { "epoch": 0.98, "learning_rate": 5.800460629943327e-09, "loss": 0.7637, "step": 51888 }, { "epoch": 0.98, "learning_rate": 5.7900648981237816e-09, "loss": 0.9132, "step": 51889 }, { "epoch": 0.98, "learning_rate": 5.779678479607698e-09, "loss": 0.8642, "step": 51890 }, { "epoch": 0.98, "learning_rate": 5.769301374433656e-09, "loss": 0.9393, "step": 51891 }, { "epoch": 0.98, "learning_rate": 5.758933582640791e-09, "loss": 0.9419, "step": 51892 }, { "epoch": 0.98, "learning_rate": 5.748575104267684e-09, "loss": 0.925, "step": 51893 }, { "epoch": 0.98, "learning_rate": 5.738225939352638e-09, "loss": 1.1216, "step": 51894 }, { "epoch": 0.98, "learning_rate": 5.727886087934787e-09, "loss": 1.0323, "step": 51895 }, { "epoch": 0.98, "learning_rate": 5.717555550052433e-09, "loss": 1.0085, "step": 51896 }, { "epoch": 0.98, "learning_rate": 5.70723432574416e-09, "loss": 0.825, "step": 51897 }, { "epoch": 0.98, "learning_rate": 5.696922415048822e-09, "loss": 0.8642, "step": 51898 }, { "epoch": 0.98, "learning_rate": 5.686619818004447e-09, "loss": 1.0507, "step": 51899 }, { "epoch": 0.98, "learning_rate": 5.67632653464989e-09, "loss": 1.1926, "step": 51900 }, { "epoch": 0.98, "learning_rate": 5.666042565023455e-09, "loss": 0.798, "step": 51901 }, { "epoch": 0.98, "learning_rate": 5.6557679091634456e-09, "loss": 0.7504, "step": 51902 }, { "epoch": 0.98, "learning_rate": 5.645502567108441e-09, "loss": 0.9957, "step": 51903 }, { "epoch": 0.98, "learning_rate": 5.6352465388964665e-09, "loss": 0.807, "step": 51904 }, { "epoch": 0.98, "learning_rate": 5.62499982456638e-09, "loss": 1.0701, "step": 51905 }, { "epoch": 0.98, "learning_rate": 5.6147624241556505e-09, "loss": 1.0092, "step": 51906 }, { "epoch": 0.98, "learning_rate": 5.604534337703138e-09, "loss": 0.6339, "step": 51907 }, { "epoch": 0.98, "learning_rate": 5.594315565246866e-09, "loss": 1.007, "step": 51908 }, { "epoch": 0.98, "learning_rate": 5.58410610682486e-09, "loss": 0.8772, "step": 51909 }, { "epoch": 0.98, "learning_rate": 5.573905962475146e-09, "loss": 0.7677, "step": 51910 }, { "epoch": 0.98, "learning_rate": 5.5637151322363025e-09, "loss": 0.7227, "step": 51911 }, { "epoch": 0.98, "learning_rate": 5.553533616145801e-09, "loss": 0.9031, "step": 51912 }, { "epoch": 0.98, "learning_rate": 5.543361414242221e-09, "loss": 1.1533, "step": 51913 }, { "epoch": 0.98, "learning_rate": 5.533198526563033e-09, "loss": 0.9319, "step": 51914 }, { "epoch": 0.98, "learning_rate": 5.523044953146261e-09, "loss": 0.704, "step": 51915 }, { "epoch": 0.98, "learning_rate": 5.51290069403021e-09, "loss": 0.7258, "step": 51916 }, { "epoch": 0.98, "learning_rate": 5.502765749252348e-09, "loss": 0.9052, "step": 51917 }, { "epoch": 0.98, "learning_rate": 5.4926401188507e-09, "loss": 1.2533, "step": 51918 }, { "epoch": 0.98, "learning_rate": 5.482523802863293e-09, "loss": 0.7532, "step": 51919 }, { "epoch": 0.98, "learning_rate": 5.472416801327318e-09, "loss": 0.7673, "step": 51920 }, { "epoch": 0.98, "learning_rate": 5.462319114281078e-09, "loss": 0.7617, "step": 51921 }, { "epoch": 0.98, "learning_rate": 5.4522307417620435e-09, "loss": 0.9457, "step": 51922 }, { "epoch": 0.98, "learning_rate": 5.4421516838076835e-09, "loss": 0.8263, "step": 51923 }, { "epoch": 0.98, "learning_rate": 5.432081940456024e-09, "loss": 0.9988, "step": 51924 }, { "epoch": 0.98, "learning_rate": 5.422021511744535e-09, "loss": 1.1459, "step": 51925 }, { "epoch": 0.98, "learning_rate": 5.411970397710686e-09, "loss": 0.9391, "step": 51926 }, { "epoch": 0.98, "learning_rate": 5.401928598391948e-09, "loss": 0.866, "step": 51927 }, { "epoch": 0.98, "learning_rate": 5.391896113826067e-09, "loss": 0.7877, "step": 51928 }, { "epoch": 0.98, "learning_rate": 5.381872944050237e-09, "loss": 0.8477, "step": 51929 }, { "epoch": 0.98, "learning_rate": 5.3718590891019275e-09, "loss": 1.0847, "step": 51930 }, { "epoch": 0.98, "learning_rate": 5.3618545490188855e-09, "loss": 0.988, "step": 51931 }, { "epoch": 0.98, "learning_rate": 5.351859323838027e-09, "loss": 1.0472, "step": 51932 }, { "epoch": 0.98, "learning_rate": 5.341873413596821e-09, "loss": 0.9019, "step": 51933 }, { "epoch": 0.98, "learning_rate": 5.33189681833246e-09, "loss": 0.902, "step": 51934 }, { "epoch": 0.98, "learning_rate": 5.3219295380824155e-09, "loss": 0.9128, "step": 51935 }, { "epoch": 0.98, "learning_rate": 5.311971572883878e-09, "loss": 0.9336, "step": 51936 }, { "epoch": 0.98, "learning_rate": 5.302022922774042e-09, "loss": 0.9407, "step": 51937 }, { "epoch": 0.98, "learning_rate": 5.29208358778982e-09, "loss": 1.0059, "step": 51938 }, { "epoch": 0.98, "learning_rate": 5.282153567968407e-09, "loss": 0.9769, "step": 51939 }, { "epoch": 0.98, "learning_rate": 5.272232863346993e-09, "loss": 0.969, "step": 51940 }, { "epoch": 0.98, "learning_rate": 5.262321473962495e-09, "loss": 1.0629, "step": 51941 }, { "epoch": 0.98, "learning_rate": 5.252419399852104e-09, "loss": 0.8496, "step": 51942 }, { "epoch": 0.98, "learning_rate": 5.242526641052736e-09, "loss": 0.9456, "step": 51943 }, { "epoch": 0.98, "learning_rate": 5.232643197601306e-09, "loss": 1.1373, "step": 51944 }, { "epoch": 0.98, "learning_rate": 5.22276906953445e-09, "loss": 0.774, "step": 51945 }, { "epoch": 0.98, "learning_rate": 5.21290425688964e-09, "loss": 0.9403, "step": 51946 }, { "epoch": 0.98, "learning_rate": 5.203048759702955e-09, "loss": 0.8465, "step": 51947 }, { "epoch": 0.98, "learning_rate": 5.193202578011869e-09, "loss": 0.7548, "step": 51948 }, { "epoch": 0.98, "learning_rate": 5.183365711853017e-09, "loss": 0.7964, "step": 51949 }, { "epoch": 0.98, "learning_rate": 5.1735381612624815e-09, "loss": 1.0983, "step": 51950 }, { "epoch": 0.98, "learning_rate": 5.16371992627801e-09, "loss": 0.7992, "step": 51951 }, { "epoch": 0.98, "learning_rate": 5.153911006935408e-09, "loss": 0.7181, "step": 51952 }, { "epoch": 0.98, "learning_rate": 5.14411140327159e-09, "loss": 0.8622, "step": 51953 }, { "epoch": 0.98, "learning_rate": 5.134321115323193e-09, "loss": 0.7617, "step": 51954 }, { "epoch": 0.98, "learning_rate": 5.124540143126855e-09, "loss": 0.7779, "step": 51955 }, { "epoch": 0.98, "learning_rate": 5.114768486718935e-09, "loss": 1.2148, "step": 51956 }, { "epoch": 0.98, "learning_rate": 5.105006146135794e-09, "loss": 0.85, "step": 51957 }, { "epoch": 0.98, "learning_rate": 5.095253121414345e-09, "loss": 0.7599, "step": 51958 }, { "epoch": 0.98, "learning_rate": 5.085509412590672e-09, "loss": 0.7328, "step": 51959 }, { "epoch": 0.98, "learning_rate": 5.075775019701135e-09, "loss": 0.8635, "step": 51960 }, { "epoch": 0.98, "learning_rate": 5.066049942782092e-09, "loss": 0.8534, "step": 51961 }, { "epoch": 0.98, "learning_rate": 5.056334181869904e-09, "loss": 1.057, "step": 51962 }, { "epoch": 0.98, "learning_rate": 5.046627737001208e-09, "loss": 0.8533, "step": 51963 }, { "epoch": 0.98, "learning_rate": 5.036930608211532e-09, "loss": 0.9775, "step": 51964 }, { "epoch": 0.98, "learning_rate": 5.0272427955375126e-09, "loss": 0.9077, "step": 51965 }, { "epoch": 0.98, "learning_rate": 5.017564299015509e-09, "loss": 0.9068, "step": 51966 }, { "epoch": 0.98, "learning_rate": 5.00789511868105e-09, "loss": 0.9351, "step": 51967 }, { "epoch": 0.98, "learning_rate": 4.998235254571049e-09, "loss": 0.9485, "step": 51968 }, { "epoch": 0.98, "learning_rate": 4.988584706720756e-09, "loss": 0.9574, "step": 51969 }, { "epoch": 0.98, "learning_rate": 4.9789434751668085e-09, "loss": 0.7997, "step": 51970 }, { "epoch": 0.98, "learning_rate": 4.969311559945011e-09, "loss": 0.9691, "step": 51971 }, { "epoch": 0.98, "learning_rate": 4.959688961091169e-09, "loss": 0.9264, "step": 51972 }, { "epoch": 0.98, "learning_rate": 4.950075678641364e-09, "loss": 0.764, "step": 51973 }, { "epoch": 0.98, "learning_rate": 4.940471712631401e-09, "loss": 0.976, "step": 51974 }, { "epoch": 0.98, "learning_rate": 4.930877063097361e-09, "loss": 1.2114, "step": 51975 }, { "epoch": 0.98, "learning_rate": 4.921291730075051e-09, "loss": 0.7213, "step": 51976 }, { "epoch": 0.98, "learning_rate": 4.911715713599996e-09, "loss": 0.8552, "step": 51977 }, { "epoch": 0.98, "learning_rate": 4.902149013708002e-09, "loss": 0.8531, "step": 51978 }, { "epoch": 0.98, "learning_rate": 4.892591630434873e-09, "loss": 0.7619, "step": 51979 }, { "epoch": 0.98, "learning_rate": 4.883043563816414e-09, "loss": 1.0994, "step": 51980 }, { "epoch": 0.98, "learning_rate": 4.873504813888153e-09, "loss": 1.1418, "step": 51981 }, { "epoch": 0.98, "learning_rate": 4.863975380685893e-09, "loss": 0.8197, "step": 51982 }, { "epoch": 0.98, "learning_rate": 4.854455264244606e-09, "loss": 0.8737, "step": 51983 }, { "epoch": 0.98, "learning_rate": 4.844944464600654e-09, "loss": 0.87, "step": 51984 }, { "epoch": 0.98, "learning_rate": 4.835442981789007e-09, "loss": 1.0495, "step": 51985 }, { "epoch": 0.98, "learning_rate": 4.825950815845471e-09, "loss": 0.7194, "step": 51986 }, { "epoch": 0.98, "learning_rate": 4.8164679668052935e-09, "loss": 1.0685, "step": 51987 }, { "epoch": 0.98, "learning_rate": 4.806994434703727e-09, "loss": 0.8738, "step": 51988 }, { "epoch": 0.98, "learning_rate": 4.7975302195765735e-09, "loss": 0.7801, "step": 51989 }, { "epoch": 0.98, "learning_rate": 4.7880753214588076e-09, "loss": 0.8792, "step": 51990 }, { "epoch": 0.98, "learning_rate": 4.778629740385954e-09, "loss": 0.7711, "step": 51991 }, { "epoch": 0.98, "learning_rate": 4.769193476392986e-09, "loss": 1.1742, "step": 51992 }, { "epoch": 0.98, "learning_rate": 4.759766529515431e-09, "loss": 1.2394, "step": 51993 }, { "epoch": 0.98, "learning_rate": 4.750348899788537e-09, "loss": 1.0898, "step": 51994 }, { "epoch": 0.98, "learning_rate": 4.740940587247278e-09, "loss": 1.0082, "step": 51995 }, { "epoch": 0.98, "learning_rate": 4.7315415919269026e-09, "loss": 0.8114, "step": 51996 }, { "epoch": 0.98, "learning_rate": 4.722151913862105e-09, "loss": 0.9477, "step": 51997 }, { "epoch": 0.98, "learning_rate": 4.7127715530886905e-09, "loss": 0.9787, "step": 51998 }, { "epoch": 0.98, "learning_rate": 4.7034005096410765e-09, "loss": 0.9977, "step": 51999 }, { "epoch": 0.98, "learning_rate": 4.694038783554511e-09, "loss": 1.2095, "step": 52000 }, { "epoch": 0.98, "learning_rate": 4.684686374863967e-09, "loss": 0.9941, "step": 52001 }, { "epoch": 0.98, "learning_rate": 4.675343283604139e-09, "loss": 0.8964, "step": 52002 }, { "epoch": 0.98, "learning_rate": 4.666009509810277e-09, "loss": 1.0204, "step": 52003 }, { "epoch": 0.98, "learning_rate": 4.656685053516796e-09, "loss": 0.7324, "step": 52004 }, { "epoch": 0.98, "learning_rate": 4.6473699147589476e-09, "loss": 0.9568, "step": 52005 }, { "epoch": 0.98, "learning_rate": 4.638064093571149e-09, "loss": 1.1339, "step": 52006 }, { "epoch": 0.98, "learning_rate": 4.62876758998837e-09, "loss": 0.7675, "step": 52007 }, { "epoch": 0.98, "learning_rate": 4.619480404045307e-09, "loss": 0.9309, "step": 52008 }, { "epoch": 0.98, "learning_rate": 4.610202535776376e-09, "loss": 0.8899, "step": 52009 }, { "epoch": 0.98, "learning_rate": 4.600933985216826e-09, "loss": 0.8069, "step": 52010 }, { "epoch": 0.98, "learning_rate": 4.5916747524005216e-09, "loss": 0.8157, "step": 52011 }, { "epoch": 0.98, "learning_rate": 4.582424837362709e-09, "loss": 1.0092, "step": 52012 }, { "epoch": 0.98, "learning_rate": 4.5731842401372516e-09, "loss": 0.902, "step": 52013 }, { "epoch": 0.98, "learning_rate": 4.563952960759399e-09, "loss": 0.8026, "step": 52014 }, { "epoch": 0.98, "learning_rate": 4.554730999263013e-09, "loss": 0.8928, "step": 52015 }, { "epoch": 0.98, "learning_rate": 4.545518355682787e-09, "loss": 0.9621, "step": 52016 }, { "epoch": 0.98, "learning_rate": 4.5363150300528625e-09, "loss": 0.7252, "step": 52017 }, { "epoch": 0.98, "learning_rate": 4.52712102240821e-09, "loss": 1.0201, "step": 52018 }, { "epoch": 0.98, "learning_rate": 4.517936332782691e-09, "loss": 0.9308, "step": 52019 }, { "epoch": 0.98, "learning_rate": 4.5087609612104454e-09, "loss": 0.916, "step": 52020 }, { "epoch": 0.98, "learning_rate": 4.499594907726168e-09, "loss": 0.7253, "step": 52021 }, { "epoch": 0.98, "learning_rate": 4.49043817236372e-09, "loss": 0.7437, "step": 52022 }, { "epoch": 0.98, "learning_rate": 4.481290755157519e-09, "loss": 0.7031, "step": 52023 }, { "epoch": 0.98, "learning_rate": 4.472152656141982e-09, "loss": 0.9708, "step": 52024 }, { "epoch": 0.98, "learning_rate": 4.463023875350691e-09, "loss": 0.9199, "step": 52025 }, { "epoch": 0.98, "learning_rate": 4.453904412817789e-09, "loss": 0.9669, "step": 52026 }, { "epoch": 0.98, "learning_rate": 4.44479426857769e-09, "loss": 0.9535, "step": 52027 }, { "epoch": 0.98, "learning_rate": 4.43569344266398e-09, "loss": 0.9117, "step": 52028 }, { "epoch": 0.98, "learning_rate": 4.426601935111074e-09, "loss": 0.8307, "step": 52029 }, { "epoch": 0.98, "learning_rate": 4.417519745952836e-09, "loss": 0.6797, "step": 52030 }, { "epoch": 0.98, "learning_rate": 4.408446875222849e-09, "loss": 1.0439, "step": 52031 }, { "epoch": 0.98, "learning_rate": 4.399383322955253e-09, "loss": 0.8945, "step": 52032 }, { "epoch": 0.98, "learning_rate": 4.390329089183909e-09, "loss": 0.9885, "step": 52033 }, { "epoch": 0.98, "learning_rate": 4.381284173942401e-09, "loss": 0.8026, "step": 52034 }, { "epoch": 0.98, "learning_rate": 4.372248577264871e-09, "loss": 0.6887, "step": 52035 }, { "epoch": 0.98, "learning_rate": 4.363222299184899e-09, "loss": 0.6251, "step": 52036 }, { "epoch": 0.98, "learning_rate": 4.354205339735795e-09, "loss": 0.9711, "step": 52037 }, { "epoch": 0.98, "learning_rate": 4.345197698951698e-09, "loss": 1.022, "step": 52038 }, { "epoch": 0.98, "learning_rate": 4.33619937686619e-09, "loss": 0.9113, "step": 52039 }, { "epoch": 0.98, "learning_rate": 4.3272103735128576e-09, "loss": 0.8647, "step": 52040 }, { "epoch": 0.98, "learning_rate": 4.318230688925284e-09, "loss": 0.8734, "step": 52041 }, { "epoch": 0.98, "learning_rate": 4.309260323136777e-09, "loss": 1.0129, "step": 52042 }, { "epoch": 0.98, "learning_rate": 4.300299276180919e-09, "loss": 0.7592, "step": 52043 }, { "epoch": 0.98, "learning_rate": 4.291347548091019e-09, "loss": 0.8188, "step": 52044 }, { "epoch": 0.98, "learning_rate": 4.282405138901213e-09, "loss": 0.8395, "step": 52045 }, { "epoch": 0.98, "learning_rate": 4.273472048643978e-09, "loss": 0.8671, "step": 52046 }, { "epoch": 0.98, "learning_rate": 4.264548277353176e-09, "loss": 0.9803, "step": 52047 }, { "epoch": 0.98, "learning_rate": 4.255633825062111e-09, "loss": 0.7848, "step": 52048 }, { "epoch": 0.98, "learning_rate": 4.246728691804092e-09, "loss": 0.879, "step": 52049 }, { "epoch": 0.98, "learning_rate": 4.237832877612147e-09, "loss": 1.0956, "step": 52050 }, { "epoch": 0.98, "learning_rate": 4.228946382519583e-09, "loss": 1.0495, "step": 52051 }, { "epoch": 0.98, "learning_rate": 4.220069206559707e-09, "loss": 0.8218, "step": 52052 }, { "epoch": 0.98, "learning_rate": 4.21120134976527e-09, "loss": 0.8096, "step": 52053 }, { "epoch": 0.98, "learning_rate": 4.202342812169857e-09, "loss": 0.9294, "step": 52054 }, { "epoch": 0.98, "learning_rate": 4.193493593806497e-09, "loss": 1.0366, "step": 52055 }, { "epoch": 0.98, "learning_rate": 4.184653694707941e-09, "loss": 0.9601, "step": 52056 }, { "epoch": 0.98, "learning_rate": 4.175823114907496e-09, "loss": 1.0031, "step": 52057 }, { "epoch": 0.98, "learning_rate": 4.167001854437913e-09, "loss": 0.9217, "step": 52058 }, { "epoch": 0.98, "learning_rate": 4.1581899133325e-09, "loss": 0.9871, "step": 52059 }, { "epoch": 0.98, "learning_rate": 4.149387291623452e-09, "loss": 0.7134, "step": 52060 }, { "epoch": 0.98, "learning_rate": 4.1405939893443546e-09, "loss": 0.6971, "step": 52061 }, { "epoch": 0.98, "learning_rate": 4.131810006527681e-09, "loss": 1.0806, "step": 52062 }, { "epoch": 0.98, "learning_rate": 4.123035343206183e-09, "loss": 1.0279, "step": 52063 }, { "epoch": 0.98, "learning_rate": 4.11426999941289e-09, "loss": 0.9015, "step": 52064 }, { "epoch": 0.98, "learning_rate": 4.1055139751802756e-09, "loss": 0.7447, "step": 52065 }, { "epoch": 0.98, "learning_rate": 4.096767270541368e-09, "loss": 0.9385, "step": 52066 }, { "epoch": 0.98, "learning_rate": 4.088029885528366e-09, "loss": 0.7292, "step": 52067 }, { "epoch": 0.98, "learning_rate": 4.079301820174297e-09, "loss": 0.8529, "step": 52068 }, { "epoch": 0.98, "learning_rate": 4.070583074511636e-09, "loss": 1.0132, "step": 52069 }, { "epoch": 0.98, "learning_rate": 4.061873648572579e-09, "loss": 0.8203, "step": 52070 }, { "epoch": 0.98, "learning_rate": 4.053173542390154e-09, "loss": 0.8636, "step": 52071 }, { "epoch": 0.98, "learning_rate": 4.044482755996837e-09, "loss": 0.9643, "step": 52072 }, { "epoch": 0.98, "learning_rate": 4.0358012894245456e-09, "loss": 0.7953, "step": 52073 }, { "epoch": 0.98, "learning_rate": 4.027129142706309e-09, "loss": 0.9479, "step": 52074 }, { "epoch": 0.98, "learning_rate": 4.018466315874048e-09, "loss": 0.9135, "step": 52075 }, { "epoch": 0.98, "learning_rate": 4.009812808960512e-09, "loss": 0.9497, "step": 52076 }, { "epoch": 0.98, "learning_rate": 4.00116862199762e-09, "loss": 0.9797, "step": 52077 }, { "epoch": 0.98, "learning_rate": 3.992533755017846e-09, "loss": 0.7477, "step": 52078 }, { "epoch": 0.98, "learning_rate": 3.983908208053666e-09, "loss": 0.8203, "step": 52079 }, { "epoch": 0.98, "learning_rate": 3.97529198113672e-09, "loss": 1.1371, "step": 52080 }, { "epoch": 0.98, "learning_rate": 3.966685074299759e-09, "loss": 1.0321, "step": 52081 }, { "epoch": 0.98, "learning_rate": 3.958087487574425e-09, "loss": 0.8589, "step": 52082 }, { "epoch": 0.98, "learning_rate": 3.949499220993191e-09, "loss": 0.7639, "step": 52083 }, { "epoch": 0.98, "learning_rate": 3.940920274587978e-09, "loss": 1.006, "step": 52084 }, { "epoch": 0.98, "learning_rate": 3.932350648390981e-09, "loss": 0.8167, "step": 52085 }, { "epoch": 0.98, "learning_rate": 3.923790342433842e-09, "loss": 0.7442, "step": 52086 }, { "epoch": 0.98, "learning_rate": 3.9152393567487565e-09, "loss": 1.108, "step": 52087 }, { "epoch": 0.98, "learning_rate": 3.906697691367644e-09, "loss": 0.9261, "step": 52088 }, { "epoch": 0.98, "learning_rate": 3.898165346322702e-09, "loss": 0.8219, "step": 52089 }, { "epoch": 0.98, "learning_rate": 3.889642321645015e-09, "loss": 0.8018, "step": 52090 }, { "epoch": 0.98, "learning_rate": 3.881128617367058e-09, "loss": 0.8552, "step": 52091 }, { "epoch": 0.98, "learning_rate": 3.872624233520472e-09, "loss": 0.7992, "step": 52092 }, { "epoch": 0.98, "learning_rate": 3.864129170136899e-09, "loss": 0.8598, "step": 52093 }, { "epoch": 0.98, "learning_rate": 3.855643427248257e-09, "loss": 1.063, "step": 52094 }, { "epoch": 0.98, "learning_rate": 3.847167004886187e-09, "loss": 0.915, "step": 52095 }, { "epoch": 0.98, "learning_rate": 3.838699903082055e-09, "loss": 0.6736, "step": 52096 }, { "epoch": 0.98, "learning_rate": 3.830242121867777e-09, "loss": 0.8518, "step": 52097 }, { "epoch": 0.98, "learning_rate": 3.82179366127472e-09, "loss": 1.0375, "step": 52098 }, { "epoch": 0.98, "learning_rate": 3.8133545213348e-09, "loss": 1.0667, "step": 52099 }, { "epoch": 0.98, "learning_rate": 3.804924702079104e-09, "loss": 1.1431, "step": 52100 }, { "epoch": 0.98, "learning_rate": 3.796504203539275e-09, "loss": 1.0253, "step": 52101 }, { "epoch": 0.98, "learning_rate": 3.788093025746675e-09, "loss": 0.8047, "step": 52102 }, { "epoch": 0.98, "learning_rate": 3.7796911687329465e-09, "loss": 0.6958, "step": 52103 }, { "epoch": 0.98, "learning_rate": 3.771298632529452e-09, "loss": 0.723, "step": 52104 }, { "epoch": 0.98, "learning_rate": 3.762915417167279e-09, "loss": 0.9976, "step": 52105 }, { "epoch": 0.98, "learning_rate": 3.754541522677791e-09, "loss": 1.1013, "step": 52106 }, { "epoch": 0.98, "learning_rate": 3.746176949092073e-09, "loss": 0.9091, "step": 52107 }, { "epoch": 0.98, "learning_rate": 3.737821696442046e-09, "loss": 0.9424, "step": 52108 }, { "epoch": 0.98, "learning_rate": 3.729475764758239e-09, "loss": 1.1948, "step": 52109 }, { "epoch": 0.98, "learning_rate": 3.721139154072018e-09, "loss": 0.9023, "step": 52110 }, { "epoch": 0.98, "learning_rate": 3.7128118644144674e-09, "loss": 0.8847, "step": 52111 }, { "epoch": 0.98, "learning_rate": 3.704493895816674e-09, "loss": 1.0237, "step": 52112 }, { "epoch": 0.98, "learning_rate": 3.6961852483100026e-09, "loss": 0.9946, "step": 52113 }, { "epoch": 0.98, "learning_rate": 3.6878859219252606e-09, "loss": 0.6188, "step": 52114 }, { "epoch": 0.98, "learning_rate": 3.679595916693257e-09, "loss": 0.7672, "step": 52115 }, { "epoch": 0.98, "learning_rate": 3.6713152326450785e-09, "loss": 0.7258, "step": 52116 }, { "epoch": 0.98, "learning_rate": 3.663043869811811e-09, "loss": 0.886, "step": 52117 }, { "epoch": 0.98, "learning_rate": 3.6547818282239855e-09, "loss": 0.9812, "step": 52118 }, { "epoch": 0.98, "learning_rate": 3.646529107912966e-09, "loss": 0.9263, "step": 52119 }, { "epoch": 0.98, "learning_rate": 3.6382857089090062e-09, "loss": 0.817, "step": 52120 }, { "epoch": 0.98, "learning_rate": 3.630051631243192e-09, "loss": 0.8842, "step": 52121 }, { "epoch": 0.98, "learning_rate": 3.6218268749463324e-09, "loss": 0.7779, "step": 52122 }, { "epoch": 0.98, "learning_rate": 3.6136114400489584e-09, "loss": 0.9388, "step": 52123 }, { "epoch": 0.98, "learning_rate": 3.6054053265818787e-09, "loss": 1.1343, "step": 52124 }, { "epoch": 0.98, "learning_rate": 3.5972085345756245e-09, "loss": 1.1063, "step": 52125 }, { "epoch": 0.98, "learning_rate": 3.589021064060727e-09, "loss": 0.8837, "step": 52126 }, { "epoch": 0.98, "learning_rate": 3.5808429150679947e-09, "loss": 0.9816, "step": 52127 }, { "epoch": 0.98, "learning_rate": 3.5726740876279587e-09, "loss": 0.6776, "step": 52128 }, { "epoch": 0.98, "learning_rate": 3.5645145817708728e-09, "loss": 0.9525, "step": 52129 }, { "epoch": 0.98, "learning_rate": 3.5563643975272677e-09, "loss": 0.9975, "step": 52130 }, { "epoch": 0.98, "learning_rate": 3.5482235349279527e-09, "loss": 1.0948, "step": 52131 }, { "epoch": 0.98, "learning_rate": 3.540091994002903e-09, "loss": 0.9885, "step": 52132 }, { "epoch": 0.98, "learning_rate": 3.5319697747823734e-09, "loss": 0.7557, "step": 52133 }, { "epoch": 0.98, "learning_rate": 3.5238568772971717e-09, "loss": 0.9635, "step": 52134 }, { "epoch": 0.98, "learning_rate": 3.515753301577274e-09, "loss": 0.9324, "step": 52135 }, { "epoch": 0.98, "learning_rate": 3.5076590476532112e-09, "loss": 0.9728, "step": 52136 }, { "epoch": 0.98, "learning_rate": 3.4995741155546825e-09, "loss": 0.9513, "step": 52137 }, { "epoch": 0.98, "learning_rate": 3.491498505312496e-09, "loss": 1.0776, "step": 52138 }, { "epoch": 0.98, "learning_rate": 3.483432216956073e-09, "loss": 0.9816, "step": 52139 }, { "epoch": 0.98, "learning_rate": 3.4753752505164996e-09, "loss": 0.6983, "step": 52140 }, { "epoch": 0.98, "learning_rate": 3.4673276060229187e-09, "loss": 0.7648, "step": 52141 }, { "epoch": 0.98, "learning_rate": 3.4592892835058624e-09, "loss": 0.8502, "step": 52142 }, { "epoch": 0.98, "learning_rate": 3.4512602829955832e-09, "loss": 0.8146, "step": 52143 }, { "epoch": 0.98, "learning_rate": 3.443240604521503e-09, "loss": 0.9261, "step": 52144 }, { "epoch": 0.98, "learning_rate": 3.4352302481138744e-09, "loss": 0.9412, "step": 52145 }, { "epoch": 0.98, "learning_rate": 3.4272292138023966e-09, "loss": 0.7922, "step": 52146 }, { "epoch": 0.98, "learning_rate": 3.419237501617323e-09, "loss": 0.9395, "step": 52147 }, { "epoch": 0.98, "learning_rate": 3.4112551115880743e-09, "loss": 0.8846, "step": 52148 }, { "epoch": 0.98, "learning_rate": 3.4032820437446266e-09, "loss": 0.9342, "step": 52149 }, { "epoch": 0.98, "learning_rate": 3.3953182981169565e-09, "loss": 1.2786, "step": 52150 }, { "epoch": 0.98, "learning_rate": 3.387363874734484e-09, "loss": 0.7271, "step": 52151 }, { "epoch": 0.98, "learning_rate": 3.3794187736271853e-09, "loss": 0.7491, "step": 52152 }, { "epoch": 0.98, "learning_rate": 3.371482994824482e-09, "loss": 1.0148, "step": 52153 }, { "epoch": 0.98, "learning_rate": 3.3635565383563497e-09, "loss": 0.8909, "step": 52154 }, { "epoch": 0.98, "learning_rate": 3.3556394042519313e-09, "loss": 0.8947, "step": 52155 }, { "epoch": 0.98, "learning_rate": 3.3477315925409258e-09, "loss": 1.066, "step": 52156 }, { "epoch": 0.98, "learning_rate": 3.339833103253032e-09, "loss": 0.8476, "step": 52157 }, { "epoch": 0.98, "learning_rate": 3.33194393641767e-09, "loss": 0.8132, "step": 52158 }, { "epoch": 0.98, "learning_rate": 3.3240640920642607e-09, "loss": 0.7939, "step": 52159 }, { "epoch": 0.98, "learning_rate": 3.3161935702222257e-09, "loss": 0.9106, "step": 52160 }, { "epoch": 0.98, "learning_rate": 3.3083323709209857e-09, "loss": 0.748, "step": 52161 }, { "epoch": 0.98, "learning_rate": 3.3004804941899615e-09, "loss": 0.9883, "step": 52162 }, { "epoch": 0.98, "learning_rate": 3.2926379400582962e-09, "loss": 1.0521, "step": 52163 }, { "epoch": 0.98, "learning_rate": 3.2848047085554115e-09, "loss": 0.8542, "step": 52164 }, { "epoch": 0.98, "learning_rate": 3.2769807997107273e-09, "loss": 0.9069, "step": 52165 }, { "epoch": 0.98, "learning_rate": 3.269166213552832e-09, "loss": 1.037, "step": 52166 }, { "epoch": 0.98, "learning_rate": 3.2613609501117028e-09, "loss": 0.8928, "step": 52167 }, { "epoch": 0.98, "learning_rate": 3.2535650094159264e-09, "loss": 1.0084, "step": 52168 }, { "epoch": 0.98, "learning_rate": 3.245778391494647e-09, "loss": 0.7784, "step": 52169 }, { "epoch": 0.98, "learning_rate": 3.2380010963772857e-09, "loss": 1.0688, "step": 52170 }, { "epoch": 0.98, "learning_rate": 3.23023312409243e-09, "loss": 0.8994, "step": 52171 }, { "epoch": 0.98, "learning_rate": 3.2224744746695013e-09, "loss": 0.8826, "step": 52172 }, { "epoch": 0.98, "learning_rate": 3.2147251481373653e-09, "loss": 0.7662, "step": 52173 }, { "epoch": 0.98, "learning_rate": 3.206985144524888e-09, "loss": 0.7617, "step": 52174 }, { "epoch": 0.98, "learning_rate": 3.1992544638609347e-09, "loss": 1.1176, "step": 52175 }, { "epoch": 0.98, "learning_rate": 3.1915331061743716e-09, "loss": 0.8618, "step": 52176 }, { "epoch": 0.98, "learning_rate": 3.1838210714940643e-09, "loss": 0.9755, "step": 52177 }, { "epoch": 0.98, "learning_rate": 3.1761183598488788e-09, "loss": 0.9099, "step": 52178 }, { "epoch": 0.98, "learning_rate": 3.168424971267403e-09, "loss": 0.8211, "step": 52179 }, { "epoch": 0.98, "learning_rate": 3.1607409057785033e-09, "loss": 0.7591, "step": 52180 }, { "epoch": 0.98, "learning_rate": 3.1530661634110447e-09, "loss": 1.0424, "step": 52181 }, { "epoch": 0.98, "learning_rate": 3.1454007441933387e-09, "loss": 0.9232, "step": 52182 }, { "epoch": 0.98, "learning_rate": 3.137744648153973e-09, "loss": 0.855, "step": 52183 }, { "epoch": 0.98, "learning_rate": 3.1300978753218137e-09, "loss": 0.7827, "step": 52184 }, { "epoch": 0.98, "learning_rate": 3.1224604257254487e-09, "loss": 0.6691, "step": 52185 }, { "epoch": 0.98, "learning_rate": 3.114832299393189e-09, "loss": 0.8283, "step": 52186 }, { "epoch": 0.98, "learning_rate": 3.1072134963536228e-09, "loss": 0.9922, "step": 52187 }, { "epoch": 0.98, "learning_rate": 3.0996040166350603e-09, "loss": 1.0652, "step": 52188 }, { "epoch": 0.98, "learning_rate": 3.0920038602660907e-09, "loss": 0.842, "step": 52189 }, { "epoch": 0.98, "learning_rate": 3.084413027275024e-09, "loss": 0.8069, "step": 52190 }, { "epoch": 0.98, "learning_rate": 3.0768315176901707e-09, "loss": 0.7982, "step": 52191 }, { "epoch": 0.98, "learning_rate": 3.0692593315401196e-09, "loss": 0.7753, "step": 52192 }, { "epoch": 0.98, "learning_rate": 3.061696468852626e-09, "loss": 0.8142, "step": 52193 }, { "epoch": 0.98, "learning_rate": 3.0541429296562787e-09, "loss": 0.8762, "step": 52194 }, { "epoch": 0.98, "learning_rate": 3.0465987139791098e-09, "loss": 0.7969, "step": 52195 }, { "epoch": 0.98, "learning_rate": 3.0390638218494308e-09, "loss": 0.8518, "step": 52196 }, { "epoch": 0.98, "learning_rate": 3.031538253295274e-09, "loss": 0.9325, "step": 52197 }, { "epoch": 0.98, "learning_rate": 3.024022008344951e-09, "loss": 0.914, "step": 52198 }, { "epoch": 0.98, "learning_rate": 3.016515087026217e-09, "loss": 1.0203, "step": 52199 }, { "epoch": 0.98, "learning_rate": 3.009017489367383e-09, "loss": 1.1122, "step": 52200 }, { "epoch": 0.98, "learning_rate": 3.0015292153962038e-09, "loss": 1.0438, "step": 52201 }, { "epoch": 0.98, "learning_rate": 2.994050265140713e-09, "loss": 0.9468, "step": 52202 }, { "epoch": 0.98, "learning_rate": 2.986580638628944e-09, "loss": 0.7172, "step": 52203 }, { "epoch": 0.98, "learning_rate": 2.97912033588893e-09, "loss": 0.8025, "step": 52204 }, { "epoch": 0.98, "learning_rate": 2.971669356948148e-09, "loss": 0.7699, "step": 52205 }, { "epoch": 0.98, "learning_rate": 2.9642277018346323e-09, "loss": 1.112, "step": 52206 }, { "epoch": 0.98, "learning_rate": 2.95679537057586e-09, "loss": 0.9045, "step": 52207 }, { "epoch": 0.99, "learning_rate": 2.9493723632001425e-09, "loss": 0.8704, "step": 52208 }, { "epoch": 0.99, "learning_rate": 2.9419586797349576e-09, "loss": 0.7866, "step": 52209 }, { "epoch": 0.99, "learning_rate": 2.934554320207783e-09, "loss": 0.7443, "step": 52210 }, { "epoch": 0.99, "learning_rate": 2.9271592846463746e-09, "loss": 0.8756, "step": 52211 }, { "epoch": 0.99, "learning_rate": 2.919773573078488e-09, "loss": 0.8962, "step": 52212 }, { "epoch": 0.99, "learning_rate": 2.9123971855316014e-09, "loss": 0.9731, "step": 52213 }, { "epoch": 0.99, "learning_rate": 2.905030122033192e-09, "loss": 0.9306, "step": 52214 }, { "epoch": 0.99, "learning_rate": 2.8976723826110165e-09, "loss": 0.9612, "step": 52215 }, { "epoch": 0.99, "learning_rate": 2.8903239672922744e-09, "loss": 0.7694, "step": 52216 }, { "epoch": 0.99, "learning_rate": 2.8829848761044443e-09, "loss": 0.6555, "step": 52217 }, { "epoch": 0.99, "learning_rate": 2.875655109075004e-09, "loss": 1.0132, "step": 52218 }, { "epoch": 0.99, "learning_rate": 2.8683346662314314e-09, "loss": 1.0663, "step": 52219 }, { "epoch": 0.99, "learning_rate": 2.8610235476006497e-09, "loss": 0.9076, "step": 52220 }, { "epoch": 0.99, "learning_rate": 2.8537217532104146e-09, "loss": 0.9801, "step": 52221 }, { "epoch": 0.99, "learning_rate": 2.8464292830879258e-09, "loss": 0.8135, "step": 52222 }, { "epoch": 0.99, "learning_rate": 2.839146137260107e-09, "loss": 0.8613, "step": 52223 }, { "epoch": 0.99, "learning_rate": 2.831872315754436e-09, "loss": 0.843, "step": 52224 }, { "epoch": 0.99, "learning_rate": 2.824607818598113e-09, "loss": 1.0807, "step": 52225 }, { "epoch": 0.99, "learning_rate": 2.817352645818061e-09, "loss": 0.8373, "step": 52226 }, { "epoch": 0.99, "learning_rate": 2.810106797441481e-09, "loss": 0.8653, "step": 52227 }, { "epoch": 0.99, "learning_rate": 2.802870273495295e-09, "loss": 0.9758, "step": 52228 }, { "epoch": 0.99, "learning_rate": 2.7956430740067044e-09, "loss": 0.7922, "step": 52229 }, { "epoch": 0.99, "learning_rate": 2.7884251990023538e-09, "loss": 1.0223, "step": 52230 }, { "epoch": 0.99, "learning_rate": 2.7812166485097214e-09, "loss": 1.0035, "step": 52231 }, { "epoch": 0.99, "learning_rate": 2.774017422555453e-09, "loss": 1.012, "step": 52232 }, { "epoch": 0.99, "learning_rate": 2.766827521166471e-09, "loss": 0.8757, "step": 52233 }, { "epoch": 0.99, "learning_rate": 2.759646944369421e-09, "loss": 0.9335, "step": 52234 }, { "epoch": 0.99, "learning_rate": 2.752475692191503e-09, "loss": 0.8548, "step": 52235 }, { "epoch": 0.99, "learning_rate": 2.7453137646590854e-09, "loss": 0.9055, "step": 52236 }, { "epoch": 0.99, "learning_rate": 2.738161161799091e-09, "loss": 0.7831, "step": 52237 }, { "epoch": 0.99, "learning_rate": 2.731017883638165e-09, "loss": 0.8382, "step": 52238 }, { "epoch": 0.99, "learning_rate": 2.7238839302032307e-09, "loss": 0.7581, "step": 52239 }, { "epoch": 0.99, "learning_rate": 2.716759301520655e-09, "loss": 0.8978, "step": 52240 }, { "epoch": 0.99, "learning_rate": 2.7096439976173615e-09, "loss": 0.6674, "step": 52241 }, { "epoch": 0.99, "learning_rate": 2.7025380185194405e-09, "loss": 0.8555, "step": 52242 }, { "epoch": 0.99, "learning_rate": 2.6954413642538146e-09, "loss": 1.0328, "step": 52243 }, { "epoch": 0.99, "learning_rate": 2.688354034846574e-09, "loss": 0.8798, "step": 52244 }, { "epoch": 0.99, "learning_rate": 2.6812760303246423e-09, "loss": 0.8807, "step": 52245 }, { "epoch": 0.99, "learning_rate": 2.6742073507143863e-09, "loss": 0.8877, "step": 52246 }, { "epoch": 0.99, "learning_rate": 2.6671479960418965e-09, "loss": 1.0034, "step": 52247 }, { "epoch": 0.99, "learning_rate": 2.660097966333819e-09, "loss": 0.8585, "step": 52248 }, { "epoch": 0.99, "learning_rate": 2.6530572616162432e-09, "loss": 1.0458, "step": 52249 }, { "epoch": 0.99, "learning_rate": 2.6460258819158145e-09, "loss": 0.9338, "step": 52250 }, { "epoch": 0.99, "learning_rate": 2.6390038272583462e-09, "loss": 0.9537, "step": 52251 }, { "epoch": 0.99, "learning_rate": 2.6319910976702058e-09, "loss": 0.8547, "step": 52252 }, { "epoch": 0.99, "learning_rate": 2.6249876931777606e-09, "loss": 0.9488, "step": 52253 }, { "epoch": 0.99, "learning_rate": 2.617993613806824e-09, "loss": 0.8562, "step": 52254 }, { "epoch": 0.99, "learning_rate": 2.611008859584041e-09, "loss": 0.8433, "step": 52255 }, { "epoch": 0.99, "learning_rate": 2.6040334305349467e-09, "loss": 1.026, "step": 52256 }, { "epoch": 0.99, "learning_rate": 2.5970673266861866e-09, "loss": 1.1245, "step": 52257 }, { "epoch": 0.99, "learning_rate": 2.5901105480630185e-09, "loss": 0.8085, "step": 52258 }, { "epoch": 0.99, "learning_rate": 2.5831630946918097e-09, "loss": 0.9522, "step": 52259 }, { "epoch": 0.99, "learning_rate": 2.5762249665986503e-09, "loss": 0.9042, "step": 52260 }, { "epoch": 0.99, "learning_rate": 2.5692961638093537e-09, "loss": 0.7917, "step": 52261 }, { "epoch": 0.99, "learning_rate": 2.5623766863497325e-09, "loss": 0.9976, "step": 52262 }, { "epoch": 0.99, "learning_rate": 2.555466534245321e-09, "loss": 0.8793, "step": 52263 }, { "epoch": 0.99, "learning_rate": 2.548565707522488e-09, "loss": 1.0265, "step": 52264 }, { "epoch": 0.99, "learning_rate": 2.541674206206768e-09, "loss": 0.7792, "step": 52265 }, { "epoch": 0.99, "learning_rate": 2.5347920303236963e-09, "loss": 0.9049, "step": 52266 }, { "epoch": 0.99, "learning_rate": 2.5279191798990854e-09, "loss": 0.8218, "step": 52267 }, { "epoch": 0.99, "learning_rate": 2.5210556549590258e-09, "loss": 1.0057, "step": 52268 }, { "epoch": 0.99, "learning_rate": 2.5142014555284975e-09, "loss": 0.8822, "step": 52269 }, { "epoch": 0.99, "learning_rate": 2.5073565816333136e-09, "loss": 0.813, "step": 52270 }, { "epoch": 0.99, "learning_rate": 2.5005210332992858e-09, "loss": 0.6908, "step": 52271 }, { "epoch": 0.99, "learning_rate": 2.493694810551395e-09, "loss": 0.8745, "step": 52272 }, { "epoch": 0.99, "learning_rate": 2.4868779134157307e-09, "loss": 0.6345, "step": 52273 }, { "epoch": 0.99, "learning_rate": 2.480070341917551e-09, "loss": 0.7995, "step": 52274 }, { "epoch": 0.99, "learning_rate": 2.473272096082113e-09, "loss": 1.1332, "step": 52275 }, { "epoch": 0.99, "learning_rate": 2.466483175934953e-09, "loss": 0.9978, "step": 52276 }, { "epoch": 0.99, "learning_rate": 2.459703581501327e-09, "loss": 1.0518, "step": 52277 }, { "epoch": 0.99, "learning_rate": 2.4529333128064937e-09, "loss": 0.7564, "step": 52278 }, { "epoch": 0.99, "learning_rate": 2.4461723698759875e-09, "loss": 0.8525, "step": 52279 }, { "epoch": 0.99, "learning_rate": 2.439420752734789e-09, "loss": 0.9778, "step": 52280 }, { "epoch": 0.99, "learning_rate": 2.432678461408433e-09, "loss": 1.0682, "step": 52281 }, { "epoch": 0.99, "learning_rate": 2.425945495921622e-09, "loss": 0.7991, "step": 52282 }, { "epoch": 0.99, "learning_rate": 2.4192218562998915e-09, "loss": 1.0278, "step": 52283 }, { "epoch": 0.99, "learning_rate": 2.4125075425679435e-09, "loss": 0.8043, "step": 52284 }, { "epoch": 0.99, "learning_rate": 2.405802554751313e-09, "loss": 0.8149, "step": 52285 }, { "epoch": 0.99, "learning_rate": 2.3991068928749804e-09, "loss": 1.0046, "step": 52286 }, { "epoch": 0.99, "learning_rate": 2.392420556963648e-09, "loss": 1.2001, "step": 52287 }, { "epoch": 0.99, "learning_rate": 2.3857435470425737e-09, "loss": 0.9338, "step": 52288 }, { "epoch": 0.99, "learning_rate": 2.3790758631361823e-09, "loss": 0.7599, "step": 52289 }, { "epoch": 0.99, "learning_rate": 2.3724175052702857e-09, "loss": 0.8516, "step": 52290 }, { "epoch": 0.99, "learning_rate": 2.365768473468755e-09, "loss": 0.7917, "step": 52291 }, { "epoch": 0.99, "learning_rate": 2.3591287677571238e-09, "loss": 0.7565, "step": 52292 }, { "epoch": 0.99, "learning_rate": 2.3524983881598184e-09, "loss": 0.7943, "step": 52293 }, { "epoch": 0.99, "learning_rate": 2.3458773347018183e-09, "loss": 0.9586, "step": 52294 }, { "epoch": 0.99, "learning_rate": 2.339265607407548e-09, "loss": 1.0738, "step": 52295 }, { "epoch": 0.99, "learning_rate": 2.3326632063019883e-09, "loss": 1.0467, "step": 52296 }, { "epoch": 0.99, "learning_rate": 2.3260701314095633e-09, "loss": 0.7392, "step": 52297 }, { "epoch": 0.99, "learning_rate": 2.3194863827552537e-09, "loss": 0.8189, "step": 52298 }, { "epoch": 0.99, "learning_rate": 2.312911960363207e-09, "loss": 0.9673, "step": 52299 }, { "epoch": 0.99, "learning_rate": 2.3063468642581245e-09, "loss": 0.872, "step": 52300 }, { "epoch": 0.99, "learning_rate": 2.2997910944647095e-09, "loss": 0.8695, "step": 52301 }, { "epoch": 0.99, "learning_rate": 2.293244651007387e-09, "loss": 0.7874, "step": 52302 }, { "epoch": 0.99, "learning_rate": 2.286707533910304e-09, "loss": 0.9275, "step": 52303 }, { "epoch": 0.99, "learning_rate": 2.280179743198163e-09, "loss": 0.8612, "step": 52304 }, { "epoch": 0.99, "learning_rate": 2.273661278895112e-09, "loss": 0.928, "step": 52305 }, { "epoch": 0.99, "learning_rate": 2.2671521410258524e-09, "loss": 0.882, "step": 52306 }, { "epoch": 0.99, "learning_rate": 2.2606523296142545e-09, "loss": 0.8896, "step": 52307 }, { "epoch": 0.99, "learning_rate": 2.2541618446847435e-09, "loss": 0.8608, "step": 52308 }, { "epoch": 0.99, "learning_rate": 2.2476806862620215e-09, "loss": 0.8361, "step": 52309 }, { "epoch": 0.99, "learning_rate": 2.2412088543694033e-09, "loss": 0.8496, "step": 52310 }, { "epoch": 0.99, "learning_rate": 2.2347463490318687e-09, "loss": 0.954, "step": 52311 }, { "epoch": 0.99, "learning_rate": 2.2282931702730104e-09, "loss": 1.0916, "step": 52312 }, { "epoch": 0.99, "learning_rate": 2.221849318117253e-09, "loss": 1.1592, "step": 52313 }, { "epoch": 0.99, "learning_rate": 2.215414792588466e-09, "loss": 0.9566, "step": 52314 }, { "epoch": 0.99, "learning_rate": 2.2089895937107974e-09, "loss": 0.8368, "step": 52315 }, { "epoch": 0.99, "learning_rate": 2.2025737215081167e-09, "loss": 0.7805, "step": 52316 }, { "epoch": 0.99, "learning_rate": 2.1961671760042934e-09, "loss": 0.8005, "step": 52317 }, { "epoch": 0.99, "learning_rate": 2.1897699572234754e-09, "loss": 1.0287, "step": 52318 }, { "epoch": 0.99, "learning_rate": 2.1833820651895323e-09, "loss": 1.0845, "step": 52319 }, { "epoch": 0.99, "learning_rate": 2.1770034999263335e-09, "loss": 0.6956, "step": 52320 }, { "epoch": 0.99, "learning_rate": 2.1706342614574715e-09, "loss": 0.8682, "step": 52321 }, { "epoch": 0.99, "learning_rate": 2.1642743498070938e-09, "loss": 0.6768, "step": 52322 }, { "epoch": 0.99, "learning_rate": 2.1579237649985153e-09, "loss": 0.8435, "step": 52323 }, { "epoch": 0.99, "learning_rate": 2.1515825070558826e-09, "loss": 0.9641, "step": 52324 }, { "epoch": 0.99, "learning_rate": 2.145250576002511e-09, "loss": 1.1198, "step": 52325 }, { "epoch": 0.99, "learning_rate": 2.1389279718619927e-09, "loss": 1.0302, "step": 52326 }, { "epoch": 0.99, "learning_rate": 2.1326146946584746e-09, "loss": 0.8426, "step": 52327 }, { "epoch": 0.99, "learning_rate": 2.1263107444149945e-09, "loss": 0.9114, "step": 52328 }, { "epoch": 0.99, "learning_rate": 2.1200161211554216e-09, "loss": 0.7076, "step": 52329 }, { "epoch": 0.99, "learning_rate": 2.113730824902793e-09, "loss": 0.8718, "step": 52330 }, { "epoch": 0.99, "learning_rate": 2.107454855681257e-09, "loss": 1.0937, "step": 52331 }, { "epoch": 0.99, "learning_rate": 2.1011882135138495e-09, "loss": 0.8169, "step": 52332 }, { "epoch": 0.99, "learning_rate": 2.0949308984238857e-09, "loss": 0.8586, "step": 52333 }, { "epoch": 0.99, "learning_rate": 2.0886829104349582e-09, "loss": 1.0858, "step": 52334 }, { "epoch": 0.99, "learning_rate": 2.0824442495703812e-09, "loss": 0.7396, "step": 52335 }, { "epoch": 0.99, "learning_rate": 2.076214915853192e-09, "loss": 0.8402, "step": 52336 }, { "epoch": 0.99, "learning_rate": 2.069994909306705e-09, "loss": 1.0934, "step": 52337 }, { "epoch": 0.99, "learning_rate": 2.063784229954513e-09, "loss": 0.7578, "step": 52338 }, { "epoch": 0.99, "learning_rate": 2.0575828778196527e-09, "loss": 0.7242, "step": 52339 }, { "epoch": 0.99, "learning_rate": 2.051390852924884e-09, "loss": 0.7184, "step": 52340 }, { "epoch": 0.99, "learning_rate": 2.0452081552937984e-09, "loss": 0.6704, "step": 52341 }, { "epoch": 0.99, "learning_rate": 2.039034784949434e-09, "loss": 0.7787, "step": 52342 }, { "epoch": 0.99, "learning_rate": 2.03287074191455e-09, "loss": 1.0271, "step": 52343 }, { "epoch": 0.99, "learning_rate": 2.026716026212461e-09, "loss": 1.1085, "step": 52344 }, { "epoch": 0.99, "learning_rate": 2.0205706378659263e-09, "loss": 1.0289, "step": 52345 }, { "epoch": 0.99, "learning_rate": 2.0144345768979835e-09, "loss": 1.0357, "step": 52346 }, { "epoch": 0.99, "learning_rate": 2.0083078433316692e-09, "loss": 0.8222, "step": 52347 }, { "epoch": 0.99, "learning_rate": 2.002190437189466e-09, "loss": 0.997, "step": 52348 }, { "epoch": 0.99, "learning_rate": 1.9960823584946886e-09, "loss": 0.9046, "step": 52349 }, { "epoch": 0.99, "learning_rate": 1.9899836072700963e-09, "loss": 0.8914, "step": 52350 }, { "epoch": 0.99, "learning_rate": 1.983894183538171e-09, "loss": 0.8697, "step": 52351 }, { "epoch": 0.99, "learning_rate": 1.9778140873216723e-09, "loss": 0.7718, "step": 52352 }, { "epoch": 0.99, "learning_rate": 1.9717433186436376e-09, "loss": 0.7659, "step": 52353 }, { "epoch": 0.99, "learning_rate": 1.9656818775262708e-09, "loss": 0.6576, "step": 52354 }, { "epoch": 0.99, "learning_rate": 1.959629763992887e-09, "loss": 0.8761, "step": 52355 }, { "epoch": 0.99, "learning_rate": 1.9535869780651363e-09, "loss": 0.8822, "step": 52356 }, { "epoch": 0.99, "learning_rate": 1.947553519766332e-09, "loss": 0.6007, "step": 52357 }, { "epoch": 0.99, "learning_rate": 1.9415293891189567e-09, "loss": 0.9351, "step": 52358 }, { "epoch": 0.99, "learning_rate": 1.935514586145215e-09, "loss": 0.9883, "step": 52359 }, { "epoch": 0.99, "learning_rate": 1.929509110867589e-09, "loss": 0.7463, "step": 52360 }, { "epoch": 0.99, "learning_rate": 1.9235129633085604e-09, "loss": 0.7943, "step": 52361 }, { "epoch": 0.99, "learning_rate": 1.917526143490611e-09, "loss": 1.1343, "step": 52362 }, { "epoch": 0.99, "learning_rate": 1.911548651435946e-09, "loss": 0.974, "step": 52363 }, { "epoch": 0.99, "learning_rate": 1.9055804871667694e-09, "loss": 0.8039, "step": 52364 }, { "epoch": 0.99, "learning_rate": 1.899621650705841e-09, "loss": 0.7717, "step": 52365 }, { "epoch": 0.99, "learning_rate": 1.893672142075087e-09, "loss": 0.7439, "step": 52366 }, { "epoch": 0.99, "learning_rate": 1.8877319612969904e-09, "loss": 0.9449, "step": 52367 }, { "epoch": 0.99, "learning_rate": 1.8818011083931996e-09, "loss": 0.9351, "step": 52368 }, { "epoch": 0.99, "learning_rate": 1.8758795833861976e-09, "loss": 0.907, "step": 52369 }, { "epoch": 0.99, "learning_rate": 1.869967386298188e-09, "loss": 0.838, "step": 52370 }, { "epoch": 0.99, "learning_rate": 1.8640645171510983e-09, "loss": 1.0394, "step": 52371 }, { "epoch": 0.99, "learning_rate": 1.8581709759668553e-09, "loss": 1.0789, "step": 52372 }, { "epoch": 0.99, "learning_rate": 1.8522867627676633e-09, "loss": 0.906, "step": 52373 }, { "epoch": 0.99, "learning_rate": 1.8464118775757267e-09, "loss": 1.0204, "step": 52374 }, { "epoch": 0.99, "learning_rate": 1.8405463204124175e-09, "loss": 1.1745, "step": 52375 }, { "epoch": 0.99, "learning_rate": 1.83469009129994e-09, "loss": 0.9034, "step": 52376 }, { "epoch": 0.99, "learning_rate": 1.828843190260221e-09, "loss": 0.8183, "step": 52377 }, { "epoch": 0.99, "learning_rate": 1.8230056173149101e-09, "loss": 0.8004, "step": 52378 }, { "epoch": 0.99, "learning_rate": 1.8171773724859344e-09, "loss": 0.8475, "step": 52379 }, { "epoch": 0.99, "learning_rate": 1.8113584557949426e-09, "loss": 1.062, "step": 52380 }, { "epoch": 0.99, "learning_rate": 1.805548867263862e-09, "loss": 1.0443, "step": 52381 }, { "epoch": 0.99, "learning_rate": 1.7997486069140645e-09, "loss": 0.789, "step": 52382 }, { "epoch": 0.99, "learning_rate": 1.7939576747677545e-09, "loss": 0.9093, "step": 52383 }, { "epoch": 0.99, "learning_rate": 1.788176070846026e-09, "loss": 0.9529, "step": 52384 }, { "epoch": 0.99, "learning_rate": 1.7824037951705287e-09, "loss": 0.9164, "step": 52385 }, { "epoch": 0.99, "learning_rate": 1.776640847763189e-09, "loss": 0.9061, "step": 52386 }, { "epoch": 0.99, "learning_rate": 1.7708872286451017e-09, "loss": 0.9861, "step": 52387 }, { "epoch": 0.99, "learning_rate": 1.765142937837916e-09, "loss": 1.0739, "step": 52388 }, { "epoch": 0.99, "learning_rate": 1.7594079753630033e-09, "loss": 0.9466, "step": 52389 }, { "epoch": 0.99, "learning_rate": 1.7536823412420135e-09, "loss": 0.8739, "step": 52390 }, { "epoch": 0.99, "learning_rate": 1.747966035496318e-09, "loss": 0.825, "step": 52391 }, { "epoch": 0.99, "learning_rate": 1.7422590581467336e-09, "loss": 0.7976, "step": 52392 }, { "epoch": 0.99, "learning_rate": 1.7365614092151873e-09, "loss": 1.0423, "step": 52393 }, { "epoch": 0.99, "learning_rate": 1.7308730887227731e-09, "loss": 1.0615, "step": 52394 }, { "epoch": 0.99, "learning_rate": 1.7251940966905856e-09, "loss": 0.7213, "step": 52395 }, { "epoch": 0.99, "learning_rate": 1.7195244331399964e-09, "loss": 0.7996, "step": 52396 }, { "epoch": 0.99, "learning_rate": 1.7138640980920996e-09, "loss": 0.7333, "step": 52397 }, { "epoch": 0.99, "learning_rate": 1.7082130915679895e-09, "loss": 1.0961, "step": 52398 }, { "epoch": 0.99, "learning_rate": 1.7025714135887606e-09, "loss": 0.7885, "step": 52399 }, { "epoch": 0.99, "learning_rate": 1.6969390641757844e-09, "loss": 1.1533, "step": 52400 }, { "epoch": 0.99, "learning_rate": 1.6913160433496001e-09, "loss": 0.857, "step": 52401 }, { "epoch": 0.99, "learning_rate": 1.6857023511315796e-09, "loss": 1.1102, "step": 52402 }, { "epoch": 0.99, "learning_rate": 1.680097987542262e-09, "loss": 1.0707, "step": 52403 }, { "epoch": 0.99, "learning_rate": 1.6745029526030188e-09, "loss": 0.8152, "step": 52404 }, { "epoch": 0.99, "learning_rate": 1.668917246334667e-09, "loss": 0.9816, "step": 52405 }, { "epoch": 0.99, "learning_rate": 1.6633408687580232e-09, "loss": 0.9852, "step": 52406 }, { "epoch": 0.99, "learning_rate": 1.6577738198936267e-09, "loss": 0.8233, "step": 52407 }, { "epoch": 0.99, "learning_rate": 1.6522160997628489e-09, "loss": 0.5705, "step": 52408 }, { "epoch": 0.99, "learning_rate": 1.6466677083856741e-09, "loss": 0.9029, "step": 52409 }, { "epoch": 0.99, "learning_rate": 1.641128645783474e-09, "loss": 0.9659, "step": 52410 }, { "epoch": 0.99, "learning_rate": 1.6355989119767879e-09, "loss": 0.7863, "step": 52411 }, { "epoch": 0.99, "learning_rate": 1.6300785069861546e-09, "loss": 1.2079, "step": 52412 }, { "epoch": 0.99, "learning_rate": 1.6245674308321135e-09, "loss": 0.9596, "step": 52413 }, { "epoch": 0.99, "learning_rate": 1.6190656835352037e-09, "loss": 0.7159, "step": 52414 }, { "epoch": 0.99, "learning_rate": 1.6135732651162416e-09, "loss": 0.8566, "step": 52415 }, { "epoch": 0.99, "learning_rate": 1.6080901755957667e-09, "loss": 0.9494, "step": 52416 }, { "epoch": 0.99, "learning_rate": 1.602616414993763e-09, "loss": 0.8182, "step": 52417 }, { "epoch": 0.99, "learning_rate": 1.5971519833310468e-09, "loss": 1.1118, "step": 52418 }, { "epoch": 0.99, "learning_rate": 1.5916968806281574e-09, "loss": 1.1064, "step": 52419 }, { "epoch": 0.99, "learning_rate": 1.586251106905079e-09, "loss": 0.8326, "step": 52420 }, { "epoch": 0.99, "learning_rate": 1.5808146621823505e-09, "loss": 1.0333, "step": 52421 }, { "epoch": 0.99, "learning_rate": 1.5753875464805112e-09, "loss": 0.8086, "step": 52422 }, { "epoch": 0.99, "learning_rate": 1.5699697598192675e-09, "loss": 0.7578, "step": 52423 }, { "epoch": 0.99, "learning_rate": 1.5645613022194362e-09, "loss": 0.9094, "step": 52424 }, { "epoch": 0.99, "learning_rate": 1.5591621737007235e-09, "loss": 0.9799, "step": 52425 }, { "epoch": 0.99, "learning_rate": 1.553772374283391e-09, "loss": 0.9282, "step": 52426 }, { "epoch": 0.99, "learning_rate": 1.548391903987978e-09, "loss": 1.0241, "step": 52427 }, { "epoch": 0.99, "learning_rate": 1.5430207628339133e-09, "loss": 0.8156, "step": 52428 }, { "epoch": 0.99, "learning_rate": 1.5376589508420137e-09, "loss": 0.6994, "step": 52429 }, { "epoch": 0.99, "learning_rate": 1.5323064680314303e-09, "loss": 0.8038, "step": 52430 }, { "epoch": 0.99, "learning_rate": 1.5269633144229802e-09, "loss": 1.0013, "step": 52431 }, { "epoch": 0.99, "learning_rate": 1.5216294900360918e-09, "loss": 0.9872, "step": 52432 }, { "epoch": 0.99, "learning_rate": 1.5163049948907493e-09, "loss": 0.8195, "step": 52433 }, { "epoch": 0.99, "learning_rate": 1.5109898290072146e-09, "loss": 0.8196, "step": 52434 }, { "epoch": 0.99, "learning_rate": 1.5056839924046386e-09, "loss": 0.8961, "step": 52435 }, { "epoch": 0.99, "learning_rate": 1.5003874851035604e-09, "loss": 0.9929, "step": 52436 }, { "epoch": 0.99, "learning_rate": 1.4951003071234094e-09, "loss": 1.056, "step": 52437 }, { "epoch": 0.99, "learning_rate": 1.489822458483614e-09, "loss": 0.896, "step": 52438 }, { "epoch": 0.99, "learning_rate": 1.484553939204436e-09, "loss": 0.8369, "step": 52439 }, { "epoch": 0.99, "learning_rate": 1.4792947493055821e-09, "loss": 0.8518, "step": 52440 }, { "epoch": 0.99, "learning_rate": 1.4740448888059256e-09, "loss": 0.8624, "step": 52441 }, { "epoch": 0.99, "learning_rate": 1.4688043577260058e-09, "loss": 0.8069, "step": 52442 }, { "epoch": 0.99, "learning_rate": 1.4635731560846967e-09, "loss": 0.999, "step": 52443 }, { "epoch": 0.99, "learning_rate": 1.458351283901982e-09, "loss": 0.8646, "step": 52444 }, { "epoch": 0.99, "learning_rate": 1.4531387411970133e-09, "loss": 0.7583, "step": 52445 }, { "epoch": 0.99, "learning_rate": 1.4479355279894968e-09, "loss": 0.882, "step": 52446 }, { "epoch": 0.99, "learning_rate": 1.4427416442988618e-09, "loss": 1.0658, "step": 52447 }, { "epoch": 0.99, "learning_rate": 1.4375570901442593e-09, "loss": 0.8154, "step": 52448 }, { "epoch": 0.99, "learning_rate": 1.4323818655453959e-09, "loss": 0.8884, "step": 52449 }, { "epoch": 0.99, "learning_rate": 1.4272159705214228e-09, "loss": 1.0195, "step": 52450 }, { "epoch": 0.99, "learning_rate": 1.4220594050914916e-09, "loss": 0.8579, "step": 52451 }, { "epoch": 0.99, "learning_rate": 1.416912169275031e-09, "loss": 0.9312, "step": 52452 }, { "epoch": 0.99, "learning_rate": 1.4117742630911923e-09, "loss": 0.9332, "step": 52453 }, { "epoch": 0.99, "learning_rate": 1.406645686559127e-09, "loss": 0.6819, "step": 52454 }, { "epoch": 0.99, "learning_rate": 1.4015264396979867e-09, "loss": 1.1926, "step": 52455 }, { "epoch": 0.99, "learning_rate": 1.3964165225271998e-09, "loss": 1.0061, "step": 52456 }, { "epoch": 0.99, "learning_rate": 1.3913159350653627e-09, "loss": 0.7026, "step": 52457 }, { "epoch": 0.99, "learning_rate": 1.3862246773316268e-09, "loss": 0.8293, "step": 52458 }, { "epoch": 0.99, "learning_rate": 1.381142749345421e-09, "loss": 0.929, "step": 52459 }, { "epoch": 0.99, "learning_rate": 1.3760701511253416e-09, "loss": 0.8564, "step": 52460 }, { "epoch": 0.99, "learning_rate": 1.3710068826902622e-09, "loss": 0.8275, "step": 52461 }, { "epoch": 0.99, "learning_rate": 1.3659529440593344e-09, "loss": 0.9316, "step": 52462 }, { "epoch": 0.99, "learning_rate": 1.3609083352514318e-09, "loss": 0.9406, "step": 52463 }, { "epoch": 0.99, "learning_rate": 1.3558730562851507e-09, "loss": 0.8145, "step": 52464 }, { "epoch": 0.99, "learning_rate": 1.3508471071793649e-09, "loss": 0.7906, "step": 52465 }, { "epoch": 0.99, "learning_rate": 1.3458304879529482e-09, "loss": 0.9553, "step": 52466 }, { "epoch": 0.99, "learning_rate": 1.3408231986247743e-09, "loss": 0.8128, "step": 52467 }, { "epoch": 0.99, "learning_rate": 1.335825239213162e-09, "loss": 0.9736, "step": 52468 }, { "epoch": 0.99, "learning_rate": 1.3308366097369852e-09, "loss": 1.0379, "step": 52469 }, { "epoch": 0.99, "learning_rate": 1.3258573102148397e-09, "loss": 0.8491, "step": 52470 }, { "epoch": 0.99, "learning_rate": 1.3208873406655997e-09, "loss": 0.8631, "step": 52471 }, { "epoch": 0.99, "learning_rate": 1.3159267011073062e-09, "loss": 0.8086, "step": 52472 }, { "epoch": 0.99, "learning_rate": 1.3109753915585554e-09, "loss": 0.8892, "step": 52473 }, { "epoch": 0.99, "learning_rate": 1.3060334120382212e-09, "loss": 0.972, "step": 52474 }, { "epoch": 0.99, "learning_rate": 1.301100762564622e-09, "loss": 1.2839, "step": 52475 }, { "epoch": 0.99, "learning_rate": 1.296177443156077e-09, "loss": 1.1425, "step": 52476 }, { "epoch": 0.99, "learning_rate": 1.2912634538309044e-09, "loss": 1.0864, "step": 52477 }, { "epoch": 0.99, "learning_rate": 1.2863587946077005e-09, "loss": 0.9109, "step": 52478 }, { "epoch": 0.99, "learning_rate": 1.2814634655045066e-09, "loss": 0.8757, "step": 52479 }, { "epoch": 0.99, "learning_rate": 1.2765774665396413e-09, "loss": 0.9504, "step": 52480 }, { "epoch": 0.99, "learning_rate": 1.2717007977314234e-09, "loss": 0.9706, "step": 52481 }, { "epoch": 0.99, "learning_rate": 1.2668334590981713e-09, "loss": 1.0017, "step": 52482 }, { "epoch": 0.99, "learning_rate": 1.2619754506579262e-09, "loss": 0.8448, "step": 52483 }, { "epoch": 0.99, "learning_rate": 1.2571267724287295e-09, "loss": 0.9176, "step": 52484 }, { "epoch": 0.99, "learning_rate": 1.2522874244288996e-09, "loss": 0.7466, "step": 52485 }, { "epoch": 0.99, "learning_rate": 1.2474574066764778e-09, "loss": 1.0977, "step": 52486 }, { "epoch": 0.99, "learning_rate": 1.242636719189505e-09, "loss": 0.886, "step": 52487 }, { "epoch": 0.99, "learning_rate": 1.237825361985745e-09, "loss": 1.0524, "step": 52488 }, { "epoch": 0.99, "learning_rate": 1.2330233350832388e-09, "loss": 0.8271, "step": 52489 }, { "epoch": 0.99, "learning_rate": 1.2282306385003052e-09, "loss": 0.7233, "step": 52490 }, { "epoch": 0.99, "learning_rate": 1.2234472722544299e-09, "loss": 0.8364, "step": 52491 }, { "epoch": 0.99, "learning_rate": 1.2186732363633768e-09, "loss": 0.7163, "step": 52492 }, { "epoch": 0.99, "learning_rate": 1.2139085308454645e-09, "loss": 1.2031, "step": 52493 }, { "epoch": 0.99, "learning_rate": 1.209153155718179e-09, "loss": 0.9241, "step": 52494 }, { "epoch": 0.99, "learning_rate": 1.2044071109990062e-09, "loss": 1.0719, "step": 52495 }, { "epoch": 0.99, "learning_rate": 1.199670396706265e-09, "loss": 0.7327, "step": 52496 }, { "epoch": 0.99, "learning_rate": 1.1949430128571637e-09, "loss": 0.81, "step": 52497 }, { "epoch": 0.99, "learning_rate": 1.1902249594697435e-09, "loss": 0.9191, "step": 52498 }, { "epoch": 0.99, "learning_rate": 1.1855162365612128e-09, "loss": 0.8527, "step": 52499 }, { "epoch": 0.99, "learning_rate": 1.180816844149335e-09, "loss": 0.9142, "step": 52500 }, { "epoch": 0.99, "learning_rate": 1.176126782251874e-09, "loss": 0.79, "step": 52501 }, { "epoch": 0.99, "learning_rate": 1.1714460508860381e-09, "loss": 0.8714, "step": 52502 }, { "epoch": 0.99, "learning_rate": 1.1667746500693133e-09, "loss": 0.8218, "step": 52503 }, { "epoch": 0.99, "learning_rate": 1.1621125798194632e-09, "loss": 0.7593, "step": 52504 }, { "epoch": 0.99, "learning_rate": 1.1574598401534188e-09, "loss": 0.8748, "step": 52505 }, { "epoch": 0.99, "learning_rate": 1.1528164310889433e-09, "loss": 0.938, "step": 52506 }, { "epoch": 0.99, "learning_rate": 1.1481823526432457e-09, "loss": 0.8553, "step": 52507 }, { "epoch": 0.99, "learning_rate": 1.143557604833534e-09, "loss": 0.7359, "step": 52508 }, { "epoch": 0.99, "learning_rate": 1.1389421876770167e-09, "loss": 0.8837, "step": 52509 }, { "epoch": 0.99, "learning_rate": 1.1343361011914578e-09, "loss": 0.9592, "step": 52510 }, { "epoch": 0.99, "learning_rate": 1.1297393453932325e-09, "loss": 0.9879, "step": 52511 }, { "epoch": 0.99, "learning_rate": 1.1251519203003824e-09, "loss": 0.9556, "step": 52512 }, { "epoch": 0.99, "learning_rate": 1.120573825929283e-09, "loss": 0.8067, "step": 52513 }, { "epoch": 0.99, "learning_rate": 1.1160050622974206e-09, "loss": 0.9558, "step": 52514 }, { "epoch": 0.99, "learning_rate": 1.1114456294217258e-09, "loss": 0.6356, "step": 52515 }, { "epoch": 0.99, "learning_rate": 1.106895527319407e-09, "loss": 0.747, "step": 52516 }, { "epoch": 0.99, "learning_rate": 1.1023547560073956e-09, "loss": 0.9501, "step": 52517 }, { "epoch": 0.99, "learning_rate": 1.0978233155023443e-09, "loss": 0.8343, "step": 52518 }, { "epoch": 0.99, "learning_rate": 1.0933012058214621e-09, "loss": 0.9644, "step": 52519 }, { "epoch": 0.99, "learning_rate": 1.0887884269816795e-09, "loss": 0.8634, "step": 52520 }, { "epoch": 0.99, "learning_rate": 1.0842849789996501e-09, "loss": 0.9824, "step": 52521 }, { "epoch": 0.99, "learning_rate": 1.0797908618923049e-09, "loss": 0.9494, "step": 52522 }, { "epoch": 0.99, "learning_rate": 1.0753060756765743e-09, "loss": 0.6643, "step": 52523 }, { "epoch": 0.99, "learning_rate": 1.0708306203688346e-09, "loss": 0.9631, "step": 52524 }, { "epoch": 0.99, "learning_rate": 1.0663644959860163e-09, "loss": 0.9521, "step": 52525 }, { "epoch": 0.99, "learning_rate": 1.0619077025447732e-09, "loss": 0.8571, "step": 52526 }, { "epoch": 0.99, "learning_rate": 1.0574602400617584e-09, "loss": 0.7524, "step": 52527 }, { "epoch": 0.99, "learning_rate": 1.0530221085536251e-09, "loss": 0.8588, "step": 52528 }, { "epoch": 0.99, "learning_rate": 1.0485933080367493e-09, "loss": 0.7556, "step": 52529 }, { "epoch": 0.99, "learning_rate": 1.0441738385277844e-09, "loss": 0.7808, "step": 52530 }, { "epoch": 0.99, "learning_rate": 1.0397637000433836e-09, "loss": 1.0439, "step": 52531 }, { "epoch": 0.99, "learning_rate": 1.0353628925999226e-09, "loss": 1.0562, "step": 52532 }, { "epoch": 0.99, "learning_rate": 1.0309714162137773e-09, "loss": 1.0121, "step": 52533 }, { "epoch": 0.99, "learning_rate": 1.0265892709013236e-09, "loss": 0.9705, "step": 52534 }, { "epoch": 0.99, "learning_rate": 1.0222164566789372e-09, "loss": 0.9992, "step": 52535 }, { "epoch": 0.99, "learning_rate": 1.0178529735629938e-09, "loss": 0.8303, "step": 52536 }, { "epoch": 0.99, "learning_rate": 1.0134988215698693e-09, "loss": 1.068, "step": 52537 }, { "epoch": 0.99, "learning_rate": 1.009154000715662e-09, "loss": 0.8953, "step": 52538 }, { "epoch": 0.99, "learning_rate": 1.00481851101647e-09, "loss": 0.8654, "step": 52539 }, { "epoch": 0.99, "learning_rate": 1.0004923524889464e-09, "loss": 0.9717, "step": 52540 }, { "epoch": 0.99, "learning_rate": 9.961755251486348e-10, "loss": 0.7968, "step": 52541 }, { "epoch": 0.99, "learning_rate": 9.918680290121885e-10, "loss": 0.7819, "step": 52542 }, { "epoch": 0.99, "learning_rate": 9.875698640957055e-10, "loss": 0.8217, "step": 52543 }, { "epoch": 0.99, "learning_rate": 9.83281030414729e-10, "loss": 1.0947, "step": 52544 }, { "epoch": 0.99, "learning_rate": 9.790015279856347e-10, "loss": 1.0072, "step": 52545 }, { "epoch": 0.99, "learning_rate": 9.747313568242434e-10, "loss": 0.9415, "step": 52546 }, { "epoch": 0.99, "learning_rate": 9.704705169466533e-10, "loss": 0.9352, "step": 52547 }, { "epoch": 0.99, "learning_rate": 9.662190083686852e-10, "loss": 0.7418, "step": 52548 }, { "epoch": 0.99, "learning_rate": 9.619768311061594e-10, "loss": 0.8666, "step": 52549 }, { "epoch": 0.99, "learning_rate": 9.577439851751746e-10, "loss": 1.0832, "step": 52550 }, { "epoch": 0.99, "learning_rate": 9.535204705912737e-10, "loss": 1.0025, "step": 52551 }, { "epoch": 0.99, "learning_rate": 9.493062873702774e-10, "loss": 0.8082, "step": 52552 }, { "epoch": 0.99, "learning_rate": 9.451014355280064e-10, "loss": 0.931, "step": 52553 }, { "epoch": 0.99, "learning_rate": 9.409059150800038e-10, "loss": 0.851, "step": 52554 }, { "epoch": 0.99, "learning_rate": 9.367197260420902e-10, "loss": 0.6037, "step": 52555 }, { "epoch": 0.99, "learning_rate": 9.325428684298089e-10, "loss": 1.1342, "step": 52556 }, { "epoch": 0.99, "learning_rate": 9.283753422587028e-10, "loss": 0.9943, "step": 52557 }, { "epoch": 0.99, "learning_rate": 9.242171475445927e-10, "loss": 0.8998, "step": 52558 }, { "epoch": 0.99, "learning_rate": 9.200682843027441e-10, "loss": 0.9432, "step": 52559 }, { "epoch": 0.99, "learning_rate": 9.159287525489779e-10, "loss": 0.7729, "step": 52560 }, { "epoch": 0.99, "learning_rate": 9.11798552298282e-10, "loss": 0.9222, "step": 52561 }, { "epoch": 0.99, "learning_rate": 9.076776835661994e-10, "loss": 0.9774, "step": 52562 }, { "epoch": 0.99, "learning_rate": 9.035661463685508e-10, "loss": 1.0226, "step": 52563 }, { "epoch": 0.99, "learning_rate": 8.994639407200468e-10, "loss": 0.9957, "step": 52564 }, { "epoch": 0.99, "learning_rate": 8.953710666365078e-10, "loss": 0.8189, "step": 52565 }, { "epoch": 0.99, "learning_rate": 8.912875241329222e-10, "loss": 0.8931, "step": 52566 }, { "epoch": 0.99, "learning_rate": 8.872133132245553e-10, "loss": 1.0589, "step": 52567 }, { "epoch": 0.99, "learning_rate": 8.831484339269502e-10, "loss": 0.8058, "step": 52568 }, { "epoch": 0.99, "learning_rate": 8.790928862548176e-10, "loss": 1.0915, "step": 52569 }, { "epoch": 0.99, "learning_rate": 8.750466702237004e-10, "loss": 0.8024, "step": 52570 }, { "epoch": 0.99, "learning_rate": 8.710097858485866e-10, "loss": 0.9288, "step": 52571 }, { "epoch": 0.99, "learning_rate": 8.669822331441869e-10, "loss": 0.9062, "step": 52572 }, { "epoch": 0.99, "learning_rate": 8.629640121260441e-10, "loss": 0.5751, "step": 52573 }, { "epoch": 0.99, "learning_rate": 8.589551228091464e-10, "loss": 0.9477, "step": 52574 }, { "epoch": 0.99, "learning_rate": 8.549555652079266e-10, "loss": 1.1688, "step": 52575 }, { "epoch": 0.99, "learning_rate": 8.50965339337928e-10, "loss": 0.8921, "step": 52576 }, { "epoch": 0.99, "learning_rate": 8.469844452138609e-10, "loss": 0.7132, "step": 52577 }, { "epoch": 0.99, "learning_rate": 8.430128828501582e-10, "loss": 0.6789, "step": 52578 }, { "epoch": 0.99, "learning_rate": 8.390506522623632e-10, "loss": 0.728, "step": 52579 }, { "epoch": 0.99, "learning_rate": 8.350977534649085e-10, "loss": 1.0192, "step": 52580 }, { "epoch": 0.99, "learning_rate": 8.311541864725047e-10, "loss": 0.9888, "step": 52581 }, { "epoch": 0.99, "learning_rate": 8.272199512998625e-10, "loss": 1.0561, "step": 52582 }, { "epoch": 0.99, "learning_rate": 8.232950479616919e-10, "loss": 0.9206, "step": 52583 }, { "epoch": 0.99, "learning_rate": 8.193794764729813e-10, "loss": 0.7341, "step": 52584 }, { "epoch": 0.99, "learning_rate": 8.154732368478857e-10, "loss": 0.7889, "step": 52585 }, { "epoch": 0.99, "learning_rate": 8.115763291013934e-10, "loss": 0.9288, "step": 52586 }, { "epoch": 0.99, "learning_rate": 8.076887532476596e-10, "loss": 1.0905, "step": 52587 }, { "epoch": 0.99, "learning_rate": 8.038105093013948e-10, "loss": 0.9755, "step": 52588 }, { "epoch": 0.99, "learning_rate": 7.999415972770319e-10, "loss": 0.9504, "step": 52589 }, { "epoch": 0.99, "learning_rate": 7.960820171890038e-10, "loss": 0.8928, "step": 52590 }, { "epoch": 0.99, "learning_rate": 7.922317690520209e-10, "loss": 0.653, "step": 52591 }, { "epoch": 0.99, "learning_rate": 7.883908528802386e-10, "loss": 0.7168, "step": 52592 }, { "epoch": 0.99, "learning_rate": 7.845592686878123e-10, "loss": 1.0934, "step": 52593 }, { "epoch": 0.99, "learning_rate": 7.807370164891748e-10, "loss": 1.2114, "step": 52594 }, { "epoch": 0.99, "learning_rate": 7.76924096298759e-10, "loss": 0.5749, "step": 52595 }, { "epoch": 0.99, "learning_rate": 7.731205081304427e-10, "loss": 0.7188, "step": 52596 }, { "epoch": 0.99, "learning_rate": 7.693262519989364e-10, "loss": 0.9407, "step": 52597 }, { "epoch": 0.99, "learning_rate": 7.655413279181179e-10, "loss": 0.84, "step": 52598 }, { "epoch": 0.99, "learning_rate": 7.617657359021424e-10, "loss": 0.9105, "step": 52599 }, { "epoch": 0.99, "learning_rate": 7.579994759648879e-10, "loss": 1.0345, "step": 52600 }, { "epoch": 0.99, "learning_rate": 7.542425481207872e-10, "loss": 0.9497, "step": 52601 }, { "epoch": 0.99, "learning_rate": 7.504949523837179e-10, "loss": 0.7669, "step": 52602 }, { "epoch": 0.99, "learning_rate": 7.467566887678356e-10, "loss": 0.8226, "step": 52603 }, { "epoch": 0.99, "learning_rate": 7.430277572867406e-10, "loss": 0.9123, "step": 52604 }, { "epoch": 0.99, "learning_rate": 7.39308157954588e-10, "loss": 0.7209, "step": 52605 }, { "epoch": 0.99, "learning_rate": 7.355978907852557e-10, "loss": 1.1287, "step": 52606 }, { "epoch": 0.99, "learning_rate": 7.318969557923439e-10, "loss": 0.9537, "step": 52607 }, { "epoch": 0.99, "learning_rate": 7.282053529902855e-10, "loss": 0.7439, "step": 52608 }, { "epoch": 0.99, "learning_rate": 7.245230823921256e-10, "loss": 0.9484, "step": 52609 }, { "epoch": 0.99, "learning_rate": 7.208501440120197e-10, "loss": 0.9452, "step": 52610 }, { "epoch": 0.99, "learning_rate": 7.171865378638454e-10, "loss": 0.9285, "step": 52611 }, { "epoch": 0.99, "learning_rate": 7.135322639609255e-10, "loss": 1.0024, "step": 52612 }, { "epoch": 0.99, "learning_rate": 7.098873223171376e-10, "loss": 0.842, "step": 52613 }, { "epoch": 0.99, "learning_rate": 7.062517129458046e-10, "loss": 0.7616, "step": 52614 }, { "epoch": 0.99, "learning_rate": 7.026254358610818e-10, "loss": 0.8537, "step": 52615 }, { "epoch": 0.99, "learning_rate": 6.990084910757366e-10, "loss": 0.8672, "step": 52616 }, { "epoch": 0.99, "learning_rate": 6.954008786039246e-10, "loss": 0.9462, "step": 52617 }, { "epoch": 0.99, "learning_rate": 6.918025984586907e-10, "loss": 0.9648, "step": 52618 }, { "epoch": 0.99, "learning_rate": 6.882136506536352e-10, "loss": 1.1298, "step": 52619 }, { "epoch": 0.99, "learning_rate": 6.846340352020809e-10, "loss": 0.8622, "step": 52620 }, { "epoch": 0.99, "learning_rate": 6.810637521176277e-10, "loss": 0.9357, "step": 52621 }, { "epoch": 0.99, "learning_rate": 6.775028014135987e-10, "loss": 1.0242, "step": 52622 }, { "epoch": 0.99, "learning_rate": 6.739511831027612e-10, "loss": 0.9934, "step": 52623 }, { "epoch": 0.99, "learning_rate": 6.704088971989931e-10, "loss": 0.9985, "step": 52624 }, { "epoch": 0.99, "learning_rate": 6.668759437153394e-10, "loss": 1.1567, "step": 52625 }, { "epoch": 0.99, "learning_rate": 6.633523226648453e-10, "loss": 1.0721, "step": 52626 }, { "epoch": 0.99, "learning_rate": 6.598380340608335e-10, "loss": 0.7541, "step": 52627 }, { "epoch": 0.99, "learning_rate": 6.56333077916349e-10, "loss": 0.9011, "step": 52628 }, { "epoch": 0.99, "learning_rate": 6.528374542444371e-10, "loss": 0.7668, "step": 52629 }, { "epoch": 0.99, "learning_rate": 6.493511630581428e-10, "loss": 0.7846, "step": 52630 }, { "epoch": 0.99, "learning_rate": 6.458742043705113e-10, "loss": 1.0256, "step": 52631 }, { "epoch": 0.99, "learning_rate": 6.424065781945877e-10, "loss": 0.9154, "step": 52632 }, { "epoch": 0.99, "learning_rate": 6.389482845434169e-10, "loss": 0.7661, "step": 52633 }, { "epoch": 0.99, "learning_rate": 6.354993234297668e-10, "loss": 1.0081, "step": 52634 }, { "epoch": 0.99, "learning_rate": 6.320596948664048e-10, "loss": 0.8289, "step": 52635 }, { "epoch": 0.99, "learning_rate": 6.286293988663761e-10, "loss": 0.8757, "step": 52636 }, { "epoch": 0.99, "learning_rate": 6.252084354424482e-10, "loss": 0.8542, "step": 52637 }, { "epoch": 0.99, "learning_rate": 6.21796804607111e-10, "loss": 1.0483, "step": 52638 }, { "epoch": 0.99, "learning_rate": 6.183945063736873e-10, "loss": 0.901, "step": 52639 }, { "epoch": 0.99, "learning_rate": 6.150015407543896e-10, "loss": 1.1679, "step": 52640 }, { "epoch": 0.99, "learning_rate": 6.116179077619855e-10, "loss": 0.7221, "step": 52641 }, { "epoch": 0.99, "learning_rate": 6.082436074092424e-10, "loss": 0.7586, "step": 52642 }, { "epoch": 0.99, "learning_rate": 6.048786397086504e-10, "loss": 1.0131, "step": 52643 }, { "epoch": 0.99, "learning_rate": 6.01523004672977e-10, "loss": 1.175, "step": 52644 }, { "epoch": 0.99, "learning_rate": 5.981767023144347e-10, "loss": 0.8984, "step": 52645 }, { "epoch": 0.99, "learning_rate": 5.948397326455136e-10, "loss": 0.9575, "step": 52646 }, { "epoch": 0.99, "learning_rate": 5.915120956789811e-10, "loss": 0.7383, "step": 52647 }, { "epoch": 0.99, "learning_rate": 5.881937914273273e-10, "loss": 0.7563, "step": 52648 }, { "epoch": 0.99, "learning_rate": 5.84884819902487e-10, "loss": 1.0984, "step": 52649 }, { "epoch": 0.99, "learning_rate": 5.815851811169503e-10, "loss": 1.2224, "step": 52650 }, { "epoch": 0.99, "learning_rate": 5.782948750832073e-10, "loss": 0.8555, "step": 52651 }, { "epoch": 0.99, "learning_rate": 5.750139018137479e-10, "loss": 0.801, "step": 52652 }, { "epoch": 0.99, "learning_rate": 5.717422613202294e-10, "loss": 1.0007, "step": 52653 }, { "epoch": 0.99, "learning_rate": 5.684799536154195e-10, "loss": 0.7354, "step": 52654 }, { "epoch": 0.99, "learning_rate": 5.652269787109754e-10, "loss": 0.9128, "step": 52655 }, { "epoch": 0.99, "learning_rate": 5.619833366196647e-10, "loss": 0.9268, "step": 52656 }, { "epoch": 0.99, "learning_rate": 5.587490273531449e-10, "loss": 0.8809, "step": 52657 }, { "epoch": 0.99, "learning_rate": 5.555240509236281e-10, "loss": 0.778, "step": 52658 }, { "epoch": 0.99, "learning_rate": 5.523084073430496e-10, "loss": 0.8404, "step": 52659 }, { "epoch": 0.99, "learning_rate": 5.491020966236216e-10, "loss": 0.8671, "step": 52660 }, { "epoch": 0.99, "learning_rate": 5.45905118777279e-10, "loss": 0.8822, "step": 52661 }, { "epoch": 0.99, "learning_rate": 5.427174738156793e-10, "loss": 0.9796, "step": 52662 }, { "epoch": 0.99, "learning_rate": 5.395391617510348e-10, "loss": 1.0912, "step": 52663 }, { "epoch": 0.99, "learning_rate": 5.363701825952805e-10, "loss": 0.7473, "step": 52664 }, { "epoch": 0.99, "learning_rate": 5.332105363597962e-10, "loss": 1.0242, "step": 52665 }, { "epoch": 0.99, "learning_rate": 5.300602230567941e-10, "loss": 1.015, "step": 52666 }, { "epoch": 0.99, "learning_rate": 5.26919242697932e-10, "loss": 0.9294, "step": 52667 }, { "epoch": 0.99, "learning_rate": 5.237875952948668e-10, "loss": 0.9205, "step": 52668 }, { "epoch": 0.99, "learning_rate": 5.206652808595336e-10, "loss": 1.0586, "step": 52669 }, { "epoch": 0.99, "learning_rate": 5.175522994033122e-10, "loss": 0.9779, "step": 52670 }, { "epoch": 0.99, "learning_rate": 5.144486509378599e-10, "loss": 0.8615, "step": 52671 }, { "epoch": 0.99, "learning_rate": 5.11354335474834e-10, "loss": 0.9666, "step": 52672 }, { "epoch": 0.99, "learning_rate": 5.082693530256145e-10, "loss": 0.7752, "step": 52673 }, { "epoch": 0.99, "learning_rate": 5.05193703602136e-10, "loss": 0.8425, "step": 52674 }, { "epoch": 0.99, "learning_rate": 5.021273872155008e-10, "loss": 1.1052, "step": 52675 }, { "epoch": 0.99, "learning_rate": 4.990704038773664e-10, "loss": 0.7601, "step": 52676 }, { "epoch": 0.99, "learning_rate": 4.960227535988349e-10, "loss": 0.9304, "step": 52677 }, { "epoch": 0.99, "learning_rate": 4.929844363918413e-10, "loss": 1.0379, "step": 52678 }, { "epoch": 0.99, "learning_rate": 4.899554522672101e-10, "loss": 0.8835, "step": 52679 }, { "epoch": 0.99, "learning_rate": 4.869358012365988e-10, "loss": 1.0849, "step": 52680 }, { "epoch": 0.99, "learning_rate": 4.83925483310832e-10, "loss": 1.0969, "step": 52681 }, { "epoch": 0.99, "learning_rate": 4.809244985018446e-10, "loss": 1.0776, "step": 52682 }, { "epoch": 0.99, "learning_rate": 4.779328468201838e-10, "loss": 0.8293, "step": 52683 }, { "epoch": 0.99, "learning_rate": 4.749505282772293e-10, "loss": 0.994, "step": 52684 }, { "epoch": 0.99, "learning_rate": 4.71977542884361e-10, "loss": 0.771, "step": 52685 }, { "epoch": 0.99, "learning_rate": 4.690138906524033e-10, "loss": 1.1945, "step": 52686 }, { "epoch": 0.99, "learning_rate": 4.660595715927363e-10, "loss": 0.9046, "step": 52687 }, { "epoch": 0.99, "learning_rate": 4.6311458571590695e-10, "loss": 0.914, "step": 52688 }, { "epoch": 0.99, "learning_rate": 4.601789330332951e-10, "loss": 0.7516, "step": 52689 }, { "epoch": 0.99, "learning_rate": 4.5725261355544783e-10, "loss": 0.767, "step": 52690 }, { "epoch": 0.99, "learning_rate": 4.543356272940225e-10, "loss": 0.9113, "step": 52691 }, { "epoch": 0.99, "learning_rate": 4.514279742590111e-10, "loss": 0.7204, "step": 52692 }, { "epoch": 0.99, "learning_rate": 4.4852965446207097e-10, "loss": 1.103, "step": 52693 }, { "epoch": 0.99, "learning_rate": 4.456406679137493e-10, "loss": 1.032, "step": 52694 }, { "epoch": 0.99, "learning_rate": 4.427610146245931e-10, "loss": 0.8936, "step": 52695 }, { "epoch": 0.99, "learning_rate": 4.398906946054271e-10, "loss": 0.8866, "step": 52696 }, { "epoch": 0.99, "learning_rate": 4.37029707867076e-10, "loss": 0.7603, "step": 52697 }, { "epoch": 0.99, "learning_rate": 4.341780544203644e-10, "loss": 0.97, "step": 52698 }, { "epoch": 0.99, "learning_rate": 4.313357342758395e-10, "loss": 0.9857, "step": 52699 }, { "epoch": 0.99, "learning_rate": 4.285027474440484e-10, "loss": 0.9479, "step": 52700 }, { "epoch": 0.99, "learning_rate": 4.256790939355382e-10, "loss": 0.7946, "step": 52701 }, { "epoch": 0.99, "learning_rate": 4.22864773760856e-10, "loss": 0.9646, "step": 52702 }, { "epoch": 0.99, "learning_rate": 4.2005978693054894e-10, "loss": 0.922, "step": 52703 }, { "epoch": 0.99, "learning_rate": 4.1726413345516414e-10, "loss": 0.7299, "step": 52704 }, { "epoch": 0.99, "learning_rate": 4.1447781334497117e-10, "loss": 0.9236, "step": 52705 }, { "epoch": 0.99, "learning_rate": 4.1170082661051713e-10, "loss": 1.1002, "step": 52706 }, { "epoch": 0.99, "learning_rate": 4.0893317326234917e-10, "loss": 1.0708, "step": 52707 }, { "epoch": 0.99, "learning_rate": 4.061748533101817e-10, "loss": 0.7002, "step": 52708 }, { "epoch": 0.99, "learning_rate": 4.03425866765117e-10, "loss": 0.9877, "step": 52709 }, { "epoch": 0.99, "learning_rate": 4.0068621363686946e-10, "loss": 0.8997, "step": 52710 }, { "epoch": 0.99, "learning_rate": 3.9795589393570864e-10, "loss": 0.7994, "step": 52711 }, { "epoch": 0.99, "learning_rate": 3.9523490767218176e-10, "loss": 1.0777, "step": 52712 }, { "epoch": 0.99, "learning_rate": 3.925232548560032e-10, "loss": 0.8843, "step": 52713 }, { "epoch": 0.99, "learning_rate": 3.8982093549744247e-10, "loss": 0.9344, "step": 52714 }, { "epoch": 0.99, "learning_rate": 3.8712794960676925e-10, "loss": 0.8699, "step": 52715 }, { "epoch": 0.99, "learning_rate": 3.8444429719397547e-10, "loss": 0.6629, "step": 52716 }, { "epoch": 0.99, "learning_rate": 3.8176997826905315e-10, "loss": 0.8023, "step": 52717 }, { "epoch": 0.99, "learning_rate": 3.7910499284171676e-10, "loss": 1.1783, "step": 52718 }, { "epoch": 0.99, "learning_rate": 3.764493409225134e-10, "loss": 1.0115, "step": 52719 }, { "epoch": 0.99, "learning_rate": 3.7380302252087997e-10, "loss": 0.9468, "step": 52720 }, { "epoch": 0.99, "learning_rate": 3.711660376465309e-10, "loss": 0.6508, "step": 52721 }, { "epoch": 0.99, "learning_rate": 3.6853838631001337e-10, "loss": 0.8133, "step": 52722 }, { "epoch": 0.99, "learning_rate": 3.659200685204867e-10, "loss": 0.8857, "step": 52723 }, { "epoch": 0.99, "learning_rate": 3.633110842879428e-10, "loss": 0.9631, "step": 52724 }, { "epoch": 0.99, "learning_rate": 3.6071143362237383e-10, "loss": 1.1748, "step": 52725 }, { "epoch": 0.99, "learning_rate": 3.581211165332166e-10, "loss": 0.7856, "step": 52726 }, { "epoch": 0.99, "learning_rate": 3.555401330301855e-10, "loss": 0.812, "step": 52727 }, { "epoch": 0.99, "learning_rate": 3.529684831227176e-10, "loss": 0.9579, "step": 52728 }, { "epoch": 0.99, "learning_rate": 3.5040616682080476e-10, "loss": 0.8351, "step": 52729 }, { "epoch": 0.99, "learning_rate": 3.478531841338839e-10, "loss": 0.9632, "step": 52730 }, { "epoch": 0.99, "learning_rate": 3.4530953507139196e-10, "loss": 1.2796, "step": 52731 }, { "epoch": 0.99, "learning_rate": 3.4277521964276586e-10, "loss": 1.0969, "step": 52732 }, { "epoch": 0.99, "learning_rate": 3.4025023785771996e-10, "loss": 1.0349, "step": 52733 }, { "epoch": 0.99, "learning_rate": 3.3773458972541363e-10, "loss": 0.7129, "step": 52734 }, { "epoch": 0.99, "learning_rate": 3.3522827525556134e-10, "loss": 0.7911, "step": 52735 }, { "epoch": 0.99, "learning_rate": 3.327312944570449e-10, "loss": 0.9968, "step": 52736 }, { "epoch": 0.99, "learning_rate": 3.302436473395787e-10, "loss": 0.9891, "step": 52737 }, { "epoch": 1.0, "learning_rate": 3.277653339125997e-10, "loss": 1.0328, "step": 52738 }, { "epoch": 1.0, "learning_rate": 3.2529635418471207e-10, "loss": 0.9226, "step": 52739 }, { "epoch": 1.0, "learning_rate": 3.228367081656303e-10, "loss": 0.9326, "step": 52740 }, { "epoch": 1.0, "learning_rate": 3.203863958645137e-10, "loss": 0.7379, "step": 52741 }, { "epoch": 1.0, "learning_rate": 3.1794541729052166e-10, "loss": 0.584, "step": 52742 }, { "epoch": 1.0, "learning_rate": 3.155137724525359e-10, "loss": 0.9993, "step": 52743 }, { "epoch": 1.0, "learning_rate": 3.1309146135999333e-10, "loss": 0.9871, "step": 52744 }, { "epoch": 1.0, "learning_rate": 3.1067848402149825e-10, "loss": 1.032, "step": 52745 }, { "epoch": 1.0, "learning_rate": 3.0827484044620993e-10, "loss": 0.8411, "step": 52746 }, { "epoch": 1.0, "learning_rate": 3.0588053064328773e-10, "loss": 0.8514, "step": 52747 }, { "epoch": 1.0, "learning_rate": 3.034955546216134e-10, "loss": 0.6403, "step": 52748 }, { "epoch": 1.0, "learning_rate": 3.0111991239006874e-10, "loss": 1.0269, "step": 52749 }, { "epoch": 1.0, "learning_rate": 2.987536039575356e-10, "loss": 1.1835, "step": 52750 }, { "epoch": 1.0, "learning_rate": 2.9639662933261813e-10, "loss": 0.9663, "step": 52751 }, { "epoch": 1.0, "learning_rate": 2.940489885244757e-10, "loss": 0.8898, "step": 52752 }, { "epoch": 1.0, "learning_rate": 2.9171068154171256e-10, "loss": 0.794, "step": 52753 }, { "epoch": 1.0, "learning_rate": 2.893817083929329e-10, "loss": 0.7911, "step": 52754 }, { "epoch": 1.0, "learning_rate": 2.870620690870185e-10, "loss": 0.9099, "step": 52755 }, { "epoch": 1.0, "learning_rate": 2.8475176363257364e-10, "loss": 1.112, "step": 52756 }, { "epoch": 1.0, "learning_rate": 2.824507920382025e-10, "loss": 1.0609, "step": 52757 }, { "epoch": 1.0, "learning_rate": 2.8015915431278683e-10, "loss": 0.9801, "step": 52758 }, { "epoch": 1.0, "learning_rate": 2.7787685046437584e-10, "loss": 0.9564, "step": 52759 }, { "epoch": 1.0, "learning_rate": 2.756038805015737e-10, "loss": 0.8705, "step": 52760 }, { "epoch": 1.0, "learning_rate": 2.7334024443326223e-10, "loss": 0.7706, "step": 52761 }, { "epoch": 1.0, "learning_rate": 2.710859422674905e-10, "loss": 0.9081, "step": 52762 }, { "epoch": 1.0, "learning_rate": 2.688409740128628e-10, "loss": 1.0107, "step": 52763 }, { "epoch": 1.0, "learning_rate": 2.666053396779833e-10, "loss": 0.8406, "step": 52764 }, { "epoch": 1.0, "learning_rate": 2.643790392706236e-10, "loss": 0.7677, "step": 52765 }, { "epoch": 1.0, "learning_rate": 2.6216207279966544e-10, "loss": 0.7289, "step": 52766 }, { "epoch": 1.0, "learning_rate": 2.59954440273158e-10, "loss": 0.8866, "step": 52767 }, { "epoch": 1.0, "learning_rate": 2.5775614169915033e-10, "loss": 0.7884, "step": 52768 }, { "epoch": 1.0, "learning_rate": 2.5556717708624665e-10, "loss": 1.1321, "step": 52769 }, { "epoch": 1.0, "learning_rate": 2.533875464422186e-10, "loss": 0.8544, "step": 52770 }, { "epoch": 1.0, "learning_rate": 2.5121724977539285e-10, "loss": 0.8764, "step": 52771 }, { "epoch": 1.0, "learning_rate": 2.4905628709409603e-10, "loss": 0.8489, "step": 52772 }, { "epoch": 1.0, "learning_rate": 2.4690465840609965e-10, "loss": 0.6921, "step": 52773 }, { "epoch": 1.0, "learning_rate": 2.4476236371945294e-10, "loss": 1.0189, "step": 52774 }, { "epoch": 1.0, "learning_rate": 2.4262940304220494e-10, "loss": 1.0079, "step": 52775 }, { "epoch": 1.0, "learning_rate": 2.405057763821272e-10, "loss": 0.657, "step": 52776 }, { "epoch": 1.0, "learning_rate": 2.3839148374782406e-10, "loss": 0.731, "step": 52777 }, { "epoch": 1.0, "learning_rate": 2.3628652514651183e-10, "loss": 0.7194, "step": 52778 }, { "epoch": 1.0, "learning_rate": 2.3419090058596215e-10, "loss": 0.8412, "step": 52779 }, { "epoch": 1.0, "learning_rate": 2.3210461007477924e-10, "loss": 0.7962, "step": 52780 }, { "epoch": 1.0, "learning_rate": 2.3002765361990199e-10, "loss": 1.0348, "step": 52781 }, { "epoch": 1.0, "learning_rate": 2.2796003122965703e-10, "loss": 1.0333, "step": 52782 }, { "epoch": 1.0, "learning_rate": 2.2590174291153843e-10, "loss": 0.9107, "step": 52783 }, { "epoch": 1.0, "learning_rate": 2.2385278867331772e-10, "loss": 0.7502, "step": 52784 }, { "epoch": 1.0, "learning_rate": 2.2181316852248892e-10, "loss": 0.7779, "step": 52785 }, { "epoch": 1.0, "learning_rate": 2.1978288246682355e-10, "loss": 1.009, "step": 52786 }, { "epoch": 1.0, "learning_rate": 2.1776193051381567e-10, "loss": 0.9688, "step": 52787 }, { "epoch": 1.0, "learning_rate": 2.1575031267095926e-10, "loss": 0.99, "step": 52788 }, { "epoch": 1.0, "learning_rate": 2.1374802894602588e-10, "loss": 1.1097, "step": 52789 }, { "epoch": 1.0, "learning_rate": 2.1175507934623196e-10, "loss": 0.8972, "step": 52790 }, { "epoch": 1.0, "learning_rate": 2.0977146387907155e-10, "loss": 0.9565, "step": 52791 }, { "epoch": 1.0, "learning_rate": 2.077971825520386e-10, "loss": 0.7584, "step": 52792 }, { "epoch": 1.0, "learning_rate": 2.0583223537234965e-10, "loss": 0.8922, "step": 52793 }, { "epoch": 1.0, "learning_rate": 2.038766223474986e-10, "loss": 0.8467, "step": 52794 }, { "epoch": 1.0, "learning_rate": 2.0193034348470198e-10, "loss": 1.165, "step": 52795 }, { "epoch": 1.0, "learning_rate": 1.999933987911762e-10, "loss": 0.9381, "step": 52796 }, { "epoch": 1.0, "learning_rate": 1.9806578827441525e-10, "loss": 0.8054, "step": 52797 }, { "epoch": 1.0, "learning_rate": 1.961475119410805e-10, "loss": 0.9572, "step": 52798 }, { "epoch": 1.0, "learning_rate": 1.9423856979922107e-10, "loss": 0.7578, "step": 52799 }, { "epoch": 1.0, "learning_rate": 1.9233896185494317e-10, "loss": 1.0867, "step": 52800 }, { "epoch": 1.0, "learning_rate": 1.9044868811601835e-10, "loss": 0.8149, "step": 52801 }, { "epoch": 1.0, "learning_rate": 1.8856774858938554e-10, "loss": 0.8759, "step": 52802 }, { "epoch": 1.0, "learning_rate": 1.866961432819836e-10, "loss": 0.9177, "step": 52803 }, { "epoch": 1.0, "learning_rate": 1.8483387220075144e-10, "loss": 0.9023, "step": 52804 }, { "epoch": 1.0, "learning_rate": 1.8298093535262795e-10, "loss": 0.7303, "step": 52805 }, { "epoch": 1.0, "learning_rate": 1.8113733274482958e-10, "loss": 1.059, "step": 52806 }, { "epoch": 1.0, "learning_rate": 1.7930306438374013e-10, "loss": 0.865, "step": 52807 }, { "epoch": 1.0, "learning_rate": 1.7747813027657602e-10, "loss": 1.0254, "step": 52808 }, { "epoch": 1.0, "learning_rate": 1.7566253043027613e-10, "loss": 0.8883, "step": 52809 }, { "epoch": 1.0, "learning_rate": 1.7385626485122432e-10, "loss": 0.9138, "step": 52810 }, { "epoch": 1.0, "learning_rate": 1.720593335463594e-10, "loss": 0.917, "step": 52811 }, { "epoch": 1.0, "learning_rate": 1.7027173652234276e-10, "loss": 1.0551, "step": 52812 }, { "epoch": 1.0, "learning_rate": 1.6849347378583568e-10, "loss": 0.9385, "step": 52813 }, { "epoch": 1.0, "learning_rate": 1.6672454534377714e-10, "loss": 0.8719, "step": 52814 }, { "epoch": 1.0, "learning_rate": 1.649649512022733e-10, "loss": 0.9483, "step": 52815 }, { "epoch": 1.0, "learning_rate": 1.6321469136826306e-10, "loss": 0.8916, "step": 52816 }, { "epoch": 1.0, "learning_rate": 1.6147376584813024e-10, "loss": 0.9536, "step": 52817 }, { "epoch": 1.0, "learning_rate": 1.5974217464825859e-10, "loss": 0.9475, "step": 52818 }, { "epoch": 1.0, "learning_rate": 1.5801991777558702e-10, "loss": 0.9297, "step": 52819 }, { "epoch": 1.0, "learning_rate": 1.5630699523594418e-10, "loss": 0.8377, "step": 52820 }, { "epoch": 1.0, "learning_rate": 1.5460340703599143e-10, "loss": 1.028, "step": 52821 }, { "epoch": 1.0, "learning_rate": 1.5290915318239008e-10, "loss": 0.9037, "step": 52822 }, { "epoch": 1.0, "learning_rate": 1.5122423368096884e-10, "loss": 0.7816, "step": 52823 }, { "epoch": 1.0, "learning_rate": 1.4954864853811145e-10, "loss": 1.0713, "step": 52824 }, { "epoch": 1.0, "learning_rate": 1.478823977604793e-10, "loss": 1.0613, "step": 52825 }, { "epoch": 1.0, "learning_rate": 1.4622548135390102e-10, "loss": 0.9753, "step": 52826 }, { "epoch": 1.0, "learning_rate": 1.445778993247604e-10, "loss": 0.8722, "step": 52827 }, { "epoch": 1.0, "learning_rate": 1.4293965167888614e-10, "loss": 0.8375, "step": 52828 }, { "epoch": 1.0, "learning_rate": 1.4131073842266197e-10, "loss": 0.8427, "step": 52829 }, { "epoch": 1.0, "learning_rate": 1.3969115956219414e-10, "loss": 0.8165, "step": 52830 }, { "epoch": 1.0, "learning_rate": 1.380809151035889e-10, "loss": 0.8531, "step": 52831 }, { "epoch": 1.0, "learning_rate": 1.3648000505267489e-10, "loss": 0.7565, "step": 52832 }, { "epoch": 1.0, "learning_rate": 1.3488842941555835e-10, "loss": 0.7936, "step": 52833 }, { "epoch": 1.0, "learning_rate": 1.3330618819779039e-10, "loss": 0.8661, "step": 52834 }, { "epoch": 1.0, "learning_rate": 1.3173328140603238e-10, "loss": 1.0265, "step": 52835 }, { "epoch": 1.0, "learning_rate": 1.301697090455578e-10, "loss": 0.7567, "step": 52836 }, { "epoch": 1.0, "learning_rate": 1.286154711221954e-10, "loss": 0.8677, "step": 52837 }, { "epoch": 1.0, "learning_rate": 1.2707056764232894e-10, "loss": 0.9437, "step": 52838 }, { "epoch": 1.0, "learning_rate": 1.2553499861095442e-10, "loss": 0.8851, "step": 52839 }, { "epoch": 1.0, "learning_rate": 1.2400876403445562e-10, "loss": 1.0501, "step": 52840 }, { "epoch": 1.0, "learning_rate": 1.2249186391810607e-10, "loss": 0.9384, "step": 52841 }, { "epoch": 1.0, "learning_rate": 1.209842982677345e-10, "loss": 0.8009, "step": 52842 }, { "epoch": 1.0, "learning_rate": 1.1948606708916956e-10, "loss": 1.0195, "step": 52843 }, { "epoch": 1.0, "learning_rate": 1.1799717038768476e-10, "loss": 1.2898, "step": 52844 }, { "epoch": 1.0, "learning_rate": 1.1651760816883128e-10, "loss": 0.6941, "step": 52845 }, { "epoch": 1.0, "learning_rate": 1.1504738043816021e-10, "loss": 0.6507, "step": 52846 }, { "epoch": 1.0, "learning_rate": 1.1358648720150023e-10, "loss": 0.8721, "step": 52847 }, { "epoch": 1.0, "learning_rate": 1.1213492846384732e-10, "loss": 0.7868, "step": 52848 }, { "epoch": 1.0, "learning_rate": 1.1069270423103018e-10, "loss": 1.1046, "step": 52849 }, { "epoch": 1.0, "learning_rate": 1.0925981450832235e-10, "loss": 1.1073, "step": 52850 }, { "epoch": 1.0, "learning_rate": 1.0783625930071984e-10, "loss": 0.8843, "step": 52851 }, { "epoch": 1.0, "learning_rate": 1.0642203861377376e-10, "loss": 0.9859, "step": 52852 }, { "epoch": 1.0, "learning_rate": 1.0501715245303523e-10, "loss": 0.9646, "step": 52853 }, { "epoch": 1.0, "learning_rate": 1.0362160082350026e-10, "loss": 0.7835, "step": 52854 }, { "epoch": 1.0, "learning_rate": 1.0223538373016484e-10, "loss": 0.9636, "step": 52855 }, { "epoch": 1.0, "learning_rate": 1.0085850117885765e-10, "loss": 0.9432, "step": 52856 }, { "epoch": 1.0, "learning_rate": 9.949095317401958e-11, "loss": 0.9377, "step": 52857 }, { "epoch": 1.0, "learning_rate": 9.813273972092418e-11, "loss": 0.7185, "step": 52858 }, { "epoch": 1.0, "learning_rate": 9.678386082484504e-11, "loss": 0.8156, "step": 52859 }, { "epoch": 1.0, "learning_rate": 9.544431649077813e-11, "loss": 0.8828, "step": 52860 }, { "epoch": 1.0, "learning_rate": 9.411410672371945e-11, "loss": 0.7607, "step": 52861 }, { "epoch": 1.0, "learning_rate": 9.279323152838749e-11, "loss": 1.0313, "step": 52862 }, { "epoch": 1.0, "learning_rate": 9.148169091005577e-11, "loss": 0.9249, "step": 52863 }, { "epoch": 1.0, "learning_rate": 9.017948487344275e-11, "loss": 0.7074, "step": 52864 }, { "epoch": 1.0, "learning_rate": 8.888661342354444e-11, "loss": 1.0716, "step": 52865 }, { "epoch": 1.0, "learning_rate": 8.760307656507926e-11, "loss": 0.8035, "step": 52866 }, { "epoch": 1.0, "learning_rate": 8.63288743027657e-11, "loss": 0.8656, "step": 52867 }, { "epoch": 1.0, "learning_rate": 8.506400664159975e-11, "loss": 0.9595, "step": 52868 }, { "epoch": 1.0, "learning_rate": 8.380847358602229e-11, "loss": 1.0321, "step": 52869 }, { "epoch": 1.0, "learning_rate": 8.256227514075177e-11, "loss": 0.7289, "step": 52870 }, { "epoch": 1.0, "learning_rate": 8.13254113107842e-11, "loss": 0.8792, "step": 52871 }, { "epoch": 1.0, "learning_rate": 8.009788210028291e-11, "loss": 0.8712, "step": 52872 }, { "epoch": 1.0, "learning_rate": 7.88796875142439e-11, "loss": 0.8494, "step": 52873 }, { "epoch": 1.0, "learning_rate": 7.767082755683053e-11, "loss": 0.9245, "step": 52874 }, { "epoch": 1.0, "learning_rate": 7.647130223276123e-11, "loss": 1.1066, "step": 52875 }, { "epoch": 1.0, "learning_rate": 7.528111154675444e-11, "loss": 0.9349, "step": 52876 }, { "epoch": 1.0, "learning_rate": 7.410025550269595e-11, "loss": 0.813, "step": 52877 }, { "epoch": 1.0, "learning_rate": 7.292873410558177e-11, "loss": 0.7522, "step": 52878 }, { "epoch": 1.0, "learning_rate": 7.176654735929767e-11, "loss": 0.7141, "step": 52879 }, { "epoch": 1.0, "learning_rate": 7.061369526828454e-11, "loss": 0.8875, "step": 52880 }, { "epoch": 1.0, "learning_rate": 6.947017783726084e-11, "loss": 0.8311, "step": 52881 }, { "epoch": 1.0, "learning_rate": 6.833599506983479e-11, "loss": 0.7851, "step": 52882 }, { "epoch": 1.0, "learning_rate": 6.72111469710024e-11, "loss": 0.9842, "step": 52883 }, { "epoch": 1.0, "learning_rate": 6.609563354409432e-11, "loss": 0.836, "step": 52884 }, { "epoch": 1.0, "learning_rate": 6.498945479410657e-11, "loss": 0.7378, "step": 52885 }, { "epoch": 1.0, "learning_rate": 6.389261072464737e-11, "loss": 0.9844, "step": 52886 }, { "epoch": 1.0, "learning_rate": 6.280510133988004e-11, "loss": 1.1162, "step": 52887 }, { "epoch": 1.0, "learning_rate": 6.172692664424551e-11, "loss": 0.8969, "step": 52888 }, { "epoch": 1.0, "learning_rate": 6.065808664135197e-11, "loss": 0.8036, "step": 52889 }, { "epoch": 1.0, "learning_rate": 5.959858133508523e-11, "loss": 0.691, "step": 52890 }, { "epoch": 1.0, "learning_rate": 5.854841072988615e-11, "loss": 0.8485, "step": 52891 }, { "epoch": 1.0, "learning_rate": 5.750757482936298e-11, "loss": 0.6486, "step": 52892 }, { "epoch": 1.0, "learning_rate": 5.6476073637401485e-11, "loss": 1.0699, "step": 52893 }, { "epoch": 1.0, "learning_rate": 5.545390715788745e-11, "loss": 0.9381, "step": 52894 }, { "epoch": 1.0, "learning_rate": 5.4441075394706666e-11, "loss": 0.9192, "step": 52895 }, { "epoch": 1.0, "learning_rate": 5.3437578351467345e-11, "loss": 0.9077, "step": 52896 }, { "epoch": 1.0, "learning_rate": 5.2443416032055274e-11, "loss": 0.9379, "step": 52897 }, { "epoch": 1.0, "learning_rate": 5.1458588440356225e-11, "loss": 0.7521, "step": 52898 }, { "epoch": 1.0, "learning_rate": 5.048309557970088e-11, "loss": 0.932, "step": 52899 }, { "epoch": 1.0, "learning_rate": 4.951693745397501e-11, "loss": 0.8759, "step": 52900 }, { "epoch": 1.0, "learning_rate": 4.8560114066786846e-11, "loss": 0.939, "step": 52901 }, { "epoch": 1.0, "learning_rate": 4.761262542146705e-11, "loss": 0.9764, "step": 52902 }, { "epoch": 1.0, "learning_rate": 4.6674471521623857e-11, "loss": 0.6638, "step": 52903 }, { "epoch": 1.0, "learning_rate": 4.5745652371143037e-11, "loss": 0.7549, "step": 52904 }, { "epoch": 1.0, "learning_rate": 4.482616797307771e-11, "loss": 0.9449, "step": 52905 }, { "epoch": 1.0, "learning_rate": 4.391601833075854e-11, "loss": 1.1476, "step": 52906 }, { "epoch": 1.0, "learning_rate": 4.3015203448071305e-11, "loss": 0.8239, "step": 52907 }, { "epoch": 1.0, "learning_rate": 4.212372332806913e-11, "loss": 0.7284, "step": 52908 }, { "epoch": 1.0, "learning_rate": 4.124157797408268e-11, "loss": 0.7539, "step": 52909 }, { "epoch": 1.0, "learning_rate": 4.036876738944262e-11, "loss": 1.045, "step": 52910 }, { "epoch": 1.0, "learning_rate": 3.9505291577479624e-11, "loss": 0.7339, "step": 52911 }, { "epoch": 1.0, "learning_rate": 3.86511505412468e-11, "loss": 1.037, "step": 52912 }, { "epoch": 1.0, "learning_rate": 3.780634428407481e-11, "loss": 1.0627, "step": 52913 }, { "epoch": 1.0, "learning_rate": 3.6970872809294346e-11, "loss": 0.873, "step": 52914 }, { "epoch": 1.0, "learning_rate": 3.614473611968095e-11, "loss": 0.8915, "step": 52915 }, { "epoch": 1.0, "learning_rate": 3.532793421828773e-11, "loss": 0.821, "step": 52916 }, { "epoch": 1.0, "learning_rate": 3.452046710844537e-11, "loss": 0.7575, "step": 52917 }, { "epoch": 1.0, "learning_rate": 3.3722334792929413e-11, "loss": 0.8051, "step": 52918 }, { "epoch": 1.0, "learning_rate": 3.293353727507054e-11, "loss": 1.0942, "step": 52919 }, { "epoch": 1.0, "learning_rate": 3.215407455736674e-11, "loss": 0.8796, "step": 52920 }, { "epoch": 1.0, "learning_rate": 3.1383946643148697e-11, "loss": 0.9221, "step": 52921 }, { "epoch": 1.0, "learning_rate": 3.062315353491441e-11, "loss": 0.9155, "step": 52922 }, { "epoch": 1.0, "learning_rate": 2.987169523599454e-11, "loss": 0.8472, "step": 52923 }, { "epoch": 1.0, "learning_rate": 2.912957174860953e-11, "loss": 0.8979, "step": 52924 }, { "epoch": 1.0, "learning_rate": 2.8396783075812506e-11, "loss": 1.1523, "step": 52925 }, { "epoch": 1.0, "learning_rate": 2.767332922037902e-11, "loss": 0.8405, "step": 52926 }, { "epoch": 1.0, "learning_rate": 2.6959210185084628e-11, "loss": 0.727, "step": 52927 }, { "epoch": 1.0, "learning_rate": 2.6254425972149778e-11, "loss": 0.8159, "step": 52928 }, { "epoch": 1.0, "learning_rate": 2.5558976584905137e-11, "loss": 0.7596, "step": 52929 }, { "epoch": 1.0, "learning_rate": 2.4872862025293598e-11, "loss": 0.9252, "step": 52930 }, { "epoch": 1.0, "learning_rate": 2.419608229636827e-11, "loss": 1.1349, "step": 52931 }, { "epoch": 1.0, "learning_rate": 2.3528637400349607e-11, "loss": 0.9073, "step": 52932 }, { "epoch": 1.0, "learning_rate": 2.2870527339735603e-11, "loss": 0.9844, "step": 52933 }, { "epoch": 1.0, "learning_rate": 2.2221752117024264e-11, "loss": 0.9758, "step": 52934 }, { "epoch": 1.0, "learning_rate": 2.1582311734991147e-11, "loss": 0.9083, "step": 52935 }, { "epoch": 1.0, "learning_rate": 2.095220619557914e-11, "loss": 0.802, "step": 52936 }, { "epoch": 1.0, "learning_rate": 2.033143550100869e-11, "loss": 1.1331, "step": 52937 }, { "epoch": 1.0, "learning_rate": 1.971999965433291e-11, "loss": 0.9434, "step": 52938 }, { "epoch": 1.0, "learning_rate": 1.911789865693958e-11, "loss": 0.9313, "step": 52939 }, { "epoch": 1.0, "learning_rate": 1.8525132511881817e-11, "loss": 0.6974, "step": 52940 }, { "epoch": 1.0, "learning_rate": 1.794170122082495e-11, "loss": 0.774, "step": 52941 }, { "epoch": 1.0, "learning_rate": 1.7367604785989422e-11, "loss": 0.7238, "step": 52942 }, { "epoch": 1.0, "learning_rate": 1.6802843209873243e-11, "loss": 1.1539, "step": 52943 }, { "epoch": 1.0, "learning_rate": 1.6247416494141742e-11, "loss": 0.737, "step": 52944 }, { "epoch": 1.0, "learning_rate": 1.5701324641292924e-11, "loss": 1.007, "step": 52945 }, { "epoch": 1.0, "learning_rate": 1.5164567652992123e-11, "loss": 0.9922, "step": 52946 }, { "epoch": 1.0, "learning_rate": 1.463714553173734e-11, "loss": 0.8724, "step": 52947 }, { "epoch": 1.0, "learning_rate": 1.4119058278916353e-11, "loss": 0.8761, "step": 52948 }, { "epoch": 1.0, "learning_rate": 1.3610305896749609e-11, "loss": 0.8982, "step": 52949 }, { "epoch": 1.0, "learning_rate": 1.3110888387179999e-11, "loss": 1.1276, "step": 52950 }, { "epoch": 1.0, "learning_rate": 1.2620805751872855e-11, "loss": 0.9751, "step": 52951 }, { "epoch": 1.0, "learning_rate": 1.214005799277107e-11, "loss": 0.8741, "step": 52952 }, { "epoch": 1.0, "learning_rate": 1.1668645111817534e-11, "loss": 0.8193, "step": 52953 }, { "epoch": 1.0, "learning_rate": 1.120656711067758e-11, "loss": 0.7098, "step": 52954 }, { "epoch": 1.0, "learning_rate": 1.0753823991016543e-11, "loss": 0.826, "step": 52955 }, { "epoch": 1.0, "learning_rate": 1.0310415754499758e-11, "loss": 1.0163, "step": 52956 }, { "epoch": 1.0, "learning_rate": 9.876342402792561e-12, "loss": 1.0002, "step": 52957 }, { "epoch": 1.0, "learning_rate": 9.451603937560283e-12, "loss": 0.8681, "step": 52958 }, { "epoch": 1.0, "learning_rate": 9.03620036046826e-12, "loss": 0.928, "step": 52959 }, { "epoch": 1.0, "learning_rate": 8.630131672904274e-12, "loss": 0.7274, "step": 52960 }, { "epoch": 1.0, "learning_rate": 8.233397876533655e-12, "loss": 1.043, "step": 52961 }, { "epoch": 1.0, "learning_rate": 7.845998972744184e-12, "loss": 1.1779, "step": 52962 }, { "epoch": 1.0, "learning_rate": 7.46793496292364e-12, "loss": 0.9633, "step": 52963 }, { "epoch": 1.0, "learning_rate": 7.099205848737356e-12, "loss": 0.9919, "step": 52964 }, { "epoch": 1.0, "learning_rate": 6.739811631295556e-12, "loss": 0.5312, "step": 52965 }, { "epoch": 1.0, "learning_rate": 6.389752311986019e-12, "loss": 0.6754, "step": 52966 }, { "epoch": 1.0, "learning_rate": 6.049027892196524e-12, "loss": 0.6197, "step": 52967 }, { "epoch": 1.0, "learning_rate": 5.717638373314849e-12, "loss": 0.9976, "step": 52968 }, { "epoch": 1.0, "learning_rate": 5.395583756173661e-12, "loss": 0.9355, "step": 52969 }, { "epoch": 1.0, "learning_rate": 5.082864042438296e-12, "loss": 0.7728, "step": 52970 }, { "epoch": 1.0, "learning_rate": 4.7794792329414195e-12, "loss": 0.7881, "step": 52971 }, { "epoch": 1.0, "learning_rate": 4.485429329070812e-12, "loss": 0.8463, "step": 52972 }, { "epoch": 1.0, "learning_rate": 4.2007143316591394e-12, "loss": 0.85, "step": 52973 }, { "epoch": 1.0, "learning_rate": 3.925334242094181e-12, "loss": 0.9897, "step": 52974 }, { "epoch": 1.0, "learning_rate": 3.659289060931048e-12, "loss": 1.0714, "step": 52975 }, { "epoch": 1.0, "learning_rate": 3.40257878955752e-12, "loss": 1.0577, "step": 52976 }, { "epoch": 1.0, "learning_rate": 3.1552034290838194e-12, "loss": 0.8057, "step": 52977 }, { "epoch": 1.0, "learning_rate": 2.917162980065058e-12, "loss": 0.7873, "step": 52978 }, { "epoch": 1.0, "learning_rate": 2.6884574433339027e-12, "loss": 0.9515, "step": 52979 }, { "epoch": 1.0, "learning_rate": 2.469086820000577e-12, "loss": 0.8586, "step": 52980 }, { "epoch": 1.0, "learning_rate": 2.2590511108977475e-12, "loss": 1.1, "step": 52981 }, { "epoch": 1.0, "learning_rate": 2.058350316580526e-12, "loss": 0.8796, "step": 52982 }, { "epoch": 1.0, "learning_rate": 1.8669844378815806e-12, "loss": 0.8594, "step": 52983 }, { "epoch": 1.0, "learning_rate": 1.6849534756335773e-12, "loss": 0.8323, "step": 52984 }, { "epoch": 1.0, "learning_rate": 1.5122574303916282e-12, "loss": 0.6568, "step": 52985 }, { "epoch": 1.0, "learning_rate": 1.3488963029884005e-12, "loss": 0.8588, "step": 52986 }, { "epoch": 1.0, "learning_rate": 1.1948700937014502e-12, "loss": 0.9415, "step": 52987 }, { "epoch": 1.0, "learning_rate": 1.0501788033634442e-12, "loss": 1.0064, "step": 52988 }, { "epoch": 1.0, "learning_rate": 9.14822432529494e-13, "loss": 0.9668, "step": 52989 }, { "epoch": 1.0, "learning_rate": 7.888009817547115e-13, "loss": 0.9681, "step": 52990 }, { "epoch": 1.0, "learning_rate": 6.721144510390965e-13, "loss": 0.8154, "step": 52991 }, { "epoch": 1.0, "learning_rate": 5.647628414928718e-13, "loss": 0.7144, "step": 52992 }, { "epoch": 1.0, "learning_rate": 4.667461531160377e-13, "loss": 1.0073, "step": 52993 }, { "epoch": 1.0, "learning_rate": 3.7806438618614993e-13, "loss": 0.9565, "step": 52994 }, { "epoch": 1.0, "learning_rate": 2.9871754125831986e-13, "loss": 0.9034, "step": 52995 }, { "epoch": 1.0, "learning_rate": 2.287056186101033e-13, "loss": 0.8512, "step": 52996 }, { "epoch": 1.0, "learning_rate": 1.6802861851905606e-13, "loss": 0.9341, "step": 52997 }, { "epoch": 1.0, "learning_rate": 1.1668654098517806e-13, "loss": 0.8668, "step": 52998 }, { "epoch": 1.0, "learning_rate": 7.467938656358087e-14, "loss": 0.9785, "step": 52999 }, { "epoch": 1.0, "learning_rate": 4.200715497670871e-14, "loss": 0.9182, "step": 53000 }, { "epoch": 1.0, "learning_rate": 1.8669846779673096e-14, "loss": 0.7025, "step": 53001 }, { "epoch": 1.0, "learning_rate": 4.667461694918274e-15, "loss": 0.8538, "step": 53002 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 0.967, "step": 53003 }, { "epoch": 1.0, "step": 53003, "total_flos": 1.0137691576928256e+16, "train_loss": 0.9420517254507281, "train_runtime": 127015.2279, "train_samples_per_second": 13.353, "train_steps_per_second": 0.417 } ], "max_steps": 53003, "num_train_epochs": 1, "total_flos": 1.0137691576928256e+16, "trial_name": null, "trial_params": null }